diff --git "a/wandb/run-20220505_173818-i9acyhfo/files/wandb-summary.json" "b/wandb/run-20220505_173818-i9acyhfo/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220505_173818-i9acyhfo/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 2.5511, "train/learning_rate": 0.0002958, "train/epoch": 0.31, "train/global_step": 500, "_runtime": 7041, "_timestamp": 1651779339, "_step": 500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 57.0, 831.0, 115.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.239689350128174, -6.919302940368652, -6.598917007446289, -6.278530597686768, -5.958144187927246, -5.637757778167725, -5.317371368408203, -4.99698543548584, -4.676599025726318, -4.356212615966797, -4.035826683044434, -3.715440273284912, -3.3950538635253906, -3.074667453765869, -2.7542812824249268, -2.4338951110839844, -2.113508701324463, -1.793122410774231, -1.472736120223999, -1.152349829673767, -0.8319635391235352, -0.5115772485733032, -0.1911909580230713, 0.1291952133178711, 0.4495816230773926, 0.7699679136276245, 1.0903542041778564, 1.4107404947280884, 1.7311267852783203, 2.051513195037842, 2.371899366378784, 2.6922855377197266, 3.0126724243164062, 3.3330588340759277, 3.65344500541687, 3.9738311767578125, 4.294217586517334, 4.6146039962768555, 4.934989929199219, 5.25537633895874, 5.575762748718262, 5.896149158477783, 6.216535568237305, 6.536921501159668, 6.8573079109191895, 7.177694320678711, 7.498080253601074, 7.818466663360596, 8.138853073120117, 8.45923900604248, 8.77962589263916, 9.100011825561523, 9.420398712158203, 9.740784645080566, 10.06117057800293, 10.38155746459961, 10.701943397521973, 11.022329330444336, 11.342716217041016, 11.663102149963379, 11.983488082885742, 12.303874969482422, 12.624260902404785, 12.944646835327148, 13.265033721923828]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 16.0, 24.0, 51.0, 80.0, 91.0, 110.0, 132.0, 131.0, 114.0, 89.0, 63.0, 46.0, 20.0, 16.0, 3.0, 5.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4819183349609375, -3.3273098468780518, -3.172701358795166, -3.018092632293701, -2.8634841442108154, -2.7088756561279297, -2.554267168045044, -2.399658679962158, -2.2450499534606934, -2.0904414653778076, -1.9358328580856323, -1.7812243700027466, -1.6266157627105713, -1.4720072746276855, -1.3173987865447998, -1.1627901792526245, -1.0081818103790283, -0.8535732626914978, -0.6989647150039673, -0.5443562269210815, -0.389747679233551, -0.2351391315460205, -0.08053064346313477, 0.07407796382904053, 0.22868645191192627, 0.3832949995994568, 0.5379035472869873, 0.692512035369873, 0.8471205830574036, 1.001729130744934, 1.1563376188278198, 1.3109462261199951, 1.4655547142028809, 1.6201632022857666, 1.774771809577942, 1.9293802976608276, 2.083988904953003, 2.2385973930358887, 2.3932058811187744, 2.54781436920166, 2.702423095703125, 2.8570315837860107, 3.0116400718688965, 3.1662487983703613, 3.320857286453247, 3.475465774536133, 3.6300742626190186, 3.7846827507019043, 3.93929123878479, 4.093899726867676, 4.248508453369141, 4.403116703033447, 4.557725429534912, 4.712333679199219, 4.866942405700684, 5.021551132202148, 5.176159381866455, 5.33076810836792, 5.485376358032227, 5.639985084533691, 5.794593334197998, 5.949202060699463, 6.1038103103637695, 6.258419036865234, 6.413027763366699]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 12.0, 15.0, 15.0, 30.0, 52.0, 370.0, 812.0, 1837.0, 4454.0, 22312.0, 1771122.0, 2365524.0, 24202.0, 2803.0, 317.0, 184.0, 81.0, 48.0, 33.0, 16.0, 14.0, 12.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1796875, -5.001220703125, -4.82275390625, -4.644287109375, -4.4658203125, -4.287353515625, -4.10888671875, -3.930419921875, -3.751953125, -3.573486328125, -3.39501953125, -3.216552734375, -3.0380859375, -2.859619140625, -2.68115234375, -2.502685546875, -2.32421875, -2.145751953125, -1.96728515625, -1.788818359375, -1.6103515625, -1.431884765625, -1.25341796875, -1.074951171875, -0.896484375, -0.718017578125, -0.53955078125, -0.361083984375, -0.1826171875, -0.004150390625, 0.17431640625, 0.352783203125, 0.53125, 0.709716796875, 0.88818359375, 1.066650390625, 1.2451171875, 1.423583984375, 1.60205078125, 1.780517578125, 1.958984375, 2.137451171875, 2.31591796875, 2.494384765625, 2.6728515625, 2.851318359375, 3.02978515625, 3.208251953125, 3.38671875, 3.565185546875, 3.74365234375, 3.922119140625, 4.1005859375, 4.279052734375, 4.45751953125, 4.635986328125, 4.814453125, 4.992919921875, 5.17138671875, 5.349853515625, 5.5283203125, 5.706787109375, 5.88525390625, 6.063720703125, 6.2421875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 7.0, 10.0, 22.0, 55.0, 64.0, 78.0, 102.0, 113.0, 141.0, 114.0, 93.0, 66.0, 47.0, 37.0, 25.0, 15.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53515625, -2.3968505859375, -2.258544921875, -2.1202392578125, -1.98193359375, -1.8436279296875, -1.705322265625, -1.5670166015625, -1.4287109375, -1.2904052734375, -1.152099609375, -1.0137939453125, -0.87548828125, -0.7371826171875, -0.598876953125, -0.4605712890625, -0.322265625, -0.1839599609375, -0.045654296875, 0.0926513671875, 0.23095703125, 0.3692626953125, 0.507568359375, 0.6458740234375, 0.7841796875, 0.9224853515625, 1.060791015625, 1.1990966796875, 1.33740234375, 1.4757080078125, 1.614013671875, 1.7523193359375, 1.890625, 2.0289306640625, 2.167236328125, 2.3055419921875, 2.44384765625, 2.5821533203125, 2.720458984375, 2.8587646484375, 2.9970703125, 3.1353759765625, 3.273681640625, 3.4119873046875, 3.55029296875, 3.6885986328125, 3.826904296875, 3.9652099609375, 4.103515625, 4.2418212890625, 4.380126953125, 4.5184326171875, 4.65673828125, 4.7950439453125, 4.933349609375, 5.0716552734375, 5.2099609375, 5.3482666015625, 5.486572265625, 5.6248779296875, 5.76318359375, 5.9014892578125, 6.039794921875, 6.1781005859375, 6.31640625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 12.0, 13.0, 36.0, 221.0, 4192900.0, 1003.0, 62.0, 18.0, 12.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.5625, -61.3916015625, -57.220703125, -53.0498046875, -48.87890625, -44.7080078125, -40.537109375, -36.3662109375, -32.1953125, -28.0244140625, -23.853515625, -19.6826171875, -15.51171875, -11.3408203125, -7.169921875, -2.9990234375, 1.171875, 5.3427734375, 9.513671875, 13.6845703125, 17.85546875, 22.0263671875, 26.197265625, 30.3681640625, 34.5390625, 38.7099609375, 42.880859375, 47.0517578125, 51.22265625, 55.3935546875, 59.564453125, 63.7353515625, 67.90625, 72.0771484375, 76.248046875, 80.4189453125, 84.58984375, 88.7607421875, 92.931640625, 97.1025390625, 101.2734375, 105.4443359375, 109.615234375, 113.7861328125, 117.95703125, 122.1279296875, 126.298828125, 130.4697265625, 134.640625, 138.8115234375, 142.982421875, 147.1533203125, 151.32421875, 155.4951171875, 159.666015625, 163.8369140625, 168.0078125, 172.1787109375, 176.349609375, 180.5205078125, 184.69140625, 188.8623046875, 193.033203125, 197.2041015625, 201.375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 9.0, 9.0, 17.0, 52.0, 786.0, 3030.0, 124.0, 24.0, 13.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5302734375, -1.4300689697265625, -1.329864501953125, -1.2296600341796875, -1.12945556640625, -1.0292510986328125, -0.929046630859375, -0.8288421630859375, -0.7286376953125, -0.6284332275390625, -0.528228759765625, -0.4280242919921875, -0.32781982421875, -0.2276153564453125, -0.127410888671875, -0.0272064208984375, 0.072998046875, 0.1732025146484375, 0.273406982421875, 0.3736114501953125, 0.47381591796875, 0.5740203857421875, 0.674224853515625, 0.7744293212890625, 0.8746337890625, 0.9748382568359375, 1.075042724609375, 1.1752471923828125, 1.27545166015625, 1.3756561279296875, 1.475860595703125, 1.5760650634765625, 1.67626953125, 1.7764739990234375, 1.876678466796875, 1.9768829345703125, 2.07708740234375, 2.1772918701171875, 2.277496337890625, 2.3777008056640625, 2.4779052734375, 2.5781097412109375, 2.678314208984375, 2.7785186767578125, 2.87872314453125, 2.9789276123046875, 3.079132080078125, 3.1793365478515625, 3.279541015625, 3.3797454833984375, 3.479949951171875, 3.5801544189453125, 3.68035888671875, 3.7805633544921875, 3.880767822265625, 3.9809722900390625, 4.0811767578125, 4.1813812255859375, 4.281585693359375, 4.3817901611328125, 4.48199462890625, 4.5821990966796875, 4.682403564453125, 4.7826080322265625, 4.8828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 11.0, 10.0, 21.0, 21.0, 36.0, 63.0, 99.0, 145.0, 176.0, 137.0, 94.0, 61.0, 45.0, 21.0, 17.0, 16.0, 14.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.282334089279175, -3.166180372238159, -3.0500266551971436, -2.933872938156128, -2.8177194595336914, -2.701565742492676, -2.58541202545166, -2.4692583084106445, -2.353104591369629, -2.2369508743286133, -2.1207971572875977, -2.004643440246582, -1.888489842414856, -1.7723361253738403, -1.6561825275421143, -1.5400288105010986, -1.423875093460083, -1.3077213764190674, -1.1915676593780518, -1.0754140615463257, -0.9592603445053101, -0.8431066274642944, -0.7269529700279236, -0.6107993125915527, -0.4946455955505371, -0.37849190831184387, -0.26233822107315063, -0.1461845338344574, -0.03003084659576416, 0.08612287044525146, 0.20227652788162231, 0.31843018531799316, 0.4345836639404297, 0.5507373809814453, 0.6668910384178162, 0.783044695854187, 0.8991984128952026, 1.0153521299362183, 1.1315057277679443, 1.24765944480896, 1.3638131618499756, 1.4799668788909912, 1.5961205959320068, 1.712274193763733, 1.8284279108047485, 1.9445816278457642, 2.0607352256774902, 2.176888942718506, 2.2930426597595215, 2.409196376800537, 2.5253500938415527, 2.6415038108825684, 2.757657527923584, 2.8738112449645996, 2.989964723587036, 3.1061184406280518, 3.2222721576690674, 3.338425874710083, 3.4545795917510986, 3.5707333087921143, 3.686886787414551, 3.8030405044555664, 3.919194221496582, 4.035347938537598, 4.151501655578613]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 8.0, 2.0, 16.0, 8.0, 21.0, 33.0, 39.0, 50.0, 58.0, 55.0, 68.0, 64.0, 87.0, 97.0, 62.0, 59.0, 61.0, 45.0, 48.0, 33.0, 34.0, 20.0, 16.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3885703086853027, -3.258063554763794, -3.1275570392608643, -2.9970502853393555, -2.866543769836426, -2.736037015914917, -2.605530261993408, -2.4750237464904785, -2.3445169925689697, -2.214010238647461, -2.0835037231445312, -1.9529969692230225, -1.8224903345108032, -1.691983699798584, -1.5614769458770752, -1.430970311164856, -1.3004636764526367, -1.1699570417404175, -1.0394504070281982, -0.9089436531066895, -0.7784370183944702, -0.647930383682251, -0.517423689365387, -0.38691699504852295, -0.2564103603363037, -0.12590369582176208, 0.004602968692779541, 0.13510963320732117, 0.2656162977218628, 0.39612293243408203, 0.526629626750946, 0.6571363210678101, 0.7876429557800293, 0.9181495904922485, 1.0486562252044678, 1.1791629791259766, 1.3096696138381958, 1.440176248550415, 1.5706830024719238, 1.701189637184143, 1.8316962718963623, 1.9622029066085815, 2.092709541320801, 2.2232162952423096, 2.3537230491638184, 2.484229564666748, 2.614736318588257, 2.7452430725097656, 2.8757495880126953, 3.006256341934204, 3.136762857437134, 3.2672696113586426, 3.3977761268615723, 3.528282880783081, 3.65878963470459, 3.7892961502075195, 3.9198029041290283, 4.050309658050537, 4.180816173553467, 4.3113226890563965, 4.441829681396484, 4.572336196899414, 4.702842712402344, 4.833349704742432, 4.963856220245361]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 7.0, 11.0, 11.0, 17.0, 26.0, 34.0, 73.0, 121.0, 191.0, 313.0, 681.0, 1411.0, 3544.0, 10715.0, 40437.0, 209426.0, 616211.0, 124660.0, 27649.0, 7891.0, 2756.0, 1142.0, 492.0, 282.0, 173.0, 83.0, 62.0, 37.0, 27.0, 20.0, 8.0, 15.0, 6.0, 7.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2451171875, -1.207794189453125, -1.17047119140625, -1.133148193359375, -1.0958251953125, -1.058502197265625, -1.02117919921875, -0.983856201171875, -0.946533203125, -0.909210205078125, -0.87188720703125, -0.834564208984375, -0.7972412109375, -0.759918212890625, -0.72259521484375, -0.685272216796875, -0.64794921875, -0.610626220703125, -0.57330322265625, -0.535980224609375, -0.4986572265625, -0.461334228515625, -0.42401123046875, -0.386688232421875, -0.349365234375, -0.312042236328125, -0.27471923828125, -0.237396240234375, -0.2000732421875, -0.162750244140625, -0.12542724609375, -0.088104248046875, -0.05078125, -0.013458251953125, 0.02386474609375, 0.061187744140625, 0.0985107421875, 0.135833740234375, 0.17315673828125, 0.210479736328125, 0.247802734375, 0.285125732421875, 0.32244873046875, 0.359771728515625, 0.3970947265625, 0.434417724609375, 0.47174072265625, 0.509063720703125, 0.54638671875, 0.583709716796875, 0.62103271484375, 0.658355712890625, 0.6956787109375, 0.733001708984375, 0.77032470703125, 0.807647705078125, 0.844970703125, 0.882293701171875, 0.91961669921875, 0.956939697265625, 0.9942626953125, 1.031585693359375, 1.06890869140625, 1.106231689453125, 1.1435546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 12.0, 15.0, 24.0, 27.0, 56.0, 76.0, 73.0, 97.0, 101.0, 114.0, 86.0, 83.0, 63.0, 41.0, 46.0, 35.0, 19.0, 15.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.9296875, -3.80322265625, -3.6767578125, -3.55029296875, -3.423828125, -3.29736328125, -3.1708984375, -3.04443359375, -2.91796875, -2.79150390625, -2.6650390625, -2.53857421875, -2.412109375, -2.28564453125, -2.1591796875, -2.03271484375, -1.90625, -1.77978515625, -1.6533203125, -1.52685546875, -1.400390625, -1.27392578125, -1.1474609375, -1.02099609375, -0.89453125, -0.76806640625, -0.6416015625, -0.51513671875, -0.388671875, -0.26220703125, -0.1357421875, -0.00927734375, 0.1171875, 0.24365234375, 0.3701171875, 0.49658203125, 0.623046875, 0.74951171875, 0.8759765625, 1.00244140625, 1.12890625, 1.25537109375, 1.3818359375, 1.50830078125, 1.634765625, 1.76123046875, 1.8876953125, 2.01416015625, 2.140625, 2.26708984375, 2.3935546875, 2.52001953125, 2.646484375, 2.77294921875, 2.8994140625, 3.02587890625, 3.15234375, 3.27880859375, 3.4052734375, 3.53173828125, 3.658203125, 3.78466796875, 3.9111328125, 4.03759765625, 4.1640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 11.0, 18.0, 23.0, 26.0, 31.0, 44.0, 83.0, 129.0, 198.0, 318.0, 448.0, 762.0, 1322.0, 2158.0, 3756.0, 6808.0, 13471.0, 28139.0, 63203.0, 151133.0, 301534.0, 260625.0, 118102.0, 49394.0, 22447.0, 10909.0, 5516.0, 3226.0, 1816.0, 1064.0, 711.0, 389.0, 256.0, 147.0, 105.0, 66.0, 43.0, 35.0, 37.0, 14.0, 10.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2216796875, -0.21399688720703125, -0.2063140869140625, -0.19863128662109375, -0.190948486328125, -0.18326568603515625, -0.1755828857421875, -0.16790008544921875, -0.16021728515625, -0.15253448486328125, -0.1448516845703125, -0.13716888427734375, -0.129486083984375, -0.12180328369140625, -0.1141204833984375, -0.10643768310546875, -0.0987548828125, -0.09107208251953125, -0.0833892822265625, -0.07570648193359375, -0.068023681640625, -0.06034088134765625, -0.0526580810546875, -0.04497528076171875, -0.03729248046875, -0.02960968017578125, -0.0219268798828125, -0.01424407958984375, -0.006561279296875, 0.00112152099609375, 0.0088043212890625, 0.01648712158203125, 0.024169921875, 0.03185272216796875, 0.0395355224609375, 0.04721832275390625, 0.054901123046875, 0.06258392333984375, 0.0702667236328125, 0.07794952392578125, 0.08563232421875, 0.09331512451171875, 0.1009979248046875, 0.10868072509765625, 0.116363525390625, 0.12404632568359375, 0.1317291259765625, 0.13941192626953125, 0.1470947265625, 0.15477752685546875, 0.1624603271484375, 0.17014312744140625, 0.177825927734375, 0.18550872802734375, 0.1931915283203125, 0.20087432861328125, 0.20855712890625, 0.21623992919921875, 0.2239227294921875, 0.23160552978515625, 0.239288330078125, 0.24697113037109375, 0.2546539306640625, 0.26233673095703125, 0.27001953125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 7.0, 7.0, 10.0, 13.0, 19.0, 15.0, 21.0, 21.0, 23.0, 29.0, 30.0, 45.0, 42.0, 42.0, 42.0, 45.0, 47.0, 37.0, 51.0, 57.0, 59.0, 47.0, 39.0, 34.0, 35.0, 36.0, 22.0, 26.0, 22.0, 11.0, 14.0, 13.0, 7.0, 7.0, 8.0, 3.0, 5.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.6328125, -2.547454833984375, -2.46209716796875, -2.376739501953125, -2.2913818359375, -2.206024169921875, -2.12066650390625, -2.035308837890625, -1.949951171875, -1.864593505859375, -1.77923583984375, -1.693878173828125, -1.6085205078125, -1.523162841796875, -1.43780517578125, -1.352447509765625, -1.26708984375, -1.181732177734375, -1.09637451171875, -1.011016845703125, -0.9256591796875, -0.840301513671875, -0.75494384765625, -0.669586181640625, -0.584228515625, -0.498870849609375, -0.41351318359375, -0.328155517578125, -0.2427978515625, -0.157440185546875, -0.07208251953125, 0.013275146484375, 0.0986328125, 0.183990478515625, 0.26934814453125, 0.354705810546875, 0.4400634765625, 0.525421142578125, 0.61077880859375, 0.696136474609375, 0.781494140625, 0.866851806640625, 0.95220947265625, 1.037567138671875, 1.1229248046875, 1.208282470703125, 1.29364013671875, 1.378997802734375, 1.46435546875, 1.549713134765625, 1.63507080078125, 1.720428466796875, 1.8057861328125, 1.891143798828125, 1.97650146484375, 2.061859130859375, 2.147216796875, 2.232574462890625, 2.31793212890625, 2.403289794921875, 2.4886474609375, 2.574005126953125, 2.65936279296875, 2.744720458984375, 2.830078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 5.0, 10.0, 11.0, 10.0, 10.0, 14.0, 18.0, 23.0, 39.0, 55.0, 74.0, 124.0, 147.0, 221.0, 341.0, 525.0, 825.0, 1182.0, 1832.0, 3067.0, 5114.0, 9881.0, 22551.0, 69126.0, 348322.0, 446072.0, 86847.0, 26436.0, 11023.0, 5622.0, 3247.0, 1964.0, 1233.0, 862.0, 547.0, 370.0, 237.0, 168.0, 113.0, 73.0, 53.0, 38.0, 30.0, 14.0, 19.0, 9.0, 8.0, 12.0, 9.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0], "bins": [-0.032928466796875, -0.03196239471435547, -0.030996322631835938, -0.030030250549316406, -0.029064178466796875, -0.028098106384277344, -0.027132034301757812, -0.02616596221923828, -0.02519989013671875, -0.02423381805419922, -0.023267745971679688, -0.022301673889160156, -0.021335601806640625, -0.020369529724121094, -0.019403457641601562, -0.01843738555908203, -0.0174713134765625, -0.01650524139404297, -0.015539169311523438, -0.014573097229003906, -0.013607025146484375, -0.012640953063964844, -0.011674880981445312, -0.010708808898925781, -0.00974273681640625, -0.008776664733886719, -0.0078105926513671875, -0.006844520568847656, -0.005878448486328125, -0.004912376403808594, -0.0039463043212890625, -0.0029802322387695312, -0.00201416015625, -0.0010480880737304688, -8.20159912109375e-05, 0.0008840560913085938, 0.001850128173828125, 0.0028162002563476562, 0.0037822723388671875, 0.004748344421386719, 0.00571441650390625, 0.006680488586425781, 0.0076465606689453125, 0.008612632751464844, 0.009578704833984375, 0.010544776916503906, 0.011510848999023438, 0.012476921081542969, 0.0134429931640625, 0.014409065246582031, 0.015375137329101562, 0.016341209411621094, 0.017307281494140625, 0.018273353576660156, 0.019239425659179688, 0.02020549774169922, 0.02117156982421875, 0.02213764190673828, 0.023103713989257812, 0.024069786071777344, 0.025035858154296875, 0.026001930236816406, 0.026968002319335938, 0.02793407440185547, 0.028900146484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 7.0, 9.0, 20.0, 20.0, 47.0, 69.0, 95.0, 150.0, 178.0, 132.0, 98.0, 71.0, 37.0, 17.0, 15.0, 13.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.80685043334961e-05, -6.595812737941742e-05, -6.384775042533875e-05, -6.173737347126007e-05, -5.9626996517181396e-05, -5.751661956310272e-05, -5.540624260902405e-05, -5.3295865654945374e-05, -5.11854887008667e-05, -4.9075111746788025e-05, -4.696473479270935e-05, -4.4854357838630676e-05, -4.2743980884552e-05, -4.063360393047333e-05, -3.852322697639465e-05, -3.641285002231598e-05, -3.4302473068237305e-05, -3.219209611415863e-05, -3.0081719160079956e-05, -2.7971342206001282e-05, -2.5860965251922607e-05, -2.3750588297843933e-05, -2.164021134376526e-05, -1.9529834389686584e-05, -1.741945743560791e-05, -1.5309080481529236e-05, -1.3198703527450562e-05, -1.1088326573371887e-05, -8.977949619293213e-06, -6.8675726652145386e-06, -4.757195711135864e-06, -2.64681875705719e-06, -5.364418029785156e-07, 1.5739351511001587e-06, 3.684312105178833e-06, 5.794689059257507e-06, 7.905066013336182e-06, 1.0015442967414856e-05, 1.212581992149353e-05, 1.4236196875572205e-05, 1.634657382965088e-05, 1.8456950783729553e-05, 2.0567327737808228e-05, 2.2677704691886902e-05, 2.4788081645965576e-05, 2.689845860004425e-05, 2.9008835554122925e-05, 3.11192125082016e-05, 3.3229589462280273e-05, 3.533996641635895e-05, 3.745034337043762e-05, 3.9560720324516296e-05, 4.167109727859497e-05, 4.3781474232673645e-05, 4.589185118675232e-05, 4.8002228140830994e-05, 5.011260509490967e-05, 5.222298204898834e-05, 5.4333359003067017e-05, 5.644373595714569e-05, 5.8554112911224365e-05, 6.066448986530304e-05, 6.277486681938171e-05, 6.488524377346039e-05, 6.699562072753906e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 10.0, 16.0, 11.0, 27.0, 32.0, 44.0, 75.0, 147.0, 606.0, 19831.0, 1023483.0, 3647.0, 287.0, 92.0, 59.0, 56.0, 23.0, 22.0, 13.0, 9.0, 13.0, 11.0, 5.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3662109375, -0.3552207946777344, -0.34423065185546875, -0.3332405090332031, -0.3222503662109375, -0.3112602233886719, -0.30027008056640625, -0.2892799377441406, -0.278289794921875, -0.2672996520996094, -0.25630950927734375, -0.24531936645507812, -0.2343292236328125, -0.22333908081054688, -0.21234893798828125, -0.20135879516601562, -0.19036865234375, -0.17937850952148438, -0.16838836669921875, -0.15739822387695312, -0.1464080810546875, -0.13541793823242188, -0.12442779541015625, -0.11343765258789062, -0.102447509765625, -0.09145736694335938, -0.08046722412109375, -0.06947708129882812, -0.0584869384765625, -0.047496795654296875, -0.03650665283203125, -0.025516510009765625, -0.0145263671875, -0.003536224365234375, 0.00745391845703125, 0.018444061279296875, 0.0294342041015625, 0.040424346923828125, 0.05141448974609375, 0.062404632568359375, 0.073394775390625, 0.08438491821289062, 0.09537506103515625, 0.10636520385742188, 0.1173553466796875, 0.12834548950195312, 0.13933563232421875, 0.15032577514648438, 0.16131591796875, 0.17230606079101562, 0.18329620361328125, 0.19428634643554688, 0.2052764892578125, 0.21626663208007812, 0.22725677490234375, 0.23824691772460938, 0.249237060546875, 0.2602272033691406, 0.27121734619140625, 0.2822074890136719, 0.2931976318359375, 0.3041877746582031, 0.31517791748046875, 0.3261680603027344, 0.337158203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 8.0, 6.0, 8.0, 11.0, 20.0, 26.0, 25.0, 44.0, 51.0, 109.0, 130.0, 151.0, 118.0, 75.0, 59.0, 35.0, 36.0, 9.0, 16.0, 9.0, 7.0, 12.0, 11.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0295257568359375, -0.028641700744628906, -0.027757644653320312, -0.02687358856201172, -0.025989532470703125, -0.02510547637939453, -0.024221420288085938, -0.023337364196777344, -0.02245330810546875, -0.021569252014160156, -0.020685195922851562, -0.01980113983154297, -0.018917083740234375, -0.01803302764892578, -0.017148971557617188, -0.016264915466308594, -0.015380859375, -0.014496803283691406, -0.013612747192382812, -0.012728691101074219, -0.011844635009765625, -0.010960578918457031, -0.010076522827148438, -0.009192466735839844, -0.00830841064453125, -0.007424354553222656, -0.0065402984619140625, -0.005656242370605469, -0.004772186279296875, -0.0038881301879882812, -0.0030040740966796875, -0.0021200180053710938, -0.0012359619140625, -0.00035190582275390625, 0.0005321502685546875, 0.0014162063598632812, 0.002300262451171875, 0.0031843185424804688, 0.0040683746337890625, 0.004952430725097656, 0.00583648681640625, 0.006720542907714844, 0.0076045989990234375, 0.008488655090332031, 0.009372711181640625, 0.010256767272949219, 0.011140823364257812, 0.012024879455566406, 0.012908935546875, 0.013792991638183594, 0.014677047729492188, 0.015561103820800781, 0.016445159912109375, 0.01732921600341797, 0.018213272094726562, 0.019097328186035156, 0.01998138427734375, 0.020865440368652344, 0.021749496459960938, 0.02263355255126953, 0.023517608642578125, 0.02440166473388672, 0.025285720825195312, 0.026169776916503906, 0.0270538330078125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 10.0, 39.0, 218.0, 564.0, 146.0, 23.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.993537902832031, -8.652512550354004, -8.31148624420166, -7.970460414886475, -7.629434585571289, -7.2884087562561035, -6.947382926940918, -6.606357574462891, -6.265331268310547, -5.924305438995361, -5.583279609680176, -5.24225378036499, -4.901227951049805, -4.560202121734619, -4.219176292419434, -3.878150701522827, -3.5371251106262207, -3.196099281311035, -2.8550734519958496, -2.514047622680664, -2.1730217933654785, -1.8319960832595825, -1.4909703731536865, -1.149944543838501, -0.8089187145233154, -0.46789291501045227, -0.1268671154975891, 0.21415865421295166, 0.5551844835281372, 0.8962103128433228, 1.2372360229492188, 1.5782618522644043, 1.9192876815795898, 2.2603135108947754, 2.601339340209961, 2.9423651695251465, 3.283390998840332, 3.6244168281555176, 3.965442419052124, 4.3064680099487305, 4.647494316101074, 4.98852014541626, 5.329545974731445, 5.670571804046631, 6.011597633361816, 6.352623462677002, 6.6936492919921875, 7.034674644470215, 7.3757004737854, 7.716726303100586, 8.057751655578613, 8.398777961730957, 8.739803314208984, 9.080829620361328, 9.421854972839355, 9.7628812789917, 10.103906631469727, 10.444931983947754, 10.785958290100098, 11.126983642578125, 11.468009948730469, 11.809035301208496, 12.15006160736084, 12.491086959838867, 12.832113265991211]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 7.0, 11.0, 12.0, 27.0, 23.0, 60.0, 76.0, 65.0, 85.0, 95.0, 127.0, 77.0, 92.0, 64.0, 55.0, 47.0, 35.0, 19.0, 17.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6336677074432373, -3.5092740058898926, -3.3848800659179688, -3.260486364364624, -3.1360926628112793, -3.0116989612579346, -2.88730525970459, -2.762911319732666, -2.6385176181793213, -2.5141239166259766, -2.3897299766540527, -2.265336275100708, -2.1409425735473633, -2.0165488719940186, -1.8921550512313843, -1.76776123046875, -1.6433675289154053, -1.5189738273620605, -1.3945800065994263, -1.270186185836792, -1.1457924842834473, -1.0213987827301025, -0.8970049619674683, -0.7726112008094788, -0.6482174396514893, -0.5238236784934998, -0.39942991733551025, -0.27503615617752075, -0.15064239501953125, -0.026248633861541748, 0.09814512729644775, 0.22253888845443726, 0.34693288803100586, 0.47132664918899536, 0.5957204103469849, 0.7201141715049744, 0.8445079326629639, 0.9689016938209534, 1.0932954549789429, 1.2176892757415771, 1.3420829772949219, 1.4664766788482666, 1.5908704996109009, 1.7152643203735352, 1.8396580219268799, 1.9640517234802246, 2.0884456634521484, 2.212839365005493, 2.337233066558838, 2.4616267681121826, 2.5860204696655273, 2.710414409637451, 2.834808111190796, 2.9592018127441406, 3.0835957527160645, 3.207989454269409, 3.332383155822754, 3.4567768573760986, 3.5811705589294434, 3.705564498901367, 3.829958200454712, 3.9543519020080566, 4.0787458419799805, 4.203139305114746, 4.32753324508667]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 11.0, 16.0, 16.0, 26.0, 34.0, 45.0, 75.0, 125.0, 179.0, 288.0, 438.0, 781.0, 1368.0, 2427.0, 4996.0, 10768.0, 25281.0, 64836.0, 224125.0, 494328.0, 136815.0, 45098.0, 18892.0, 8461.0, 3999.0, 2089.0, 1243.0, 685.0, 390.0, 247.0, 163.0, 95.0, 76.0, 37.0, 23.0, 19.0, 17.0, 13.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.40234375, -2.33026123046875, -2.2581787109375, -2.18609619140625, -2.114013671875, -2.04193115234375, -1.9698486328125, -1.89776611328125, -1.82568359375, -1.75360107421875, -1.6815185546875, -1.60943603515625, -1.537353515625, -1.46527099609375, -1.3931884765625, -1.32110595703125, -1.2490234375, -1.17694091796875, -1.1048583984375, -1.03277587890625, -0.960693359375, -0.88861083984375, -0.8165283203125, -0.74444580078125, -0.67236328125, -0.60028076171875, -0.5281982421875, -0.45611572265625, -0.384033203125, -0.31195068359375, -0.2398681640625, -0.16778564453125, -0.095703125, -0.02362060546875, 0.0484619140625, 0.12054443359375, 0.192626953125, 0.26470947265625, 0.3367919921875, 0.40887451171875, 0.48095703125, 0.55303955078125, 0.6251220703125, 0.69720458984375, 0.769287109375, 0.84136962890625, 0.9134521484375, 0.98553466796875, 1.0576171875, 1.12969970703125, 1.2017822265625, 1.27386474609375, 1.345947265625, 1.41802978515625, 1.4901123046875, 1.56219482421875, 1.63427734375, 1.70635986328125, 1.7784423828125, 1.85052490234375, 1.922607421875, 1.99468994140625, 2.0667724609375, 2.13885498046875, 2.2109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 8.0, 7.0, 9.0, 17.0, 19.0, 27.0, 27.0, 35.0, 31.0, 45.0, 55.0, 48.0, 68.0, 69.0, 73.0, 69.0, 66.0, 53.0, 49.0, 42.0, 45.0, 36.0, 23.0, 22.0, 17.0, 10.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.53125, -17.852294921875, -17.17333984375, -16.494384765625, -15.8154296875, -15.136474609375, -14.45751953125, -13.778564453125, -13.099609375, -12.420654296875, -11.74169921875, -11.062744140625, -10.3837890625, -9.704833984375, -9.02587890625, -8.346923828125, -7.66796875, -6.989013671875, -6.31005859375, -5.631103515625, -4.9521484375, -4.273193359375, -3.59423828125, -2.915283203125, -2.236328125, -1.557373046875, -0.87841796875, -0.199462890625, 0.4794921875, 1.158447265625, 1.83740234375, 2.516357421875, 3.1953125, 3.874267578125, 4.55322265625, 5.232177734375, 5.9111328125, 6.590087890625, 7.26904296875, 7.947998046875, 8.626953125, 9.305908203125, 9.98486328125, 10.663818359375, 11.3427734375, 12.021728515625, 12.70068359375, 13.379638671875, 14.05859375, 14.737548828125, 15.41650390625, 16.095458984375, 16.7744140625, 17.453369140625, 18.13232421875, 18.811279296875, 19.490234375, 20.169189453125, 20.84814453125, 21.527099609375, 22.2060546875, 22.885009765625, 23.56396484375, 24.242919921875, 24.921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 9.0, 10.0, 9.0, 12.0, 17.0, 42.0, 49.0, 67.0, 124.0, 186.0, 301.0, 675.0, 7599.0, 1026583.0, 11375.0, 672.0, 302.0, 158.0, 117.0, 70.0, 47.0, 35.0, 28.0, 18.0, 13.0, 11.0, 5.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.81689453125, -19.2431640625, -18.66943359375, -18.095703125, -17.52197265625, -16.9482421875, -16.37451171875, -15.80078125, -15.22705078125, -14.6533203125, -14.07958984375, -13.505859375, -12.93212890625, -12.3583984375, -11.78466796875, -11.2109375, -10.63720703125, -10.0634765625, -9.48974609375, -8.916015625, -8.34228515625, -7.7685546875, -7.19482421875, -6.62109375, -6.04736328125, -5.4736328125, -4.89990234375, -4.326171875, -3.75244140625, -3.1787109375, -2.60498046875, -2.03125, -1.45751953125, -0.8837890625, -0.31005859375, 0.263671875, 0.83740234375, 1.4111328125, 1.98486328125, 2.55859375, 3.13232421875, 3.7060546875, 4.27978515625, 4.853515625, 5.42724609375, 6.0009765625, 6.57470703125, 7.1484375, 7.72216796875, 8.2958984375, 8.86962890625, 9.443359375, 10.01708984375, 10.5908203125, 11.16455078125, 11.73828125, 12.31201171875, 12.8857421875, 13.45947265625, 14.033203125, 14.60693359375, 15.1806640625, 15.75439453125, 16.328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 6.0, 8.0, 18.0, 19.0, 24.0, 33.0, 53.0, 71.0, 64.0, 68.0, 87.0, 91.0, 96.0, 77.0, 63.0, 56.0, 44.0, 26.0, 24.0, 18.0, 15.0, 11.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.0625, -31.158935546875, -30.25537109375, -29.351806640625, -28.4482421875, -27.544677734375, -26.64111328125, -25.737548828125, -24.833984375, -23.930419921875, -23.02685546875, -22.123291015625, -21.2197265625, -20.316162109375, -19.41259765625, -18.509033203125, -17.60546875, -16.701904296875, -15.79833984375, -14.894775390625, -13.9912109375, -13.087646484375, -12.18408203125, -11.280517578125, -10.376953125, -9.473388671875, -8.56982421875, -7.666259765625, -6.7626953125, -5.859130859375, -4.95556640625, -4.052001953125, -3.1484375, -2.244873046875, -1.34130859375, -0.437744140625, 0.4658203125, 1.369384765625, 2.27294921875, 3.176513671875, 4.080078125, 4.983642578125, 5.88720703125, 6.790771484375, 7.6943359375, 8.597900390625, 9.50146484375, 10.405029296875, 11.30859375, 12.212158203125, 13.11572265625, 14.019287109375, 14.9228515625, 15.826416015625, 16.72998046875, 17.633544921875, 18.537109375, 19.440673828125, 20.34423828125, 21.247802734375, 22.1513671875, 23.054931640625, 23.95849609375, 24.862060546875, 25.765625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 7.0, 10.0, 10.0, 23.0, 42.0, 104.0, 300.0, 1990.0, 86272.0, 954662.0, 4329.0, 556.0, 125.0, 53.0, 28.0, 18.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.381103515625, -0.3621864318847656, -0.34326934814453125, -0.3243522644042969, -0.3054351806640625, -0.2865180969238281, -0.26760101318359375, -0.24868392944335938, -0.229766845703125, -0.21084976196289062, -0.19193267822265625, -0.17301559448242188, -0.1540985107421875, -0.13518142700195312, -0.11626434326171875, -0.09734725952148438, -0.07843017578125, -0.059513092041015625, -0.04059600830078125, -0.021678924560546875, -0.0027618408203125, 0.016155242919921875, 0.03507232666015625, 0.053989410400390625, 0.072906494140625, 0.09182357788085938, 0.11074066162109375, 0.12965774536132812, 0.1485748291015625, 0.16749191284179688, 0.18640899658203125, 0.20532608032226562, 0.2242431640625, 0.24316024780273438, 0.26207733154296875, 0.2809944152832031, 0.2999114990234375, 0.3188285827636719, 0.33774566650390625, 0.3566627502441406, 0.375579833984375, 0.3944969177246094, 0.41341400146484375, 0.4323310852050781, 0.4512481689453125, 0.4701652526855469, 0.48908233642578125, 0.5079994201660156, 0.52691650390625, 0.5458335876464844, 0.5647506713867188, 0.5836677551269531, 0.6025848388671875, 0.6215019226074219, 0.6404190063476562, 0.6593360900878906, 0.678253173828125, 0.6971702575683594, 0.7160873413085938, 0.7350044250488281, 0.7539215087890625, 0.7728385925292969, 0.7917556762695312, 0.8106727600097656, 0.82958984375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 3.0, 12.0, 17.0, 18.0, 22.0, 56.0, 107.0, 183.0, 246.0, 140.0, 68.0, 41.0, 27.0, 18.0, 10.0, 9.0, 11.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.913309097290039e-05, -1.8135644495487213e-05, -1.7138198018074036e-05, -1.6140751540660858e-05, -1.514330506324768e-05, -1.4145858585834503e-05, -1.3148412108421326e-05, -1.2150965631008148e-05, -1.115351915359497e-05, -1.0156072676181793e-05, -9.158626198768616e-06, -8.161179721355438e-06, -7.163733243942261e-06, -6.166286766529083e-06, -5.168840289115906e-06, -4.171393811702728e-06, -3.1739473342895508e-06, -2.1765008568763733e-06, -1.1790543794631958e-06, -1.816079020500183e-07, 8.158385753631592e-07, 1.8132850527763367e-06, 2.810731530189514e-06, 3.8081780076026917e-06, 4.805624485015869e-06, 5.803070962429047e-06, 6.800517439842224e-06, 7.797963917255402e-06, 8.795410394668579e-06, 9.792856872081757e-06, 1.0790303349494934e-05, 1.1787749826908112e-05, 1.2785196304321289e-05, 1.3782642781734467e-05, 1.4780089259147644e-05, 1.577753573656082e-05, 1.6774982213974e-05, 1.7772428691387177e-05, 1.8769875168800354e-05, 1.976732164621353e-05, 2.076476812362671e-05, 2.1762214601039886e-05, 2.2759661078453064e-05, 2.375710755586624e-05, 2.475455403327942e-05, 2.5752000510692596e-05, 2.6749446988105774e-05, 2.774689346551895e-05, 2.874433994293213e-05, 2.9741786420345306e-05, 3.0739232897758484e-05, 3.173667937517166e-05, 3.273412585258484e-05, 3.3731572329998016e-05, 3.4729018807411194e-05, 3.572646528482437e-05, 3.672391176223755e-05, 3.7721358239650726e-05, 3.8718804717063904e-05, 3.971625119447708e-05, 4.071369767189026e-05, 4.1711144149303436e-05, 4.2708590626716614e-05, 4.370603710412979e-05, 4.470348358154297e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 3.0, 3.0, 2.0, 11.0, 12.0, 16.0, 25.0, 42.0, 77.0, 254.0, 1061.0, 9725.0, 973855.0, 59963.0, 2740.0, 468.0, 153.0, 56.0, 19.0, 19.0, 20.0, 7.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.537109375, -0.5211944580078125, -0.505279541015625, -0.4893646240234375, -0.47344970703125, -0.4575347900390625, -0.441619873046875, -0.4257049560546875, -0.4097900390625, -0.3938751220703125, -0.377960205078125, -0.3620452880859375, -0.34613037109375, -0.3302154541015625, -0.314300537109375, -0.2983856201171875, -0.282470703125, -0.2665557861328125, -0.250640869140625, -0.2347259521484375, -0.21881103515625, -0.2028961181640625, -0.186981201171875, -0.1710662841796875, -0.1551513671875, -0.1392364501953125, -0.123321533203125, -0.1074066162109375, -0.09149169921875, -0.0755767822265625, -0.059661865234375, -0.0437469482421875, -0.02783203125, -0.0119171142578125, 0.003997802734375, 0.0199127197265625, 0.03582763671875, 0.0517425537109375, 0.067657470703125, 0.0835723876953125, 0.0994873046875, 0.1154022216796875, 0.131317138671875, 0.1472320556640625, 0.16314697265625, 0.1790618896484375, 0.194976806640625, 0.2108917236328125, 0.226806640625, 0.2427215576171875, 0.258636474609375, 0.2745513916015625, 0.29046630859375, 0.3063812255859375, 0.322296142578125, 0.3382110595703125, 0.3541259765625, 0.3700408935546875, 0.385955810546875, 0.4018707275390625, 0.41778564453125, 0.4337005615234375, 0.449615478515625, 0.4655303955078125, 0.4814453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 6.0, 10.0, 7.0, 17.0, 6.0, 20.0, 21.0, 54.0, 76.0, 155.0, 347.0, 109.0, 59.0, 31.0, 22.0, 10.0, 11.0, 8.0, 9.0, 7.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.089111328125, -0.08651351928710938, -0.08391571044921875, -0.08131790161132812, -0.0787200927734375, -0.07612228393554688, -0.07352447509765625, -0.07092666625976562, -0.068328857421875, -0.06573104858398438, -0.06313323974609375, -0.060535430908203125, -0.0579376220703125, -0.055339813232421875, -0.05274200439453125, -0.050144195556640625, -0.04754638671875, -0.044948577880859375, -0.04235076904296875, -0.039752960205078125, -0.0371551513671875, -0.034557342529296875, -0.03195953369140625, -0.029361724853515625, -0.026763916015625, -0.024166107177734375, -0.02156829833984375, -0.018970489501953125, -0.0163726806640625, -0.013774871826171875, -0.01117706298828125, -0.008579254150390625, -0.0059814453125, -0.003383636474609375, -0.00078582763671875, 0.001811981201171875, 0.0044097900390625, 0.007007598876953125, 0.00960540771484375, 0.012203216552734375, 0.014801025390625, 0.017398834228515625, 0.01999664306640625, 0.022594451904296875, 0.0251922607421875, 0.027790069580078125, 0.03038787841796875, 0.032985687255859375, 0.03558349609375, 0.038181304931640625, 0.04077911376953125, 0.043376922607421875, 0.0459747314453125, 0.048572540283203125, 0.05117034912109375, 0.053768157958984375, 0.056365966796875, 0.058963775634765625, 0.06156158447265625, 0.06415939331054688, 0.0667572021484375, 0.06935501098632812, 0.07195281982421875, 0.07455062866210938, 0.0771484375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 426.0, 578.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.75569152832031, -61.655418395996094, -60.555145263671875, -59.454872131347656, -58.35459899902344, -57.25432586669922, -56.154052734375, -55.05377960205078, -53.95350646972656, -52.853233337402344, -51.752960205078125, -50.652687072753906, -49.55241394042969, -48.45214080810547, -47.35186767578125, -46.25159454345703, -45.15131759643555, -44.05104446411133, -42.95077133178711, -41.85049819946289, -40.75022506713867, -39.64995193481445, -38.549678802490234, -37.44940185546875, -36.34912872314453, -35.24885559082031, -34.148582458496094, -33.048309326171875, -31.948036193847656, -30.847763061523438, -29.747488021850586, -28.647214889526367, -27.546945571899414, -26.446672439575195, -25.346399307250977, -24.246126174926758, -23.145851135253906, -22.045578002929688, -20.94530487060547, -19.84503173828125, -18.74475860595703, -17.644485473632812, -16.544212341308594, -15.443938255310059, -14.34366512298584, -13.243391990661621, -12.143117904663086, -11.042844772338867, -9.942571640014648, -8.84229850769043, -7.742024898529053, -6.641751289367676, -5.541478157043457, -4.441205024719238, -3.3409314155578613, -2.2406578063964844, -1.1403851509094238, -0.04011178016662598, 1.0601615905761719, 2.1604349613189697, 3.2607083320617676, 4.360981464385986, 5.461255073547363, 6.56152868270874, 7.661801815032959]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 4.0, 8.0, 6.0, 7.0, 11.0, 10.0, 13.0, 16.0, 22.0, 31.0, 23.0, 33.0, 28.0, 46.0, 39.0, 42.0, 41.0, 43.0, 44.0, 52.0, 61.0, 47.0, 42.0, 41.0, 52.0, 31.0, 38.0, 30.0, 23.0, 23.0, 15.0, 12.0, 17.0, 16.0, 6.0, 7.0, 2.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.28492259979248, -14.719724655151367, -14.154525756835938, -13.589326858520508, -13.024128913879395, -12.458930969238281, -11.893732070922852, -11.328533172607422, -10.763335227966309, -10.198137283325195, -9.632938385009766, -9.067739486694336, -8.502541542053223, -7.937343120574951, -7.37214469909668, -6.806946277618408, -6.241747856140137, -5.676549434661865, -5.111351013183594, -4.546152591705322, -3.980954170227051, -3.4157557487487793, -2.850557327270508, -2.2853589057922363, -1.7201604843139648, -1.1549620628356934, -0.5897636413574219, -0.02456521987915039, 0.5406332015991211, 1.1058316230773926, 1.671030044555664, 2.2362284660339355, 2.8014259338378906, 3.366624355316162, 3.9318227767944336, 4.497021198272705, 5.062219619750977, 5.627418041229248, 6.1926164627075195, 6.757814884185791, 7.3230133056640625, 7.888211727142334, 8.453410148620605, 9.018608093261719, 9.583806991577148, 10.149005889892578, 10.714203834533691, 11.279401779174805, 11.844600677490234, 12.409799575805664, 12.974997520446777, 13.54019546508789, 14.10539436340332, 14.67059326171875, 15.235791206359863, 15.800989151000977, 16.366188049316406, 16.931386947631836, 17.496585845947266, 18.061782836914062, 18.626981735229492, 19.192180633544922, 19.75737762451172, 20.32257652282715, 20.887775421142578]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 7.0, 8.0, 5.0, 13.0, 11.0, 10.0, 13.0, 24.0, 36.0, 33.0, 48.0, 52.0, 78.0, 127.0, 174.0, 301.0, 624.0, 2421.0, 14147.0, 1013910.0, 3126971.0, 31254.0, 2270.0, 708.0, 352.0, 206.0, 118.0, 74.0, 59.0, 49.0, 37.0, 18.0, 23.0, 13.0, 17.0, 19.0, 10.0, 12.0, 8.0, 5.0, 6.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.09375, -3.962158203125, -3.83056640625, -3.698974609375, -3.5673828125, -3.435791015625, -3.30419921875, -3.172607421875, -3.041015625, -2.909423828125, -2.77783203125, -2.646240234375, -2.5146484375, -2.383056640625, -2.25146484375, -2.119873046875, -1.98828125, -1.856689453125, -1.72509765625, -1.593505859375, -1.4619140625, -1.330322265625, -1.19873046875, -1.067138671875, -0.935546875, -0.803955078125, -0.67236328125, -0.540771484375, -0.4091796875, -0.277587890625, -0.14599609375, -0.014404296875, 0.1171875, 0.248779296875, 0.38037109375, 0.511962890625, 0.6435546875, 0.775146484375, 0.90673828125, 1.038330078125, 1.169921875, 1.301513671875, 1.43310546875, 1.564697265625, 1.6962890625, 1.827880859375, 1.95947265625, 2.091064453125, 2.22265625, 2.354248046875, 2.48583984375, 2.617431640625, 2.7490234375, 2.880615234375, 3.01220703125, 3.143798828125, 3.275390625, 3.406982421875, 3.53857421875, 3.670166015625, 3.8017578125, 3.933349609375, 4.06494140625, 4.196533203125, 4.328125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 9.0, 11.0, 17.0, 14.0, 18.0, 30.0, 34.0, 36.0, 57.0, 65.0, 56.0, 80.0, 82.0, 68.0, 81.0, 61.0, 60.0, 49.0, 36.0, 30.0, 38.0, 21.0, 13.0, 8.0, 9.0, 4.0, 0.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.78125, -1.712066650390625, -1.64288330078125, -1.573699951171875, -1.5045166015625, -1.435333251953125, -1.36614990234375, -1.296966552734375, -1.227783203125, -1.158599853515625, -1.08941650390625, -1.020233154296875, -0.9510498046875, -0.881866455078125, -0.81268310546875, -0.743499755859375, -0.67431640625, -0.605133056640625, -0.53594970703125, -0.466766357421875, -0.3975830078125, -0.328399658203125, -0.25921630859375, -0.190032958984375, -0.120849609375, -0.051666259765625, 0.01751708984375, 0.086700439453125, 0.1558837890625, 0.225067138671875, 0.29425048828125, 0.363433837890625, 0.4326171875, 0.501800537109375, 0.57098388671875, 0.640167236328125, 0.7093505859375, 0.778533935546875, 0.84771728515625, 0.916900634765625, 0.986083984375, 1.055267333984375, 1.12445068359375, 1.193634033203125, 1.2628173828125, 1.332000732421875, 1.40118408203125, 1.470367431640625, 1.53955078125, 1.608734130859375, 1.67791748046875, 1.747100830078125, 1.8162841796875, 1.885467529296875, 1.95465087890625, 2.023834228515625, 2.093017578125, 2.162200927734375, 2.23138427734375, 2.300567626953125, 2.3697509765625, 2.438934326171875, 2.50811767578125, 2.577301025390625, 2.646484375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 12.0, 26.0, 4194047.0, 180.0, 21.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-310.25, -296.65234375, -283.0546875, -269.45703125, -255.859375, -242.26171875, -228.6640625, -215.06640625, -201.46875, -187.87109375, -174.2734375, -160.67578125, -147.078125, -133.48046875, -119.8828125, -106.28515625, -92.6875, -79.08984375, -65.4921875, -51.89453125, -38.296875, -24.69921875, -11.1015625, 2.49609375, 16.09375, 29.69140625, 43.2890625, 56.88671875, 70.484375, 84.08203125, 97.6796875, 111.27734375, 124.875, 138.47265625, 152.0703125, 165.66796875, 179.265625, 192.86328125, 206.4609375, 220.05859375, 233.65625, 247.25390625, 260.8515625, 274.44921875, 288.046875, 301.64453125, 315.2421875, 328.83984375, 342.4375, 356.03515625, 369.6328125, 383.23046875, 396.828125, 410.42578125, 424.0234375, 437.62109375, 451.21875, 464.81640625, 478.4140625, 492.01171875, 505.609375, 519.20703125, 532.8046875, 546.40234375, 560.0]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 28.0, 131.0, 2512.0, 1286.0, 87.0, 19.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.849609375, -1.768829345703125, -1.68804931640625, -1.607269287109375, -1.5264892578125, -1.445709228515625, -1.36492919921875, -1.284149169921875, -1.203369140625, -1.122589111328125, -1.04180908203125, -0.961029052734375, -0.8802490234375, -0.799468994140625, -0.71868896484375, -0.637908935546875, -0.55712890625, -0.476348876953125, -0.39556884765625, -0.314788818359375, -0.2340087890625, -0.153228759765625, -0.07244873046875, 0.008331298828125, 0.089111328125, 0.169891357421875, 0.25067138671875, 0.331451416015625, 0.4122314453125, 0.493011474609375, 0.57379150390625, 0.654571533203125, 0.7353515625, 0.816131591796875, 0.89691162109375, 0.977691650390625, 1.0584716796875, 1.139251708984375, 1.22003173828125, 1.300811767578125, 1.381591796875, 1.462371826171875, 1.54315185546875, 1.623931884765625, 1.7047119140625, 1.785491943359375, 1.86627197265625, 1.947052001953125, 2.02783203125, 2.108612060546875, 2.18939208984375, 2.270172119140625, 2.3509521484375, 2.431732177734375, 2.51251220703125, 2.593292236328125, 2.674072265625, 2.754852294921875, 2.83563232421875, 2.916412353515625, 2.9971923828125, 3.077972412109375, 3.15875244140625, 3.239532470703125, 3.3203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 13.0, 64.0, 378.0, 444.0, 89.0, 16.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.55516242980957, -16.230932235717773, -15.906702995300293, -15.582472801208496, -15.258243560791016, -14.934013366699219, -14.609783172607422, -14.285553932189941, -13.961323738098145, -13.637093544006348, -13.312864303588867, -12.98863410949707, -12.66440486907959, -12.340174674987793, -12.015945434570312, -11.691715240478516, -11.367485046386719, -11.043254852294922, -10.719025611877441, -10.394795417785645, -10.070566177368164, -9.746335983276367, -9.42210578918457, -9.09787654876709, -8.77364730834961, -8.449417114257812, -8.125187873840332, -7.800957679748535, -7.4767279624938965, -7.152498245239258, -6.828268527984619, -6.5040388107299805, -6.179808616638184, -5.855578899383545, -5.531349182128906, -5.207118988037109, -4.882889270782471, -4.558659553527832, -4.234429836273193, -3.9101998805999756, -3.585970163345337, -3.2617404460906982, -2.9375104904174805, -2.613280773162842, -2.289051055908203, -1.9648211002349854, -1.6405913829803467, -1.316361427307129, -0.9921317100524902, -0.667901873588562, -0.34367209672927856, -0.019442319869995117, 0.3047875165939331, 0.6290173530578613, 0.9532470703125, 1.2774770259857178, 1.6017067432403564, 1.9259365797042847, 2.250166416168213, 2.5743961334228516, 2.8986258506774902, 3.222855806350708, 3.5470855236053467, 3.8713154792785645, 4.195545196533203]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 12.0, 22.0, 20.0, 29.0, 40.0, 35.0, 49.0, 57.0, 60.0, 69.0, 86.0, 78.0, 82.0, 56.0, 70.0, 60.0, 35.0, 35.0, 24.0, 24.0, 21.0, 10.0, 10.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.708440065383911, -3.605536460876465, -3.5026328563690186, -3.3997292518615723, -3.296825408935547, -3.1939220428466797, -3.0910181999206543, -2.988114595413208, -2.8852109909057617, -2.7823073863983154, -2.679403781890869, -2.576500177383423, -2.4735965728759766, -2.370692729949951, -2.267789125442505, -2.1648855209350586, -2.0619819164276123, -1.959078311920166, -1.8561747074127197, -1.7532709836959839, -1.6503673791885376, -1.5474637746810913, -1.4445600509643555, -1.3416564464569092, -1.238752841949463, -1.1358492374420166, -1.0329456329345703, -0.9300419092178345, -0.8271383047103882, -0.7242347002029419, -0.6213310360908508, -0.5184273719787598, -0.4155240058898926, -0.3126203715801239, -0.20971673727035522, -0.10681310296058655, -0.003909468650817871, 0.09899413585662842, 0.20189779996871948, 0.30480146408081055, 0.40770506858825684, 0.5106086730957031, 0.6135123372077942, 0.7164160013198853, 0.8193196058273315, 0.9222232103347778, 1.0251269340515137, 1.12803053855896, 1.2309341430664062, 1.3338377475738525, 1.4367413520812988, 1.5396450757980347, 1.642548680305481, 1.7454522848129272, 1.848356008529663, 1.9512596130371094, 2.0541632175445557, 2.157066822052002, 2.2599704265594482, 2.3628740310668945, 2.46577787399292, 2.568681240081787, 2.6715850830078125, 2.774488687515259, 2.877392292022705]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 13.0, 6.0, 14.0, 28.0, 44.0, 75.0, 129.0, 266.0, 468.0, 965.0, 1950.0, 4713.0, 16036.0, 98399.0, 756668.0, 139147.0, 19629.0, 5518.0, 2221.0, 1033.0, 574.0, 296.0, 140.0, 93.0, 44.0, 20.0, 18.0, 13.0, 8.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79638671875, -0.7694549560546875, -0.742523193359375, -0.7155914306640625, -0.68865966796875, -0.6617279052734375, -0.634796142578125, -0.6078643798828125, -0.5809326171875, -0.5540008544921875, -0.527069091796875, -0.5001373291015625, -0.47320556640625, -0.4462738037109375, -0.419342041015625, -0.3924102783203125, -0.365478515625, -0.3385467529296875, -0.311614990234375, -0.2846832275390625, -0.25775146484375, -0.2308197021484375, -0.203887939453125, -0.1769561767578125, -0.1500244140625, -0.1230926513671875, -0.096160888671875, -0.0692291259765625, -0.04229736328125, -0.0153656005859375, 0.011566162109375, 0.0384979248046875, 0.0654296875, 0.0923614501953125, 0.119293212890625, 0.1462249755859375, 0.17315673828125, 0.2000885009765625, 0.227020263671875, 0.2539520263671875, 0.2808837890625, 0.3078155517578125, 0.334747314453125, 0.3616790771484375, 0.38861083984375, 0.4155426025390625, 0.442474365234375, 0.4694061279296875, 0.496337890625, 0.5232696533203125, 0.550201416015625, 0.5771331787109375, 0.60406494140625, 0.6309967041015625, 0.657928466796875, 0.6848602294921875, 0.7117919921875, 0.7387237548828125, 0.765655517578125, 0.7925872802734375, 0.81951904296875, 0.8464508056640625, 0.873382568359375, 0.9003143310546875, 0.92724609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 11.0, 16.0, 22.0, 26.0, 36.0, 31.0, 47.0, 49.0, 65.0, 69.0, 83.0, 85.0, 79.0, 70.0, 69.0, 52.0, 42.0, 36.0, 23.0, 29.0, 13.0, 14.0, 10.0, 4.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.484375, -2.425628662109375, -2.36688232421875, -2.308135986328125, -2.2493896484375, -2.190643310546875, -2.13189697265625, -2.073150634765625, -2.014404296875, -1.955657958984375, -1.89691162109375, -1.838165283203125, -1.7794189453125, -1.720672607421875, -1.66192626953125, -1.603179931640625, -1.54443359375, -1.485687255859375, -1.42694091796875, -1.368194580078125, -1.3094482421875, -1.250701904296875, -1.19195556640625, -1.133209228515625, -1.074462890625, -1.015716552734375, -0.95697021484375, -0.898223876953125, -0.8394775390625, -0.780731201171875, -0.72198486328125, -0.663238525390625, -0.6044921875, -0.545745849609375, -0.48699951171875, -0.428253173828125, -0.3695068359375, -0.310760498046875, -0.25201416015625, -0.193267822265625, -0.134521484375, -0.075775146484375, -0.01702880859375, 0.041717529296875, 0.1004638671875, 0.159210205078125, 0.21795654296875, 0.276702880859375, 0.33544921875, 0.394195556640625, 0.45294189453125, 0.511688232421875, 0.5704345703125, 0.629180908203125, 0.68792724609375, 0.746673583984375, 0.805419921875, 0.864166259765625, 0.92291259765625, 0.981658935546875, 1.0404052734375, 1.099151611328125, 1.15789794921875, 1.216644287109375, 1.275390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 7.0, 9.0, 10.0, 17.0, 21.0, 28.0, 42.0, 63.0, 98.0, 153.0, 251.0, 344.0, 547.0, 968.0, 1691.0, 2951.0, 5232.0, 10738.0, 24060.0, 59631.0, 166675.0, 365084.0, 253106.0, 91731.0, 34325.0, 14684.0, 7109.0, 3743.0, 2028.0, 1201.0, 699.0, 473.0, 305.0, 177.0, 123.0, 70.0, 47.0, 38.0, 18.0, 16.0, 13.0, 9.0, 7.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.196533203125, -0.19052505493164062, -0.18451690673828125, -0.17850875854492188, -0.1725006103515625, -0.16649246215820312, -0.16048431396484375, -0.15447616577148438, -0.148468017578125, -0.14245986938476562, -0.13645172119140625, -0.13044357299804688, -0.1244354248046875, -0.11842727661132812, -0.11241912841796875, -0.10641098022460938, -0.10040283203125, -0.09439468383789062, -0.08838653564453125, -0.08237838745117188, -0.0763702392578125, -0.07036209106445312, -0.06435394287109375, -0.058345794677734375, -0.052337646484375, -0.046329498291015625, -0.04032135009765625, -0.034313201904296875, -0.0283050537109375, -0.022296905517578125, -0.01628875732421875, -0.010280609130859375, -0.0042724609375, 0.001735687255859375, 0.00774383544921875, 0.013751983642578125, 0.0197601318359375, 0.025768280029296875, 0.03177642822265625, 0.037784576416015625, 0.043792724609375, 0.049800872802734375, 0.05580902099609375, 0.061817169189453125, 0.0678253173828125, 0.07383346557617188, 0.07984161376953125, 0.08584976196289062, 0.09185791015625, 0.09786605834960938, 0.10387420654296875, 0.10988235473632812, 0.1158905029296875, 0.12189865112304688, 0.12790679931640625, 0.13391494750976562, 0.139923095703125, 0.14593124389648438, 0.15193939208984375, 0.15794754028320312, 0.1639556884765625, 0.16996383666992188, 0.17597198486328125, 0.18198013305664062, 0.18798828125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 4.0, 6.0, 5.0, 9.0, 9.0, 8.0, 14.0, 13.0, 21.0, 15.0, 19.0, 19.0, 32.0, 43.0, 38.0, 32.0, 41.0, 39.0, 37.0, 36.0, 40.0, 47.0, 38.0, 50.0, 48.0, 41.0, 33.0, 39.0, 28.0, 26.0, 24.0, 27.0, 13.0, 16.0, 15.0, 12.0, 9.0, 17.0, 1.0, 3.0, 4.0, 6.0, 3.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.6494140625, -1.5981903076171875, -1.546966552734375, -1.4957427978515625, -1.44451904296875, -1.3932952880859375, -1.342071533203125, -1.2908477783203125, -1.2396240234375, -1.1884002685546875, -1.137176513671875, -1.0859527587890625, -1.03472900390625, -0.9835052490234375, -0.932281494140625, -0.8810577392578125, -0.829833984375, -0.7786102294921875, -0.727386474609375, -0.6761627197265625, -0.62493896484375, -0.5737152099609375, -0.522491455078125, -0.4712677001953125, -0.4200439453125, -0.3688201904296875, -0.317596435546875, -0.2663726806640625, -0.21514892578125, -0.1639251708984375, -0.112701416015625, -0.0614776611328125, -0.01025390625, 0.0409698486328125, 0.092193603515625, 0.1434173583984375, 0.19464111328125, 0.2458648681640625, 0.297088623046875, 0.3483123779296875, 0.3995361328125, 0.4507598876953125, 0.501983642578125, 0.5532073974609375, 0.60443115234375, 0.6556549072265625, 0.706878662109375, 0.7581024169921875, 0.809326171875, 0.8605499267578125, 0.911773681640625, 0.9629974365234375, 1.01422119140625, 1.0654449462890625, 1.116668701171875, 1.1678924560546875, 1.2191162109375, 1.2703399658203125, 1.321563720703125, 1.3727874755859375, 1.42401123046875, 1.4752349853515625, 1.526458740234375, 1.5776824951171875, 1.62890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 7.0, 9.0, 28.0, 22.0, 28.0, 71.0, 99.0, 147.0, 271.0, 461.0, 884.0, 1767.0, 3960.0, 9715.0, 30148.0, 149968.0, 708288.0, 103894.0, 23620.0, 8413.0, 3341.0, 1615.0, 737.0, 416.0, 233.0, 151.0, 78.0, 58.0, 36.0, 26.0, 13.0, 18.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.036376953125, -0.03521871566772461, -0.03406047821044922, -0.03290224075317383, -0.03174400329589844, -0.030585765838623047, -0.029427528381347656, -0.028269290924072266, -0.027111053466796875, -0.025952816009521484, -0.024794578552246094, -0.023636341094970703, -0.022478103637695312, -0.021319866180419922, -0.02016162872314453, -0.01900339126586914, -0.01784515380859375, -0.01668691635131836, -0.015528678894042969, -0.014370441436767578, -0.013212203979492188, -0.012053966522216797, -0.010895729064941406, -0.009737491607666016, -0.008579254150390625, -0.007421016693115234, -0.006262779235839844, -0.005104541778564453, -0.0039463043212890625, -0.002788066864013672, -0.0016298294067382812, -0.0004715919494628906, 0.0006866455078125, 0.0018448829650878906, 0.0030031204223632812, 0.004161357879638672, 0.0053195953369140625, 0.006477832794189453, 0.007636070251464844, 0.008794307708740234, 0.009952545166015625, 0.011110782623291016, 0.012269020080566406, 0.013427257537841797, 0.014585494995117188, 0.015743732452392578, 0.01690196990966797, 0.01806020736694336, 0.01921844482421875, 0.02037668228149414, 0.02153491973876953, 0.022693157196044922, 0.023851394653320312, 0.025009632110595703, 0.026167869567871094, 0.027326107025146484, 0.028484344482421875, 0.029642581939697266, 0.030800819396972656, 0.03195905685424805, 0.03311729431152344, 0.03427553176879883, 0.03543376922607422, 0.03659200668334961, 0.037750244140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 8.0, 15.0, 12.0, 35.0, 58.0, 99.0, 152.0, 194.0, 171.0, 89.0, 46.0, 26.0, 22.0, 17.0, 7.0, 12.0, 7.0, 3.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40614128112793e-05, -5.222950130701065e-05, -5.0397589802742004e-05, -4.856567829847336e-05, -4.673376679420471e-05, -4.4901855289936066e-05, -4.306994378566742e-05, -4.123803228139877e-05, -3.940612077713013e-05, -3.757420927286148e-05, -3.5742297768592834e-05, -3.391038626432419e-05, -3.207847476005554e-05, -3.0246563255786896e-05, -2.841465175151825e-05, -2.6582740247249603e-05, -2.4750828742980957e-05, -2.291891723871231e-05, -2.1087005734443665e-05, -1.925509423017502e-05, -1.7423182725906372e-05, -1.5591271221637726e-05, -1.375935971736908e-05, -1.1927448213100433e-05, -1.0095536708831787e-05, -8.263625204563141e-06, -6.431713700294495e-06, -4.599802196025848e-06, -2.767890691757202e-06, -9.359791874885559e-07, 8.959323167800903e-07, 2.7278438210487366e-06, 4.559755325317383e-06, 6.391666829586029e-06, 8.223578333854675e-06, 1.0055489838123322e-05, 1.1887401342391968e-05, 1.3719312846660614e-05, 1.555122435092926e-05, 1.7383135855197906e-05, 1.9215047359466553e-05, 2.10469588637352e-05, 2.2878870368003845e-05, 2.471078187227249e-05, 2.6542693376541138e-05, 2.8374604880809784e-05, 3.020651638507843e-05, 3.2038427889347076e-05, 3.387033939361572e-05, 3.570225089788437e-05, 3.7534162402153015e-05, 3.936607390642166e-05, 4.119798541069031e-05, 4.3029896914958954e-05, 4.48618084192276e-05, 4.6693719923496246e-05, 4.852563142776489e-05, 5.035754293203354e-05, 5.2189454436302185e-05, 5.402136594057083e-05, 5.585327744483948e-05, 5.7685188949108124e-05, 5.951710045337677e-05, 6.134901195764542e-05, 6.318092346191406e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 5.0, 5.0, 8.0, 7.0, 14.0, 11.0, 12.0, 18.0, 29.0, 37.0, 55.0, 94.0, 210.0, 5048.0, 1040207.0, 2297.0, 182.0, 79.0, 50.0, 29.0, 28.0, 23.0, 18.0, 11.0, 10.0, 9.0, 12.0, 6.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2900390625, -0.28050994873046875, -0.2709808349609375, -0.26145172119140625, -0.251922607421875, -0.24239349365234375, -0.2328643798828125, -0.22333526611328125, -0.21380615234375, -0.20427703857421875, -0.1947479248046875, -0.18521881103515625, -0.175689697265625, -0.16616058349609375, -0.1566314697265625, -0.14710235595703125, -0.1375732421875, -0.12804412841796875, -0.1185150146484375, -0.10898590087890625, -0.099456787109375, -0.08992767333984375, -0.0803985595703125, -0.07086944580078125, -0.06134033203125, -0.05181121826171875, -0.0422821044921875, -0.03275299072265625, -0.023223876953125, -0.01369476318359375, -0.0041656494140625, 0.00536346435546875, 0.014892578125, 0.02442169189453125, 0.0339508056640625, 0.04347991943359375, 0.053009033203125, 0.06253814697265625, 0.0720672607421875, 0.08159637451171875, 0.09112548828125, 0.10065460205078125, 0.1101837158203125, 0.11971282958984375, 0.129241943359375, 0.13877105712890625, 0.1483001708984375, 0.15782928466796875, 0.1673583984375, 0.17688751220703125, 0.1864166259765625, 0.19594573974609375, 0.205474853515625, 0.21500396728515625, 0.2245330810546875, 0.23406219482421875, 0.24359130859375, 0.25312042236328125, 0.2626495361328125, 0.27217864990234375, 0.281707763671875, 0.29123687744140625, 0.3007659912109375, 0.31029510498046875, 0.31982421875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 3.0, 8.0, 3.0, 5.0, 11.0, 9.0, 12.0, 13.0, 12.0, 11.0, 26.0, 39.0, 48.0, 54.0, 74.0, 148.0, 164.0, 90.0, 62.0, 36.0, 40.0, 30.0, 18.0, 13.0, 11.0, 10.0, 15.0, 9.0, 8.0, 4.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0157623291015625, -0.015272021293640137, -0.014781713485717773, -0.01429140567779541, -0.013801097869873047, -0.013310790061950684, -0.01282048225402832, -0.012330174446105957, -0.011839866638183594, -0.01134955883026123, -0.010859251022338867, -0.010368943214416504, -0.00987863540649414, -0.009388327598571777, -0.008898019790649414, -0.00840771198272705, -0.007917404174804688, -0.007427096366882324, -0.006936788558959961, -0.006446480751037598, -0.005956172943115234, -0.005465865135192871, -0.004975557327270508, -0.0044852495193481445, -0.003994941711425781, -0.003504633903503418, -0.0030143260955810547, -0.0025240182876586914, -0.002033710479736328, -0.0015434026718139648, -0.0010530948638916016, -0.0005627870559692383, -7.2479248046875e-05, 0.0004178285598754883, 0.0009081363677978516, 0.0013984441757202148, 0.0018887519836425781, 0.0023790597915649414, 0.0028693675994873047, 0.003359675407409668, 0.0038499832153320312, 0.0043402910232543945, 0.004830598831176758, 0.005320906639099121, 0.005811214447021484, 0.006301522254943848, 0.006791830062866211, 0.007282137870788574, 0.0077724456787109375, 0.0082627534866333, 0.008753061294555664, 0.009243369102478027, 0.00973367691040039, 0.010223984718322754, 0.010714292526245117, 0.01120460033416748, 0.011694908142089844, 0.012185215950012207, 0.01267552375793457, 0.013165831565856934, 0.013656139373779297, 0.01414644718170166, 0.014636754989624023, 0.015127062797546387, 0.01561737060546875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 22.0, 301.0, 608.0, 71.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.055634498596191, -11.782862663269043, -11.510089874267578, -11.23731803894043, -10.964546203613281, -10.691773414611816, -10.419001579284668, -10.146228790283203, -9.873456954956055, -9.600685119628906, -9.327912330627441, -9.055140495300293, -8.782367706298828, -8.50959587097168, -8.236824035644531, -7.964051723480225, -7.691279411315918, -7.418507099151611, -7.145734786987305, -6.872962951660156, -6.60019063949585, -6.327418327331543, -6.0546464920043945, -5.781874179840088, -5.509101867675781, -5.236329555511475, -4.963557243347168, -4.6907854080200195, -4.418013095855713, -4.145240783691406, -3.8724687099456787, -3.599696636199951, -3.3269248008728027, -3.054152488708496, -2.7813804149627686, -2.508608341217041, -2.2358360290527344, -1.9630638360977173, -1.6902916431427002, -1.417519450187683, -1.144747257232666, -0.8719750642776489, -0.5992028713226318, -0.32643067836761475, -0.053658485412597656, 0.21911370754241943, 0.4918859004974365, 0.7646580934524536, 1.0374302864074707, 1.3102024793624878, 1.5829746723175049, 1.855746865272522, 2.128519058227539, 2.4012913703918457, 2.6740634441375732, 2.946835517883301, 3.2196078300476074, 3.492380142211914, 3.7651522159576416, 4.037924289703369, 4.310696601867676, 4.583468914031982, 4.856241226196289, 5.1290130615234375, 5.401785373687744]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 16.0, 31.0, 40.0, 55.0, 64.0, 99.0, 95.0, 132.0, 112.0, 99.0, 74.0, 60.0, 48.0, 28.0, 19.0, 11.0, 9.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462564468383789, -2.3763587474823, -2.2901527881622314, -2.203947067260742, -2.117741107940674, -2.0315353870391846, -1.9453295469284058, -1.859123706817627, -1.7729178667068481, -1.6867120265960693, -1.6005061864852905, -1.5143003463745117, -1.4280946254730225, -1.341888666152954, -1.2556829452514648, -1.169477105140686, -1.0832712650299072, -0.9970654249191284, -0.9108595848083496, -0.8246538043022156, -0.7384479641914368, -0.652242124080658, -0.5660363435745239, -0.4798305034637451, -0.3936246633529663, -0.3074188232421875, -0.22121301293373108, -0.13500720262527466, -0.04880136251449585, 0.03740447759628296, 0.12361025810241699, 0.2098160982131958, 0.2960221767425537, 0.3822280168533325, 0.46843382716178894, 0.5546396374702454, 0.6408454775810242, 0.727051317691803, 0.813257098197937, 0.8994629383087158, 0.9856687784194946, 1.0718746185302734, 1.1580804586410522, 1.244286298751831, 1.3304920196533203, 1.4166979789733887, 1.502903699874878, 1.5891095399856567, 1.6753153800964355, 1.7615212202072144, 1.8477270603179932, 1.9339327812194824, 2.020138740539551, 2.10634446144104, 2.1925501823425293, 2.2787561416625977, 2.364962100982666, 2.4511678218841553, 2.5373737812042236, 2.623579502105713, 2.7097854614257812, 2.7959911823272705, 2.8821969032287598, 2.968402862548828, 3.0546085834503174]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 4.0, 12.0, 18.0, 21.0, 27.0, 26.0, 49.0, 100.0, 218.0, 579.0, 1645.0, 5606.0, 27263.0, 302020.0, 657174.0, 42431.0, 7932.0, 2102.0, 728.0, 280.0, 128.0, 49.0, 32.0, 25.0, 17.0, 9.0, 11.0, 11.0, 5.0, 2.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.93359375, -2.842254638671875, -2.75091552734375, -2.659576416015625, -2.5682373046875, -2.476898193359375, -2.38555908203125, -2.294219970703125, -2.202880859375, -2.111541748046875, -2.02020263671875, -1.928863525390625, -1.8375244140625, -1.746185302734375, -1.65484619140625, -1.563507080078125, -1.47216796875, -1.380828857421875, -1.28948974609375, -1.198150634765625, -1.1068115234375, -1.015472412109375, -0.92413330078125, -0.832794189453125, -0.741455078125, -0.650115966796875, -0.55877685546875, -0.467437744140625, -0.3760986328125, -0.284759521484375, -0.19342041015625, -0.102081298828125, -0.0107421875, 0.080596923828125, 0.17193603515625, 0.263275146484375, 0.3546142578125, 0.445953369140625, 0.53729248046875, 0.628631591796875, 0.719970703125, 0.811309814453125, 0.90264892578125, 0.993988037109375, 1.0853271484375, 1.176666259765625, 1.26800537109375, 1.359344482421875, 1.45068359375, 1.542022705078125, 1.63336181640625, 1.724700927734375, 1.8160400390625, 1.907379150390625, 1.99871826171875, 2.090057373046875, 2.181396484375, 2.272735595703125, 2.36407470703125, 2.455413818359375, 2.5467529296875, 2.638092041015625, 2.72943115234375, 2.820770263671875, 2.912109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 17.0, 23.0, 36.0, 37.0, 66.0, 77.0, 109.0, 114.0, 134.0, 109.0, 88.0, 76.0, 34.0, 28.0, 23.0, 15.0, 12.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.15625, -9.650146484375, -9.14404296875, -8.637939453125, -8.1318359375, -7.625732421875, -7.11962890625, -6.613525390625, -6.107421875, -5.601318359375, -5.09521484375, -4.589111328125, -4.0830078125, -3.576904296875, -3.07080078125, -2.564697265625, -2.05859375, -1.552490234375, -1.04638671875, -0.540283203125, -0.0341796875, 0.471923828125, 0.97802734375, 1.484130859375, 1.990234375, 2.496337890625, 3.00244140625, 3.508544921875, 4.0146484375, 4.520751953125, 5.02685546875, 5.532958984375, 6.0390625, 6.545166015625, 7.05126953125, 7.557373046875, 8.0634765625, 8.569580078125, 9.07568359375, 9.581787109375, 10.087890625, 10.593994140625, 11.10009765625, 11.606201171875, 12.1123046875, 12.618408203125, 13.12451171875, 13.630615234375, 14.13671875, 14.642822265625, 15.14892578125, 15.655029296875, 16.1611328125, 16.667236328125, 17.17333984375, 17.679443359375, 18.185546875, 18.691650390625, 19.19775390625, 19.703857421875, 20.2099609375, 20.716064453125, 21.22216796875, 21.728271484375, 22.234375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 9.0, 7.0, 9.0, 14.0, 17.0, 18.0, 30.0, 30.0, 47.0, 55.0, 103.0, 297.0, 1043611.0, 3845.0, 162.0, 75.0, 50.0, 34.0, 39.0, 18.0, 21.0, 14.0, 13.0, 7.0, 7.0, 5.0, 2.0, 0.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.84375, -39.47509765625, -38.1064453125, -36.73779296875, -35.369140625, -34.00048828125, -32.6318359375, -31.26318359375, -29.89453125, -28.52587890625, -27.1572265625, -25.78857421875, -24.419921875, -23.05126953125, -21.6826171875, -20.31396484375, -18.9453125, -17.57666015625, -16.2080078125, -14.83935546875, -13.470703125, -12.10205078125, -10.7333984375, -9.36474609375, -7.99609375, -6.62744140625, -5.2587890625, -3.89013671875, -2.521484375, -1.15283203125, 0.2158203125, 1.58447265625, 2.953125, 4.32177734375, 5.6904296875, 7.05908203125, 8.427734375, 9.79638671875, 11.1650390625, 12.53369140625, 13.90234375, 15.27099609375, 16.6396484375, 18.00830078125, 19.376953125, 20.74560546875, 22.1142578125, 23.48291015625, 24.8515625, 26.22021484375, 27.5888671875, 28.95751953125, 30.326171875, 31.69482421875, 33.0634765625, 34.43212890625, 35.80078125, 37.16943359375, 38.5380859375, 39.90673828125, 41.275390625, 42.64404296875, 44.0126953125, 45.38134765625, 46.75]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 9.0, 6.0, 10.0, 14.0, 17.0, 19.0, 29.0, 30.0, 46.0, 50.0, 78.0, 97.0, 116.0, 101.0, 91.0, 65.0, 51.0, 33.0, 36.0, 19.0, 22.0, 13.0, 14.0, 7.0, 7.0, 5.0, 1.0, 1.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.2421875, -13.7652587890625, -13.288330078125, -12.8114013671875, -12.33447265625, -11.8575439453125, -11.380615234375, -10.9036865234375, -10.4267578125, -9.9498291015625, -9.472900390625, -8.9959716796875, -8.51904296875, -8.0421142578125, -7.565185546875, -7.0882568359375, -6.611328125, -6.1343994140625, -5.657470703125, -5.1805419921875, -4.70361328125, -4.2266845703125, -3.749755859375, -3.2728271484375, -2.7958984375, -2.3189697265625, -1.842041015625, -1.3651123046875, -0.88818359375, -0.4112548828125, 0.065673828125, 0.5426025390625, 1.01953125, 1.4964599609375, 1.973388671875, 2.4503173828125, 2.92724609375, 3.4041748046875, 3.881103515625, 4.3580322265625, 4.8349609375, 5.3118896484375, 5.788818359375, 6.2657470703125, 6.74267578125, 7.2196044921875, 7.696533203125, 8.1734619140625, 8.650390625, 9.1273193359375, 9.604248046875, 10.0811767578125, 10.55810546875, 11.0350341796875, 11.511962890625, 11.9888916015625, 12.4658203125, 12.9427490234375, 13.419677734375, 13.8966064453125, 14.37353515625, 14.8504638671875, 15.327392578125, 15.8043212890625, 16.28125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 6.0, 6.0, 13.0, 15.0, 26.0, 37.0, 58.0, 122.0, 368.0, 1343.0, 7755.0, 680066.0, 349804.0, 6948.0, 1280.0, 350.0, 155.0, 67.0, 36.0, 19.0, 19.0, 17.0, 4.0, 5.0, 7.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55517578125, -0.5397453308105469, -0.5243148803710938, -0.5088844299316406, -0.4934539794921875, -0.4780235290527344, -0.46259307861328125, -0.4471626281738281, -0.431732177734375, -0.4163017272949219, -0.40087127685546875, -0.3854408264160156, -0.3700103759765625, -0.3545799255371094, -0.33914947509765625, -0.3237190246582031, -0.30828857421875, -0.2928581237792969, -0.27742767333984375, -0.2619972229003906, -0.2465667724609375, -0.23113632202148438, -0.21570587158203125, -0.20027542114257812, -0.184844970703125, -0.16941452026367188, -0.15398406982421875, -0.13855361938476562, -0.1231231689453125, -0.10769271850585938, -0.09226226806640625, -0.07683181762695312, -0.0614013671875, -0.045970916748046875, -0.03054046630859375, -0.015110015869140625, 0.0003204345703125, 0.015750885009765625, 0.03118133544921875, 0.046611785888671875, 0.062042236328125, 0.07747268676757812, 0.09290313720703125, 0.10833358764648438, 0.1237640380859375, 0.13919448852539062, 0.15462493896484375, 0.17005538940429688, 0.18548583984375, 0.20091629028320312, 0.21634674072265625, 0.23177719116210938, 0.2472076416015625, 0.2626380920410156, 0.27806854248046875, 0.2934989929199219, 0.308929443359375, 0.3243598937988281, 0.33979034423828125, 0.3552207946777344, 0.3706512451171875, 0.3860816955566406, 0.40151214599609375, 0.4169425964355469, 0.432373046875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 5.0, 6.0, 5.0, 17.0, 19.0, 24.0, 26.0, 61.0, 103.0, 180.0, 220.0, 135.0, 54.0, 36.0, 22.0, 14.0, 11.0, 17.0, 8.0, 4.0, 6.0, 2.0, 5.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.378225326538086e-05, -2.27978453040123e-05, -2.1813437342643738e-05, -2.0829029381275177e-05, -1.9844621419906616e-05, -1.8860213458538055e-05, -1.7875805497169495e-05, -1.6891397535800934e-05, -1.5906989574432373e-05, -1.4922581613063812e-05, -1.3938173651695251e-05, -1.295376569032669e-05, -1.196935772895813e-05, -1.0984949767589569e-05, -1.0000541806221008e-05, -9.016133844852448e-06, -8.031725883483887e-06, -7.047317922115326e-06, -6.062909960746765e-06, -5.078501999378204e-06, -4.0940940380096436e-06, -3.1096860766410828e-06, -2.125278115272522e-06, -1.1408701539039612e-06, -1.564621925354004e-07, 8.279457688331604e-07, 1.8123537302017212e-06, 2.796761691570282e-06, 3.7811696529388428e-06, 4.7655776143074036e-06, 5.749985575675964e-06, 6.734393537044525e-06, 7.718801498413086e-06, 8.703209459781647e-06, 9.687617421150208e-06, 1.0672025382518768e-05, 1.1656433343887329e-05, 1.264084130525589e-05, 1.362524926662445e-05, 1.4609657227993011e-05, 1.5594065189361572e-05, 1.6578473150730133e-05, 1.7562881112098694e-05, 1.8547289073467255e-05, 1.9531697034835815e-05, 2.0516104996204376e-05, 2.1500512957572937e-05, 2.2484920918941498e-05, 2.346932888031006e-05, 2.445373684167862e-05, 2.543814480304718e-05, 2.642255276441574e-05, 2.7406960725784302e-05, 2.8391368687152863e-05, 2.9375776648521423e-05, 3.0360184609889984e-05, 3.1344592571258545e-05, 3.2329000532627106e-05, 3.3313408493995667e-05, 3.429781645536423e-05, 3.528222441673279e-05, 3.626663237810135e-05, 3.725104033946991e-05, 3.823544830083847e-05, 3.921985626220703e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 3.0, 8.0, 10.0, 23.0, 20.0, 41.0, 76.0, 215.0, 591.0, 1998.0, 9513.0, 745574.0, 279984.0, 7870.0, 1707.0, 517.0, 195.0, 68.0, 31.0, 25.0, 18.0, 11.0, 9.0, 5.0, 8.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43603515625, -0.421478271484375, -0.40692138671875, -0.392364501953125, -0.3778076171875, -0.363250732421875, -0.34869384765625, -0.334136962890625, -0.319580078125, -0.305023193359375, -0.29046630859375, -0.275909423828125, -0.2613525390625, -0.246795654296875, -0.23223876953125, -0.217681884765625, -0.203125, -0.188568115234375, -0.17401123046875, -0.159454345703125, -0.1448974609375, -0.130340576171875, -0.11578369140625, -0.101226806640625, -0.086669921875, -0.072113037109375, -0.05755615234375, -0.042999267578125, -0.0284423828125, -0.013885498046875, 0.00067138671875, 0.015228271484375, 0.02978515625, 0.044342041015625, 0.05889892578125, 0.073455810546875, 0.0880126953125, 0.102569580078125, 0.11712646484375, 0.131683349609375, 0.146240234375, 0.160797119140625, 0.17535400390625, 0.189910888671875, 0.2044677734375, 0.219024658203125, 0.23358154296875, 0.248138427734375, 0.2626953125, 0.277252197265625, 0.29180908203125, 0.306365966796875, 0.3209228515625, 0.335479736328125, 0.35003662109375, 0.364593505859375, 0.379150390625, 0.393707275390625, 0.40826416015625, 0.422821044921875, 0.4373779296875, 0.451934814453125, 0.46649169921875, 0.481048583984375, 0.49560546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 9.0, 7.0, 12.0, 33.0, 35.0, 94.0, 209.0, 306.0, 137.0, 51.0, 37.0, 15.0, 11.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1170654296875, -0.11354351043701172, -0.11002159118652344, -0.10649967193603516, -0.10297775268554688, -0.0994558334350586, -0.09593391418457031, -0.09241199493408203, -0.08889007568359375, -0.08536815643310547, -0.08184623718261719, -0.0783243179321289, -0.07480239868164062, -0.07128047943115234, -0.06775856018066406, -0.06423664093017578, -0.0607147216796875, -0.05719280242919922, -0.05367088317871094, -0.050148963928222656, -0.046627044677734375, -0.043105125427246094, -0.03958320617675781, -0.03606128692626953, -0.03253936767578125, -0.02901744842529297, -0.025495529174804688, -0.021973609924316406, -0.018451690673828125, -0.014929771423339844, -0.011407852172851562, -0.007885932922363281, -0.004364013671875, -0.0008420944213867188, 0.0026798248291015625, 0.006201744079589844, 0.009723663330078125, 0.013245582580566406, 0.016767501831054688, 0.02028942108154297, 0.02381134033203125, 0.02733325958251953, 0.030855178833007812, 0.034377098083496094, 0.037899017333984375, 0.041420936584472656, 0.04494285583496094, 0.04846477508544922, 0.0519866943359375, 0.05550861358642578, 0.05903053283691406, 0.06255245208740234, 0.06607437133789062, 0.0695962905883789, 0.07311820983886719, 0.07664012908935547, 0.08016204833984375, 0.08368396759033203, 0.08720588684082031, 0.0907278060913086, 0.09424972534179688, 0.09777164459228516, 0.10129356384277344, 0.10481548309326172, 0.10833740234375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 4.0, 55.0, 944.0, 16.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8372344970703125, -2.6986899375915527, -1.5601451396942139, -0.421600341796875, 0.7169442176818848, 1.8554887771606445, 2.9940338134765625, 4.132578372955322, 5.271122932434082, 6.409667491912842, 7.548212051391602, 8.68675708770752, 9.825302124023438, 10.963846206665039, 12.102391242980957, 13.240936279296875, 14.379480361938477, 15.518025398254395, 16.656570434570312, 17.795114517211914, 18.933658599853516, 20.07220458984375, 21.21074867248535, 22.349292755126953, 23.487838745117188, 24.62638282775879, 25.764928817749023, 26.903472900390625, 28.042016983032227, 29.180561065673828, 30.319107055664062, 31.457651138305664, 32.596195220947266, 33.7347412109375, 34.87328338623047, 36.0118293762207, 37.15037536621094, 38.288917541503906, 39.42746353149414, 40.566009521484375, 41.704551696777344, 42.84309768676758, 43.98163986206055, 45.12018585205078, 46.258731842041016, 47.397274017333984, 48.53582000732422, 49.67436599731445, 50.81291198730469, 51.95145797729492, 53.09000015258789, 54.228546142578125, 55.36709213256836, 56.50563430786133, 57.64418029785156, 58.7827262878418, 59.921268463134766, 61.059814453125, 62.19835662841797, 63.3369026184082, 64.47544860839844, 65.6139907836914, 66.75253295898438, 67.89108276367188, 69.02962493896484]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 8.0, 9.0, 22.0, 15.0, 14.0, 27.0, 33.0, 35.0, 46.0, 46.0, 52.0, 65.0, 61.0, 60.0, 70.0, 60.0, 56.0, 46.0, 45.0, 38.0, 40.0, 35.0, 25.0, 22.0, 21.0, 16.0, 14.0, 5.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.642409324645996, -13.173080444335938, -12.703750610351562, -12.234421730041504, -11.765092849731445, -11.29576301574707, -10.826434135437012, -10.357105255126953, -9.887775421142578, -9.41844654083252, -8.949116706848145, -8.479787826538086, -8.010458946228027, -7.5411295890808105, -7.071800231933594, -6.602471351623535, -6.133142471313477, -5.66381311416626, -5.194484233856201, -4.725154876708984, -4.255825996398926, -3.786496639251709, -3.317167282104492, -2.8478381633758545, -2.378509044647217, -1.909179925918579, -1.4398506879806519, -0.9705214500427246, -0.5011923313140869, -0.03186321258544922, 0.4374661445617676, 0.9067952632904053, 1.3761234283447266, 1.8454525470733643, 2.314781665802002, 2.7841110229492188, 3.2534401416778564, 3.722769260406494, 4.192098617553711, 4.6614274978637695, 5.130756855010986, 5.600086212158203, 6.069415092468262, 6.5387444496154785, 7.008073806762695, 7.477402687072754, 7.946732044219971, 8.416061401367188, 8.885390281677246, 9.354719161987305, 9.82404899597168, 10.293377876281738, 10.762706756591797, 11.232036590576172, 11.70136547088623, 12.170694351196289, 12.640024185180664, 13.109353065490723, 13.578682899475098, 14.048011779785156, 14.517340660095215, 14.986669540405273, 15.455999374389648, 15.925328254699707, 16.394657135009766]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 6.0, 6.0, 10.0, 6.0, 10.0, 15.0, 25.0, 33.0, 37.0, 43.0, 65.0, 78.0, 177.0, 551.0, 2245.0, 30304.0, 1497307.0, 2598957.0, 59383.0, 3868.0, 621.0, 195.0, 86.0, 60.0, 39.0, 32.0, 29.0, 15.0, 14.0, 9.0, 10.0, 11.0, 9.0, 8.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6015625, -2.501800537109375, -2.40203857421875, -2.302276611328125, -2.2025146484375, -2.102752685546875, -2.00299072265625, -1.903228759765625, -1.803466796875, -1.703704833984375, -1.60394287109375, -1.504180908203125, -1.4044189453125, -1.304656982421875, -1.20489501953125, -1.105133056640625, -1.00537109375, -0.905609130859375, -0.80584716796875, -0.706085205078125, -0.6063232421875, -0.506561279296875, -0.40679931640625, -0.307037353515625, -0.207275390625, -0.107513427734375, -0.00775146484375, 0.092010498046875, 0.1917724609375, 0.291534423828125, 0.39129638671875, 0.491058349609375, 0.5908203125, 0.690582275390625, 0.79034423828125, 0.890106201171875, 0.9898681640625, 1.089630126953125, 1.18939208984375, 1.289154052734375, 1.388916015625, 1.488677978515625, 1.58843994140625, 1.688201904296875, 1.7879638671875, 1.887725830078125, 1.98748779296875, 2.087249755859375, 2.18701171875, 2.286773681640625, 2.38653564453125, 2.486297607421875, 2.5860595703125, 2.685821533203125, 2.78558349609375, 2.885345458984375, 2.985107421875, 3.084869384765625, 3.18463134765625, 3.284393310546875, 3.3841552734375, 3.483917236328125, 3.58367919921875, 3.683441162109375, 3.783203125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 15.0, 8.0, 8.0, 11.0, 15.0, 24.0, 33.0, 37.0, 45.0, 48.0, 66.0, 58.0, 61.0, 60.0, 66.0, 58.0, 61.0, 46.0, 39.0, 50.0, 37.0, 28.0, 26.0, 16.0, 11.0, 12.0, 8.0, 6.0, 8.0, 6.0, 4.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3447265625, -1.3039398193359375, -1.263153076171875, -1.2223663330078125, -1.18157958984375, -1.1407928466796875, -1.100006103515625, -1.0592193603515625, -1.0184326171875, -0.9776458740234375, -0.936859130859375, -0.8960723876953125, -0.85528564453125, -0.8144989013671875, -0.773712158203125, -0.7329254150390625, -0.692138671875, -0.6513519287109375, -0.610565185546875, -0.5697784423828125, -0.52899169921875, -0.4882049560546875, -0.447418212890625, -0.4066314697265625, -0.3658447265625, -0.3250579833984375, -0.284271240234375, -0.2434844970703125, -0.20269775390625, -0.1619110107421875, -0.121124267578125, -0.0803375244140625, -0.03955078125, 0.0012359619140625, 0.042022705078125, 0.0828094482421875, 0.12359619140625, 0.1643829345703125, 0.205169677734375, 0.2459564208984375, 0.2867431640625, 0.3275299072265625, 0.368316650390625, 0.4091033935546875, 0.44989013671875, 0.4906768798828125, 0.531463623046875, 0.5722503662109375, 0.613037109375, 0.6538238525390625, 0.694610595703125, 0.7353973388671875, 0.77618408203125, 0.8169708251953125, 0.857757568359375, 0.8985443115234375, 0.9393310546875, 0.9801177978515625, 1.020904541015625, 1.0616912841796875, 1.10247802734375, 1.1432647705078125, 1.184051513671875, 1.2248382568359375, 1.265625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 15.0, 41.0, 57.0, 116.0, 299.0, 585.0, 4191700.0, 712.0, 350.0, 200.0, 75.0, 44.0, 22.0, 13.0, 12.0, 9.0, 3.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.96875, -24.05224609375, -22.1357421875, -20.21923828125, -18.302734375, -16.38623046875, -14.4697265625, -12.55322265625, -10.63671875, -8.72021484375, -6.8037109375, -4.88720703125, -2.970703125, -1.05419921875, 0.8623046875, 2.77880859375, 4.6953125, 6.61181640625, 8.5283203125, 10.44482421875, 12.361328125, 14.27783203125, 16.1943359375, 18.11083984375, 20.02734375, 21.94384765625, 23.8603515625, 25.77685546875, 27.693359375, 29.60986328125, 31.5263671875, 33.44287109375, 35.359375, 37.27587890625, 39.1923828125, 41.10888671875, 43.025390625, 44.94189453125, 46.8583984375, 48.77490234375, 50.69140625, 52.60791015625, 54.5244140625, 56.44091796875, 58.357421875, 60.27392578125, 62.1904296875, 64.10693359375, 66.0234375, 67.93994140625, 69.8564453125, 71.77294921875, 73.689453125, 75.60595703125, 77.5224609375, 79.43896484375, 81.35546875, 83.27197265625, 85.1884765625, 87.10498046875, 89.021484375, 90.93798828125, 92.8544921875, 94.77099609375, 96.6875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 10.0, 5.0, 11.0, 20.0, 46.0, 51.0, 77.0, 232.0, 607.0, 1196.0, 981.0, 418.0, 204.0, 83.0, 41.0, 31.0, 17.0, 18.0, 6.0, 6.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.69580078125, -0.6724090576171875, -0.649017333984375, -0.6256256103515625, -0.60223388671875, -0.5788421630859375, -0.555450439453125, -0.5320587158203125, -0.5086669921875, -0.4852752685546875, -0.461883544921875, -0.4384918212890625, -0.41510009765625, -0.3917083740234375, -0.368316650390625, -0.3449249267578125, -0.321533203125, -0.2981414794921875, -0.274749755859375, -0.2513580322265625, -0.22796630859375, -0.2045745849609375, -0.181182861328125, -0.1577911376953125, -0.1343994140625, -0.1110076904296875, -0.087615966796875, -0.0642242431640625, -0.04083251953125, -0.0174407958984375, 0.005950927734375, 0.0293426513671875, 0.052734375, 0.0761260986328125, 0.099517822265625, 0.1229095458984375, 0.14630126953125, 0.1696929931640625, 0.193084716796875, 0.2164764404296875, 0.2398681640625, 0.2632598876953125, 0.286651611328125, 0.3100433349609375, 0.33343505859375, 0.3568267822265625, 0.380218505859375, 0.4036102294921875, 0.427001953125, 0.4503936767578125, 0.473785400390625, 0.4971771240234375, 0.52056884765625, 0.5439605712890625, 0.567352294921875, 0.5907440185546875, 0.6141357421875, 0.6375274658203125, 0.660919189453125, 0.6843109130859375, 0.70770263671875, 0.7310943603515625, 0.754486083984375, 0.7778778076171875, 0.80126953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 12.0, 19.0, 38.0, 93.0, 180.0, 269.0, 208.0, 92.0, 49.0, 19.0, 11.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.337700366973877, -4.242169380187988, -4.1466383934021, -4.051106929779053, -3.955575942993164, -3.8600449562072754, -3.7645139694213867, -3.668982744216919, -3.5734517574310303, -3.4779207706451416, -3.382389545440674, -3.286858558654785, -3.1913273334503174, -3.0957963466644287, -3.000265121459961, -2.9047341346740723, -2.8092031478881836, -2.713672161102295, -2.618140935897827, -2.5226099491119385, -2.4270787239074707, -2.331547737121582, -2.2360167503356934, -2.1404855251312256, -2.044954299926758, -1.9494231939315796, -1.8538920879364014, -1.7583611011505127, -1.6628299951553345, -1.5672988891601562, -1.471767783164978, -1.3762366771697998, -1.2807055711746216, -1.1851744651794434, -1.0896433591842651, -0.9941123127937317, -0.8985812664031982, -0.80305016040802, -0.7075190544128418, -0.6119880080223083, -0.5164569020271301, -0.4209258258342743, -0.32539474964141846, -0.22986364364624023, -0.1343325674533844, -0.038801491260528564, 0.05672961473464966, 0.1522606611251831, 0.24779176712036133, 0.34332284331321716, 0.438853919506073, 0.5343850255012512, 0.6299160718917847, 0.7254471778869629, 0.8209782838821411, 0.9165093302726746, 1.012040376663208, 1.1075714826583862, 1.2031025886535645, 1.2986335754394531, 1.3941646814346313, 1.4896957874298096, 1.5852268934249878, 1.680757999420166, 1.7762891054153442]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 4.0, 8.0, 4.0, 8.0, 15.0, 16.0, 27.0, 22.0, 25.0, 42.0, 34.0, 39.0, 47.0, 39.0, 54.0, 61.0, 58.0, 57.0, 60.0, 42.0, 51.0, 56.0, 30.0, 34.0, 36.0, 23.0, 22.0, 24.0, 9.0, 9.0, 8.0, 9.0, 5.0, 8.0, 1.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.6991792917251587, -1.653623104095459, -1.6080669164657593, -1.56251060962677, -1.5169544219970703, -1.4713982343673706, -1.425842046737671, -1.3802857398986816, -1.334729552268982, -1.2891733646392822, -1.2436171770095825, -1.1980608701705933, -1.1525046825408936, -1.1069484949111938, -1.0613923072814941, -1.0158360004425049, -0.97027987241745, -0.9247236847877502, -0.8791674375534058, -0.833611249923706, -0.7880550026893616, -0.7424988150596619, -0.6969425678253174, -0.6513863801956177, -0.605830192565918, -0.5602740049362183, -0.5147177577018738, -0.4691615700721741, -0.4236053228378296, -0.3780491352081299, -0.3324929177761078, -0.2869367003440857, -0.2413804531097412, -0.19582423567771912, -0.15026801824569702, -0.10471181571483612, -0.059155598282814026, -0.013599380850791931, 0.03195682168006897, 0.07751303911209106, 0.12306925654411316, 0.16862547397613525, 0.21418169140815735, 0.25973790884017944, 0.30529409646987915, 0.35085034370422363, 0.39640653133392334, 0.44196274876594543, 0.48751896619796753, 0.5330751538276672, 0.5786314010620117, 0.6241875886917114, 0.6697438359260559, 0.7153000235557556, 0.7608562707901001, 0.8064124584197998, 0.8519686460494995, 0.8975248336791992, 0.9430810809135437, 0.9886372685432434, 1.034193515777588, 1.0797497034072876, 1.1253058910369873, 1.1708621978759766, 1.2164183855056763]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 0.0, 3.0, 7.0, 7.0, 22.0, 18.0, 23.0, 37.0, 66.0, 96.0, 167.0, 308.0, 502.0, 1036.0, 2355.0, 6213.0, 27423.0, 426750.0, 539597.0, 32197.0, 6813.0, 2498.0, 1107.0, 535.0, 292.0, 190.0, 90.0, 63.0, 41.0, 22.0, 16.0, 21.0, 12.0, 8.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6162109375, -0.5969772338867188, -0.5777435302734375, -0.5585098266601562, -0.539276123046875, -0.5200424194335938, -0.5008087158203125, -0.48157501220703125, -0.46234130859375, -0.44310760498046875, -0.4238739013671875, -0.40464019775390625, -0.385406494140625, -0.36617279052734375, -0.3469390869140625, -0.32770538330078125, -0.3084716796875, -0.28923797607421875, -0.2700042724609375, -0.25077056884765625, -0.231536865234375, -0.21230316162109375, -0.1930694580078125, -0.17383575439453125, -0.15460205078125, -0.13536834716796875, -0.1161346435546875, -0.09690093994140625, -0.077667236328125, -0.05843353271484375, -0.0391998291015625, -0.01996612548828125, -0.000732421875, 0.01850128173828125, 0.0377349853515625, 0.05696868896484375, 0.076202392578125, 0.09543609619140625, 0.1146697998046875, 0.13390350341796875, 0.15313720703125, 0.17237091064453125, 0.1916046142578125, 0.21083831787109375, 0.230072021484375, 0.24930572509765625, 0.2685394287109375, 0.28777313232421875, 0.3070068359375, 0.32624053955078125, 0.3454742431640625, 0.36470794677734375, 0.383941650390625, 0.40317535400390625, 0.4224090576171875, 0.44164276123046875, 0.46087646484375, 0.48011016845703125, 0.4993438720703125, 0.5185775756835938, 0.537811279296875, 0.5570449829101562, 0.5762786865234375, 0.5955123901367188, 0.61474609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 7.0, 6.0, 5.0, 9.0, 18.0, 30.0, 45.0, 54.0, 59.0, 79.0, 81.0, 114.0, 86.0, 96.0, 69.0, 55.0, 56.0, 43.0, 30.0, 13.0, 13.0, 17.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6083984375, -1.561187744140625, -1.51397705078125, -1.466766357421875, -1.4195556640625, -1.372344970703125, -1.32513427734375, -1.277923583984375, -1.230712890625, -1.183502197265625, -1.13629150390625, -1.089080810546875, -1.0418701171875, -0.994659423828125, -0.94744873046875, -0.900238037109375, -0.85302734375, -0.805816650390625, -0.75860595703125, -0.711395263671875, -0.6641845703125, -0.616973876953125, -0.56976318359375, -0.522552490234375, -0.475341796875, -0.428131103515625, -0.38092041015625, -0.333709716796875, -0.2864990234375, -0.239288330078125, -0.19207763671875, -0.144866943359375, -0.09765625, -0.050445556640625, -0.00323486328125, 0.043975830078125, 0.0911865234375, 0.138397216796875, 0.18560791015625, 0.232818603515625, 0.280029296875, 0.327239990234375, 0.37445068359375, 0.421661376953125, 0.4688720703125, 0.516082763671875, 0.56329345703125, 0.610504150390625, 0.65771484375, 0.704925537109375, 0.75213623046875, 0.799346923828125, 0.8465576171875, 0.893768310546875, 0.94097900390625, 0.988189697265625, 1.035400390625, 1.082611083984375, 1.12982177734375, 1.177032470703125, 1.2242431640625, 1.271453857421875, 1.31866455078125, 1.365875244140625, 1.4130859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 6.0, 10.0, 9.0, 24.0, 23.0, 37.0, 54.0, 79.0, 92.0, 123.0, 175.0, 238.0, 355.0, 487.0, 705.0, 1121.0, 1511.0, 2269.0, 3395.0, 5274.0, 8248.0, 13257.0, 22389.0, 39945.0, 73993.0, 138986.0, 227327.0, 219100.0, 128330.0, 67800.0, 36861.0, 20941.0, 12366.0, 7815.0, 4837.0, 3189.0, 2183.0, 1517.0, 1050.0, 770.0, 483.0, 314.0, 270.0, 164.0, 151.0, 76.0, 64.0, 49.0, 28.0, 22.0, 15.0, 11.0, 11.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08056640625, -0.07796192169189453, -0.07535743713378906, -0.0727529525756836, -0.07014846801757812, -0.06754398345947266, -0.06493949890136719, -0.06233501434326172, -0.05973052978515625, -0.05712604522705078, -0.05452156066894531, -0.051917076110839844, -0.049312591552734375, -0.046708106994628906, -0.04410362243652344, -0.04149913787841797, -0.0388946533203125, -0.03629016876220703, -0.03368568420410156, -0.031081199645996094, -0.028476715087890625, -0.025872230529785156, -0.023267745971679688, -0.02066326141357422, -0.01805877685546875, -0.015454292297363281, -0.012849807739257812, -0.010245323181152344, -0.007640838623046875, -0.005036354064941406, -0.0024318695068359375, 0.00017261505126953125, 0.002777099609375, 0.005381584167480469, 0.007986068725585938, 0.010590553283691406, 0.013195037841796875, 0.015799522399902344, 0.018404006958007812, 0.02100849151611328, 0.02361297607421875, 0.02621746063232422, 0.028821945190429688, 0.031426429748535156, 0.034030914306640625, 0.036635398864746094, 0.03923988342285156, 0.04184436798095703, 0.0444488525390625, 0.04705333709716797, 0.04965782165527344, 0.052262306213378906, 0.054866790771484375, 0.057471275329589844, 0.06007575988769531, 0.06268024444580078, 0.06528472900390625, 0.06788921356201172, 0.07049369812011719, 0.07309818267822266, 0.07570266723632812, 0.0783071517944336, 0.08091163635253906, 0.08351612091064453, 0.08612060546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 3.0, 1.0, 4.0, 3.0, 8.0, 12.0, 5.0, 7.0, 11.0, 14.0, 15.0, 24.0, 24.0, 30.0, 37.0, 34.0, 32.0, 53.0, 49.0, 49.0, 46.0, 45.0, 45.0, 55.0, 39.0, 42.0, 38.0, 45.0, 38.0, 34.0, 29.0, 26.0, 18.0, 16.0, 13.0, 8.0, 13.0, 8.0, 5.0, 5.0, 7.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.5068359375, -1.4614105224609375, -1.415985107421875, -1.3705596923828125, -1.32513427734375, -1.2797088623046875, -1.234283447265625, -1.1888580322265625, -1.1434326171875, -1.0980072021484375, -1.052581787109375, -1.0071563720703125, -0.96173095703125, -0.9163055419921875, -0.870880126953125, -0.8254547119140625, -0.780029296875, -0.7346038818359375, -0.689178466796875, -0.6437530517578125, -0.59832763671875, -0.5529022216796875, -0.507476806640625, -0.4620513916015625, -0.4166259765625, -0.3712005615234375, -0.325775146484375, -0.2803497314453125, -0.23492431640625, -0.1894989013671875, -0.144073486328125, -0.0986480712890625, -0.05322265625, -0.0077972412109375, 0.037628173828125, 0.0830535888671875, 0.12847900390625, 0.1739044189453125, 0.219329833984375, 0.2647552490234375, 0.3101806640625, 0.3556060791015625, 0.401031494140625, 0.4464569091796875, 0.49188232421875, 0.5373077392578125, 0.582733154296875, 0.6281585693359375, 0.673583984375, 0.7190093994140625, 0.764434814453125, 0.8098602294921875, 0.85528564453125, 0.9007110595703125, 0.946136474609375, 0.9915618896484375, 1.0369873046875, 1.0824127197265625, 1.127838134765625, 1.1732635498046875, 1.21868896484375, 1.2641143798828125, 1.309539794921875, 1.3549652099609375, 1.400390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 9.0, 9.0, 6.0, 8.0, 16.0, 20.0, 34.0, 36.0, 67.0, 88.0, 130.0, 238.0, 299.0, 533.0, 906.0, 1695.0, 3523.0, 8166.0, 22961.0, 85311.0, 393318.0, 404256.0, 87611.0, 23606.0, 8098.0, 3427.0, 1710.0, 921.0, 524.0, 357.0, 197.0, 139.0, 86.0, 68.0, 53.0, 37.0, 32.0, 16.0, 12.0, 6.0, 9.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0127105712890625, -0.012287020683288574, -0.011863470077514648, -0.011439919471740723, -0.011016368865966797, -0.010592818260192871, -0.010169267654418945, -0.00974571704864502, -0.009322166442871094, -0.008898615837097168, -0.008475065231323242, -0.008051514625549316, -0.007627964019775391, -0.007204413414001465, -0.006780862808227539, -0.006357312202453613, -0.0059337615966796875, -0.005510210990905762, -0.005086660385131836, -0.00466310977935791, -0.004239559173583984, -0.0038160085678100586, -0.003392457962036133, -0.002968907356262207, -0.0025453567504882812, -0.0021218061447143555, -0.0016982555389404297, -0.001274704933166504, -0.0008511543273925781, -0.00042760372161865234, -4.0531158447265625e-06, 0.0004194974899291992, 0.000843048095703125, 0.0012665987014770508, 0.0016901493072509766, 0.0021136999130249023, 0.002537250518798828, 0.002960801124572754, 0.0033843517303466797, 0.0038079023361206055, 0.004231452941894531, 0.004655003547668457, 0.005078554153442383, 0.005502104759216309, 0.005925655364990234, 0.00634920597076416, 0.006772756576538086, 0.007196307182312012, 0.0076198577880859375, 0.008043408393859863, 0.008466958999633789, 0.008890509605407715, 0.00931406021118164, 0.009737610816955566, 0.010161161422729492, 0.010584712028503418, 0.011008262634277344, 0.01143181324005127, 0.011855363845825195, 0.012278914451599121, 0.012702465057373047, 0.013126015663146973, 0.013549566268920898, 0.013973116874694824, 0.01439666748046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 11.0, 17.0, 12.0, 25.0, 33.0, 42.0, 58.0, 56.0, 62.0, 64.0, 85.0, 88.0, 68.0, 65.0, 49.0, 52.0, 41.0, 31.0, 28.0, 25.0, 17.0, 8.0, 5.0, 10.0, 4.0, 4.0, 7.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.6748905181884766e-05, -1.6198493540287018e-05, -1.564808189868927e-05, -1.5097670257091522e-05, -1.4547258615493774e-05, -1.3996846973896027e-05, -1.3446435332298279e-05, -1.2896023690700531e-05, -1.2345612049102783e-05, -1.1795200407505035e-05, -1.1244788765907288e-05, -1.069437712430954e-05, -1.0143965482711792e-05, -9.593553841114044e-06, -9.043142199516296e-06, -8.492730557918549e-06, -7.9423189163208e-06, -7.391907274723053e-06, -6.841495633125305e-06, -6.291083991527557e-06, -5.7406723499298096e-06, -5.190260708332062e-06, -4.639849066734314e-06, -4.089437425136566e-06, -3.5390257835388184e-06, -2.9886141419410706e-06, -2.4382025003433228e-06, -1.887790858745575e-06, -1.3373792171478271e-06, -7.869675755500793e-07, -2.3655593395233154e-07, 3.1385570764541626e-07, 8.642673492431641e-07, 1.4146789908409119e-06, 1.9650906324386597e-06, 2.5155022740364075e-06, 3.0659139156341553e-06, 3.616325557231903e-06, 4.166737198829651e-06, 4.717148840427399e-06, 5.2675604820251465e-06, 5.817972123622894e-06, 6.368383765220642e-06, 6.91879540681839e-06, 7.469207048416138e-06, 8.019618690013885e-06, 8.570030331611633e-06, 9.120441973209381e-06, 9.670853614807129e-06, 1.0221265256404877e-05, 1.0771676898002625e-05, 1.1322088539600372e-05, 1.187250018119812e-05, 1.2422911822795868e-05, 1.2973323464393616e-05, 1.3523735105991364e-05, 1.4074146747589111e-05, 1.4624558389186859e-05, 1.5174970030784607e-05, 1.5725381672382355e-05, 1.6275793313980103e-05, 1.682620495557785e-05, 1.7376616597175598e-05, 1.7927028238773346e-05, 1.8477439880371094e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 7.0, 15.0, 18.0, 22.0, 24.0, 35.0, 51.0, 74.0, 127.0, 371.0, 8257.0, 1023476.0, 15223.0, 439.0, 142.0, 76.0, 43.0, 35.0, 19.0, 15.0, 19.0, 14.0, 8.0, 7.0, 6.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078857421875, -0.076507568359375, -0.07415771484375, -0.071807861328125, -0.0694580078125, -0.067108154296875, -0.06475830078125, -0.062408447265625, -0.06005859375, -0.057708740234375, -0.05535888671875, -0.053009033203125, -0.0506591796875, -0.048309326171875, -0.04595947265625, -0.043609619140625, -0.041259765625, -0.038909912109375, -0.03656005859375, -0.034210205078125, -0.0318603515625, -0.029510498046875, -0.02716064453125, -0.024810791015625, -0.0224609375, -0.020111083984375, -0.01776123046875, -0.015411376953125, -0.0130615234375, -0.010711669921875, -0.00836181640625, -0.006011962890625, -0.003662109375, -0.001312255859375, 0.00103759765625, 0.003387451171875, 0.0057373046875, 0.008087158203125, 0.01043701171875, 0.012786865234375, 0.01513671875, 0.017486572265625, 0.01983642578125, 0.022186279296875, 0.0245361328125, 0.026885986328125, 0.02923583984375, 0.031585693359375, 0.033935546875, 0.036285400390625, 0.03863525390625, 0.040985107421875, 0.0433349609375, 0.045684814453125, 0.04803466796875, 0.050384521484375, 0.052734375, 0.055084228515625, 0.05743408203125, 0.059783935546875, 0.0621337890625, 0.064483642578125, 0.06683349609375, 0.069183349609375, 0.071533203125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 4.0, 6.0, 13.0, 23.0, 30.0, 47.0, 59.0, 102.0, 137.0, 192.0, 138.0, 85.0, 42.0, 32.0, 22.0, 10.0, 15.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0074005126953125, -0.007201731204986572, -0.0070029497146606445, -0.006804168224334717, -0.006605386734008789, -0.006406605243682861, -0.006207823753356934, -0.006009042263031006, -0.005810260772705078, -0.00561147928237915, -0.005412697792053223, -0.005213916301727295, -0.005015134811401367, -0.0048163533210754395, -0.004617571830749512, -0.004418790340423584, -0.004220008850097656, -0.0040212273597717285, -0.0038224458694458008, -0.003623664379119873, -0.0034248828887939453, -0.0032261013984680176, -0.00302731990814209, -0.002828538417816162, -0.0026297569274902344, -0.0024309754371643066, -0.002232193946838379, -0.002033412456512451, -0.0018346309661865234, -0.0016358494758605957, -0.001437067985534668, -0.0012382864952087402, -0.0010395050048828125, -0.0008407235145568848, -0.000641942024230957, -0.0004431605339050293, -0.00024437904357910156, -4.559755325317383e-05, 0.0001531839370727539, 0.00035196542739868164, 0.0005507469177246094, 0.0007495284080505371, 0.0009483098983764648, 0.0011470913887023926, 0.0013458728790283203, 0.001544654369354248, 0.0017434358596801758, 0.0019422173500061035, 0.0021409988403320312, 0.002339780330657959, 0.0025385618209838867, 0.0027373433113098145, 0.002936124801635742, 0.00313490629196167, 0.0033336877822875977, 0.0035324692726135254, 0.003731250762939453, 0.003930032253265381, 0.004128813743591309, 0.004327595233917236, 0.004526376724243164, 0.004725158214569092, 0.0049239397048950195, 0.005122721195220947, 0.005321502685546875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 12.0, 16.0, 45.0, 102.0, 171.0, 273.0, 196.0, 100.0, 45.0, 18.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.208329439163208, -2.1550021171569824, -2.101674795150757, -2.0483474731445312, -1.9950200319290161, -1.9416927099227905, -1.888365387916565, -1.8350380659103394, -1.7817106246948242, -1.7283833026885986, -1.675055980682373, -1.6217286586761475, -1.5684012174606323, -1.5150738954544067, -1.4617465734481812, -1.4084192514419556, -1.35509192943573, -1.3017646074295044, -1.2484372854232788, -1.1951098442077637, -1.141782522201538, -1.0884552001953125, -1.035127878189087, -0.9818005561828613, -0.928473174571991, -0.8751458525657654, -0.821818470954895, -0.7684911489486694, -0.7151638269424438, -0.6618364453315735, -0.6085091233253479, -0.5551817417144775, -0.5018543004989624, -0.44852694869041443, -0.39519959688186646, -0.34187227487564087, -0.2885449230670929, -0.23521757125854492, -0.18189024925231934, -0.12856289744377136, -0.07523554563522339, -0.021908201277256012, 0.031419143080711365, 0.08474647998809814, 0.13807383179664612, 0.1914011836051941, 0.24472850561141968, 0.29805585741996765, 0.3513832092285156, 0.4047105610370636, 0.4580379128456116, 0.5113652348518372, 0.5646926164627075, 0.6180199384689331, 0.6713472604751587, 0.7246745824813843, 0.7780019640922546, 0.8313292860984802, 0.8846566677093506, 0.9379839897155762, 0.9913113117218018, 1.0446386337280273, 1.097965955734253, 1.151293396949768, 1.2046207189559937]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 4.0, 6.0, 18.0, 26.0, 29.0, 48.0, 55.0, 53.0, 65.0, 71.0, 92.0, 85.0, 82.0, 77.0, 59.0, 56.0, 41.0, 32.0, 27.0, 19.0, 16.0, 6.0, 6.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3530519008636475, -1.312319278717041, -1.2715866565704346, -1.2308539152145386, -1.1901212930679321, -1.1493886709213257, -1.1086560487747192, -1.0679234266281128, -1.0271906852722168, -0.9864580631256104, -0.9457253813743591, -0.9049927592277527, -0.8642600774765015, -0.823527455329895, -0.7827948331832886, -0.7420622110366821, -0.7013295888900757, -0.6605969667434692, -0.619864284992218, -0.5791316628456116, -0.5383989810943604, -0.4976663589477539, -0.45693373680114746, -0.41620108485221863, -0.3754684329032898, -0.33473578095436096, -0.29400312900543213, -0.2532705068588257, -0.21253785490989685, -0.17180520296096802, -0.13107256591320038, -0.09033992886543274, -0.049607157707214355, -0.00887451320886612, 0.03185813128948212, 0.07259077578783035, 0.11332342028617859, 0.15405607223510742, 0.19478870928287506, 0.2355213463306427, 0.27625399827957153, 0.31698665022850037, 0.3577193021774292, 0.39845192432403564, 0.4391845762729645, 0.4799172282218933, 0.5206498503684998, 0.561382532119751, 0.6021151542663574, 0.6428477764129639, 0.6835804581642151, 0.7243130803108215, 0.7650457620620728, 0.8057783842086792, 0.8465110063552856, 0.8872436285018921, 0.9279763102531433, 0.9687089323997498, 1.009441614151001, 1.0501742362976074, 1.0909068584442139, 1.1316394805908203, 1.1723722219467163, 1.2131048440933228, 1.2538374662399292]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 14.0, 35.0, 48.0, 79.0, 148.0, 233.0, 480.0, 986.0, 2626.0, 10913.0, 73913.0, 767938.0, 165595.0, 18964.0, 3963.0, 1340.0, 583.0, 302.0, 158.0, 86.0, 55.0, 39.0, 16.0, 11.0, 4.0, 5.0, 7.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89013671875, -0.8620223999023438, -0.8339080810546875, -0.8057937622070312, -0.777679443359375, -0.7495651245117188, -0.7214508056640625, -0.6933364868164062, -0.66522216796875, -0.6371078491210938, -0.6089935302734375, -0.5808792114257812, -0.552764892578125, -0.5246505737304688, -0.4965362548828125, -0.46842193603515625, -0.4403076171875, -0.41219329833984375, -0.3840789794921875, -0.35596466064453125, -0.327850341796875, -0.29973602294921875, -0.2716217041015625, -0.24350738525390625, -0.21539306640625, -0.18727874755859375, -0.1591644287109375, -0.13105010986328125, -0.102935791015625, -0.07482147216796875, -0.0467071533203125, -0.01859283447265625, 0.009521484375, 0.03763580322265625, 0.0657501220703125, 0.09386444091796875, 0.121978759765625, 0.15009307861328125, 0.1782073974609375, 0.20632171630859375, 0.23443603515625, 0.26255035400390625, 0.2906646728515625, 0.31877899169921875, 0.346893310546875, 0.37500762939453125, 0.4031219482421875, 0.43123626708984375, 0.4593505859375, 0.48746490478515625, 0.5155792236328125, 0.5436935424804688, 0.571807861328125, 0.5999221801757812, 0.6280364990234375, 0.6561508178710938, 0.68426513671875, 0.7123794555664062, 0.7404937744140625, 0.7686080932617188, 0.796722412109375, 0.8248367309570312, 0.8529510498046875, 0.8810653686523438, 0.9091796875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 3.0, 4.0, 10.0, 10.0, 16.0, 33.0, 47.0, 51.0, 68.0, 94.0, 118.0, 108.0, 107.0, 84.0, 77.0, 43.0, 50.0, 29.0, 20.0, 14.0, 7.0, 15.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.95703125, -6.74310302734375, -6.5291748046875, -6.31524658203125, -6.101318359375, -5.88739013671875, -5.6734619140625, -5.45953369140625, -5.24560546875, -5.03167724609375, -4.8177490234375, -4.60382080078125, -4.389892578125, -4.17596435546875, -3.9620361328125, -3.74810791015625, -3.5341796875, -3.32025146484375, -3.1063232421875, -2.89239501953125, -2.678466796875, -2.46453857421875, -2.2506103515625, -2.03668212890625, -1.82275390625, -1.60882568359375, -1.3948974609375, -1.18096923828125, -0.967041015625, -0.75311279296875, -0.5391845703125, -0.32525634765625, -0.111328125, 0.10260009765625, 0.3165283203125, 0.53045654296875, 0.744384765625, 0.95831298828125, 1.1722412109375, 1.38616943359375, 1.60009765625, 1.81402587890625, 2.0279541015625, 2.24188232421875, 2.455810546875, 2.66973876953125, 2.8836669921875, 3.09759521484375, 3.3115234375, 3.52545166015625, 3.7393798828125, 3.95330810546875, 4.167236328125, 4.38116455078125, 4.5950927734375, 4.80902099609375, 5.02294921875, 5.23687744140625, 5.4508056640625, 5.66473388671875, 5.878662109375, 6.09259033203125, 6.3065185546875, 6.52044677734375, 6.734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 9.0, 12.0, 14.0, 15.0, 26.0, 34.0, 51.0, 51.0, 45.0, 52.0, 56.0, 189.0, 1047424.0, 167.0, 87.0, 61.0, 44.0, 51.0, 34.0, 29.0, 22.0, 21.0, 16.0, 11.0, 4.0, 8.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.78125, -17.9814453125, -17.181640625, -16.3818359375, -15.58203125, -14.7822265625, -13.982421875, -13.1826171875, -12.3828125, -11.5830078125, -10.783203125, -9.9833984375, -9.18359375, -8.3837890625, -7.583984375, -6.7841796875, -5.984375, -5.1845703125, -4.384765625, -3.5849609375, -2.78515625, -1.9853515625, -1.185546875, -0.3857421875, 0.4140625, 1.2138671875, 2.013671875, 2.8134765625, 3.61328125, 4.4130859375, 5.212890625, 6.0126953125, 6.8125, 7.6123046875, 8.412109375, 9.2119140625, 10.01171875, 10.8115234375, 11.611328125, 12.4111328125, 13.2109375, 14.0107421875, 14.810546875, 15.6103515625, 16.41015625, 17.2099609375, 18.009765625, 18.8095703125, 19.609375, 20.4091796875, 21.208984375, 22.0087890625, 22.80859375, 23.6083984375, 24.408203125, 25.2080078125, 26.0078125, 26.8076171875, 27.607421875, 28.4072265625, 29.20703125, 30.0068359375, 30.806640625, 31.6064453125, 32.40625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 12.0, 11.0, 17.0, 27.0, 37.0, 49.0, 51.0, 50.0, 47.0, 57.0, 90.0, 85.0, 57.0, 84.0, 60.0, 43.0, 48.0, 36.0, 30.0, 19.0, 23.0, 16.0, 11.0, 3.0, 7.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12890625, -3.95245361328125, -3.7760009765625, -3.59954833984375, -3.423095703125, -3.24664306640625, -3.0701904296875, -2.89373779296875, -2.71728515625, -2.54083251953125, -2.3643798828125, -2.18792724609375, -2.011474609375, -1.83502197265625, -1.6585693359375, -1.48211669921875, -1.3056640625, -1.12921142578125, -0.9527587890625, -0.77630615234375, -0.599853515625, -0.42340087890625, -0.2469482421875, -0.07049560546875, 0.10595703125, 0.28240966796875, 0.4588623046875, 0.63531494140625, 0.811767578125, 0.98822021484375, 1.1646728515625, 1.34112548828125, 1.517578125, 1.69403076171875, 1.8704833984375, 2.04693603515625, 2.223388671875, 2.39984130859375, 2.5762939453125, 2.75274658203125, 2.92919921875, 3.10565185546875, 3.2821044921875, 3.45855712890625, 3.635009765625, 3.81146240234375, 3.9879150390625, 4.16436767578125, 4.3408203125, 4.51727294921875, 4.6937255859375, 4.87017822265625, 5.046630859375, 5.22308349609375, 5.3995361328125, 5.57598876953125, 5.75244140625, 5.92889404296875, 6.1053466796875, 6.28179931640625, 6.458251953125, 6.63470458984375, 6.8111572265625, 6.98760986328125, 7.1640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 6.0, 8.0, 9.0, 9.0, 17.0, 15.0, 22.0, 34.0, 51.0, 88.0, 208.0, 401.0, 1323.0, 4871.0, 26144.0, 890897.0, 109056.0, 11410.0, 2607.0, 730.0, 278.0, 130.0, 65.0, 34.0, 29.0, 21.0, 15.0, 18.0, 11.0, 7.0, 5.0, 6.0, 1.0, 3.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2626953125, -0.25415802001953125, -0.2456207275390625, -0.23708343505859375, -0.228546142578125, -0.22000885009765625, -0.2114715576171875, -0.20293426513671875, -0.19439697265625, -0.18585968017578125, -0.1773223876953125, -0.16878509521484375, -0.160247802734375, -0.15171051025390625, -0.1431732177734375, -0.13463592529296875, -0.1260986328125, -0.11756134033203125, -0.1090240478515625, -0.10048675537109375, -0.091949462890625, -0.08341217041015625, -0.0748748779296875, -0.06633758544921875, -0.05780029296875, -0.04926300048828125, -0.0407257080078125, -0.03218841552734375, -0.023651123046875, -0.01511383056640625, -0.0065765380859375, 0.00196075439453125, 0.010498046875, 0.01903533935546875, 0.0275726318359375, 0.03610992431640625, 0.044647216796875, 0.05318450927734375, 0.0617218017578125, 0.07025909423828125, 0.07879638671875, 0.08733367919921875, 0.0958709716796875, 0.10440826416015625, 0.112945556640625, 0.12148284912109375, 0.1300201416015625, 0.13855743408203125, 0.1470947265625, 0.15563201904296875, 0.1641693115234375, 0.17270660400390625, 0.181243896484375, 0.18978118896484375, 0.1983184814453125, 0.20685577392578125, 0.21539306640625, 0.22393035888671875, 0.2324676513671875, 0.24100494384765625, 0.249542236328125, 0.25807952880859375, 0.2666168212890625, 0.27515411376953125, 0.28369140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 4.0, 3.0, 10.0, 10.0, 15.0, 26.0, 125.0, 533.0, 173.0, 42.0, 17.0, 13.0, 4.0, 5.0, 4.0, 4.0, 1.0, 7.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.4776668548583984e-05, -5.3194351494312286e-05, -5.161203444004059e-05, -5.002971738576889e-05, -4.844740033149719e-05, -4.6865083277225494e-05, -4.5282766222953796e-05, -4.37004491686821e-05, -4.21181321144104e-05, -4.05358150601387e-05, -3.8953498005867004e-05, -3.7371180951595306e-05, -3.578886389732361e-05, -3.420654684305191e-05, -3.262422978878021e-05, -3.1041912734508514e-05, -2.9459595680236816e-05, -2.787727862596512e-05, -2.629496157169342e-05, -2.4712644517421722e-05, -2.3130327463150024e-05, -2.1548010408878326e-05, -1.996569335460663e-05, -1.838337630033493e-05, -1.6801059246063232e-05, -1.5218742191791534e-05, -1.3636425137519836e-05, -1.2054108083248138e-05, -1.047179102897644e-05, -8.889473974704742e-06, -7.3071569204330444e-06, -5.7248398661613464e-06, -4.1425228118896484e-06, -2.5602057576179504e-06, -9.778887033462524e-07, 6.044283509254456e-07, 2.1867454051971436e-06, 3.7690624594688416e-06, 5.3513795137405396e-06, 6.9336965680122375e-06, 8.516013622283936e-06, 1.0098330676555634e-05, 1.1680647730827332e-05, 1.326296478509903e-05, 1.4845281839370728e-05, 1.6427598893642426e-05, 1.8009915947914124e-05, 1.959223300218582e-05, 2.117455005645752e-05, 2.2756867110729218e-05, 2.4339184165000916e-05, 2.5921501219272614e-05, 2.750381827354431e-05, 2.908613532781601e-05, 3.066845238208771e-05, 3.2250769436359406e-05, 3.3833086490631104e-05, 3.54154035449028e-05, 3.69977205991745e-05, 3.85800376534462e-05, 4.0162354707717896e-05, 4.1744671761989594e-05, 4.332698881626129e-05, 4.490930587053299e-05, 4.649162292480469e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 1.0, 4.0, 5.0, 11.0, 2.0, 9.0, 19.0, 19.0, 40.0, 39.0, 63.0, 87.0, 139.0, 230.0, 431.0, 893.0, 1846.0, 4485.0, 12054.0, 43223.0, 809943.0, 139925.0, 21921.0, 7406.0, 3003.0, 1286.0, 643.0, 331.0, 178.0, 104.0, 61.0, 55.0, 20.0, 16.0, 12.0, 16.0, 7.0, 8.0, 6.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1595458984375, -0.15379905700683594, -0.14805221557617188, -0.1423053741455078, -0.13655853271484375, -0.1308116912841797, -0.12506484985351562, -0.11931800842285156, -0.1135711669921875, -0.10782432556152344, -0.10207748413085938, -0.09633064270019531, -0.09058380126953125, -0.08483695983886719, -0.07909011840820312, -0.07334327697753906, -0.067596435546875, -0.06184959411621094, -0.056102752685546875, -0.05035591125488281, -0.04460906982421875, -0.03886222839355469, -0.033115386962890625, -0.027368545532226562, -0.0216217041015625, -0.015874862670898438, -0.010128021240234375, -0.0043811798095703125, 0.00136566162109375, 0.0071125030517578125, 0.012859344482421875, 0.018606185913085938, 0.02435302734375, 0.030099868774414062, 0.035846710205078125, 0.04159355163574219, 0.04734039306640625, 0.05308723449707031, 0.058834075927734375, 0.06458091735839844, 0.0703277587890625, 0.07607460021972656, 0.08182144165039062, 0.08756828308105469, 0.09331512451171875, 0.09906196594238281, 0.10480880737304688, 0.11055564880371094, 0.116302490234375, 0.12204933166503906, 0.12779617309570312, 0.1335430145263672, 0.13928985595703125, 0.1450366973876953, 0.15078353881835938, 0.15653038024902344, 0.1622772216796875, 0.16802406311035156, 0.17377090454101562, 0.1795177459716797, 0.18526458740234375, 0.1910114288330078, 0.19675827026367188, 0.20250511169433594, 0.208251953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 2.0, 5.0, 5.0, 4.0, 13.0, 16.0, 19.0, 22.0, 29.0, 57.0, 135.0, 355.0, 156.0, 49.0, 23.0, 20.0, 17.0, 11.0, 9.0, 10.0, 4.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.101318359375, -0.0986175537109375, -0.095916748046875, -0.0932159423828125, -0.09051513671875, -0.0878143310546875, -0.085113525390625, -0.0824127197265625, -0.0797119140625, -0.0770111083984375, -0.074310302734375, -0.0716094970703125, -0.06890869140625, -0.0662078857421875, -0.063507080078125, -0.0608062744140625, -0.05810546875, -0.0554046630859375, -0.052703857421875, -0.0500030517578125, -0.04730224609375, -0.0446014404296875, -0.041900634765625, -0.0391998291015625, -0.0364990234375, -0.0337982177734375, -0.031097412109375, -0.0283966064453125, -0.02569580078125, -0.0229949951171875, -0.020294189453125, -0.0175933837890625, -0.014892578125, -0.0121917724609375, -0.009490966796875, -0.0067901611328125, -0.00408935546875, -0.0013885498046875, 0.001312255859375, 0.0040130615234375, 0.0067138671875, 0.0094146728515625, 0.012115478515625, 0.0148162841796875, 0.01751708984375, 0.0202178955078125, 0.022918701171875, 0.0256195068359375, 0.0283203125, 0.0310211181640625, 0.033721923828125, 0.0364227294921875, 0.03912353515625, 0.0418243408203125, 0.044525146484375, 0.0472259521484375, 0.0499267578125, 0.0526275634765625, 0.055328369140625, 0.0580291748046875, 0.06072998046875, 0.0634307861328125, 0.066131591796875, 0.0688323974609375, 0.071533203125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 25.0, 157.0, 514.0, 258.0, 36.0, 13.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.88417387008667, -2.6316254138946533, -2.3790769577026367, -2.12652850151062, -1.8739800453186035, -1.621431589126587, -1.3688831329345703, -1.1163346767425537, -0.8637862205505371, -0.6112377643585205, -0.3586893081665039, -0.1061408519744873, 0.1464076042175293, 0.3989560604095459, 0.6515045166015625, 0.9040529727935791, 1.1566014289855957, 1.4091498851776123, 1.661698341369629, 1.9142467975616455, 2.166795253753662, 2.4193437099456787, 2.6718921661376953, 2.924440622329712, 3.1769890785217285, 3.429537534713745, 3.6820859909057617, 3.9346344470977783, 4.187182903289795, 4.439731597900391, 4.692279815673828, 4.944828033447266, 5.197376251220703, 5.449924468994141, 5.702473163604736, 5.955021858215332, 6.2075700759887695, 6.460118293762207, 6.712666988372803, 6.965215682983398, 7.217763900756836, 7.470312118530273, 7.722860813140869, 7.975409507751465, 8.227957725524902, 8.48050594329834, 8.733055114746094, 8.985603332519531, 9.238151550292969, 9.490699768066406, 9.743247985839844, 9.995797157287598, 10.248345375061035, 10.500893592834473, 10.753442764282227, 11.005990982055664, 11.258539199829102, 11.511087417602539, 11.763635635375977, 12.01618480682373, 12.268733024597168, 12.521281242370605, 12.77383041381836, 13.026378631591797, 13.278926849365234]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 8.0, 10.0, 8.0, 9.0, 15.0, 11.0, 20.0, 36.0, 33.0, 33.0, 33.0, 46.0, 51.0, 49.0, 59.0, 44.0, 53.0, 45.0, 56.0, 40.0, 36.0, 35.0, 42.0, 37.0, 45.0, 26.0, 28.0, 18.0, 16.0, 13.0, 11.0, 9.0, 6.0, 8.0, 6.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.30205249786377, -8.099584579467773, -7.8971171379089355, -7.694649696350098, -7.492181777954102, -7.289714336395264, -7.087246894836426, -6.88477897644043, -6.682311534881592, -6.479844093322754, -6.277376174926758, -6.07490873336792, -5.872441291809082, -5.669973373413086, -5.467505931854248, -5.26503849029541, -5.062570571899414, -4.860103130340576, -4.65763521194458, -4.455167770385742, -4.252699851989746, -4.050232410430908, -3.8477649688720703, -3.6452972888946533, -3.4428296089172363, -3.2403619289398193, -3.0378942489624023, -2.8354268074035645, -2.6329591274261475, -2.4304914474487305, -2.2280240058898926, -2.0255563259124756, -1.8230891227722168, -1.6206214427947998, -1.4181538820266724, -1.215686321258545, -1.013218641281128, -0.8107509613037109, -0.6082834005355835, -0.40581583976745605, -0.20334815979003906, -0.0008805394172668457, 0.20158708095550537, 0.4040547013282776, 0.6065223217010498, 0.8089900016784668, 1.0114575624465942, 1.2139251232147217, 1.4163928031921387, 1.6188604831695557, 1.821328043937683, 2.0237956047058105, 2.2262632846832275, 2.4287309646606445, 2.6311984062194824, 2.8336660861968994, 3.0361337661743164, 3.2386014461517334, 3.4410691261291504, 3.6435365676879883, 3.8460042476654053, 4.048471927642822, 4.25093936920166, 4.453407287597656, 4.655874729156494]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 5.0, 3.0, 10.0, 11.0, 11.0, 18.0, 19.0, 28.0, 37.0, 58.0, 85.0, 214.0, 644.0, 5688.0, 405483.0, 3752512.0, 27417.0, 1429.0, 260.0, 107.0, 55.0, 37.0, 39.0, 26.0, 24.0, 15.0, 12.0, 10.0, 9.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.83984375, -4.716461181640625, -4.59307861328125, -4.469696044921875, -4.3463134765625, -4.222930908203125, -4.09954833984375, -3.976165771484375, -3.852783203125, -3.729400634765625, -3.60601806640625, -3.482635498046875, -3.3592529296875, -3.235870361328125, -3.11248779296875, -2.989105224609375, -2.86572265625, -2.742340087890625, -2.61895751953125, -2.495574951171875, -2.3721923828125, -2.248809814453125, -2.12542724609375, -2.002044677734375, -1.878662109375, -1.755279541015625, -1.63189697265625, -1.508514404296875, -1.3851318359375, -1.261749267578125, -1.13836669921875, -1.014984130859375, -0.8916015625, -0.768218994140625, -0.64483642578125, -0.521453857421875, -0.3980712890625, -0.274688720703125, -0.15130615234375, -0.027923583984375, 0.095458984375, 0.218841552734375, 0.34222412109375, 0.465606689453125, 0.5889892578125, 0.712371826171875, 0.83575439453125, 0.959136962890625, 1.08251953125, 1.205902099609375, 1.32928466796875, 1.452667236328125, 1.5760498046875, 1.699432373046875, 1.82281494140625, 1.946197509765625, 2.069580078125, 2.192962646484375, 2.31634521484375, 2.439727783203125, 2.5631103515625, 2.686492919921875, 2.80987548828125, 2.933258056640625, 3.056640625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 3.0, 5.0, 7.0, 11.0, 20.0, 23.0, 33.0, 53.0, 73.0, 71.0, 83.0, 105.0, 102.0, 96.0, 84.0, 64.0, 44.0, 36.0, 29.0, 20.0, 11.0, 8.0, 5.0, 6.0, 1.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3935546875, -1.350006103515625, -1.30645751953125, -1.262908935546875, -1.2193603515625, -1.175811767578125, -1.13226318359375, -1.088714599609375, -1.045166015625, -1.001617431640625, -0.95806884765625, -0.914520263671875, -0.8709716796875, -0.827423095703125, -0.78387451171875, -0.740325927734375, -0.69677734375, -0.653228759765625, -0.60968017578125, -0.566131591796875, -0.5225830078125, -0.479034423828125, -0.43548583984375, -0.391937255859375, -0.348388671875, -0.304840087890625, -0.26129150390625, -0.217742919921875, -0.1741943359375, -0.130645751953125, -0.08709716796875, -0.043548583984375, 0.0, 0.043548583984375, 0.08709716796875, 0.130645751953125, 0.1741943359375, 0.217742919921875, 0.26129150390625, 0.304840087890625, 0.348388671875, 0.391937255859375, 0.43548583984375, 0.479034423828125, 0.5225830078125, 0.566131591796875, 0.60968017578125, 0.653228759765625, 0.69677734375, 0.740325927734375, 0.78387451171875, 0.827423095703125, 0.8709716796875, 0.914520263671875, 0.95806884765625, 1.001617431640625, 1.045166015625, 1.088714599609375, 1.13226318359375, 1.175811767578125, 1.2193603515625, 1.262908935546875, 1.30645751953125, 1.350006103515625, 1.3935546875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 7.0, 15.0, 25.0, 72.0, 202.0, 1032.0, 4090325.0, 101756.0, 611.0, 135.0, 38.0, 15.0, 7.0, 10.0, 9.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8671875, -9.5576171875, -9.248046875, -8.9384765625, -8.62890625, -8.3193359375, -8.009765625, -7.7001953125, -7.390625, -7.0810546875, -6.771484375, -6.4619140625, -6.15234375, -5.8427734375, -5.533203125, -5.2236328125, -4.9140625, -4.6044921875, -4.294921875, -3.9853515625, -3.67578125, -3.3662109375, -3.056640625, -2.7470703125, -2.4375, -2.1279296875, -1.818359375, -1.5087890625, -1.19921875, -0.8896484375, -0.580078125, -0.2705078125, 0.0390625, 0.3486328125, 0.658203125, 0.9677734375, 1.27734375, 1.5869140625, 1.896484375, 2.2060546875, 2.515625, 2.8251953125, 3.134765625, 3.4443359375, 3.75390625, 4.0634765625, 4.373046875, 4.6826171875, 4.9921875, 5.3017578125, 5.611328125, 5.9208984375, 6.23046875, 6.5400390625, 6.849609375, 7.1591796875, 7.46875, 7.7783203125, 8.087890625, 8.3974609375, 8.70703125, 9.0166015625, 9.326171875, 9.6357421875, 9.9453125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 1.0, 22.0, 37.0, 107.0, 325.0, 1860.0, 1334.0, 253.0, 82.0, 33.0, 12.0, 9.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75244140625, -0.7145919799804688, -0.6767425537109375, -0.6388931274414062, -0.601043701171875, -0.5631942749023438, -0.5253448486328125, -0.48749542236328125, -0.44964599609375, -0.41179656982421875, -0.3739471435546875, -0.33609771728515625, -0.298248291015625, -0.26039886474609375, -0.2225494384765625, -0.18470001220703125, -0.1468505859375, -0.10900115966796875, -0.0711517333984375, -0.03330230712890625, 0.004547119140625, 0.04239654541015625, 0.0802459716796875, 0.11809539794921875, 0.15594482421875, 0.19379425048828125, 0.2316436767578125, 0.26949310302734375, 0.307342529296875, 0.34519195556640625, 0.3830413818359375, 0.42089080810546875, 0.458740234375, 0.49658966064453125, 0.5344390869140625, 0.5722885131835938, 0.610137939453125, 0.6479873657226562, 0.6858367919921875, 0.7236862182617188, 0.76153564453125, 0.7993850708007812, 0.8372344970703125, 0.8750839233398438, 0.912933349609375, 0.9507827758789062, 0.9886322021484375, 1.0264816284179688, 1.0643310546875, 1.1021804809570312, 1.1400299072265625, 1.1778793334960938, 1.215728759765625, 1.2535781860351562, 1.2914276123046875, 1.3292770385742188, 1.36712646484375, 1.4049758911132812, 1.4428253173828125, 1.4806747436523438, 1.518524169921875, 1.5563735961914062, 1.5942230224609375, 1.6320724487304688, 1.669921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 8.0, 15.0, 19.0, 33.0, 54.0, 99.0, 157.0, 160.0, 134.0, 110.0, 81.0, 72.0, 18.0, 10.0, 9.0, 7.0, 10.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.595392942428589, -2.5329976081848145, -2.470602035522461, -2.4082067012786865, -2.345811367034912, -2.2834157943725586, -2.221020460128784, -2.1586251258850098, -2.0962295532226562, -2.033834218978882, -1.9714387655258179, -1.909043312072754, -1.8466479778289795, -1.7842525243759155, -1.7218570709228516, -1.6594617366790771, -1.5970664024353027, -1.5346709489822388, -1.4722756147384644, -1.4098801612854004, -1.347484827041626, -1.285089373588562, -1.222693920135498, -1.1602985858917236, -1.0979031324386597, -1.0355076789855957, -0.9731123447418213, -0.9107168912887573, -0.8483214974403381, -0.785926103591919, -0.723530650138855, -0.6611352562904358, -0.5987399816513062, -0.536344587802887, -0.4739491641521454, -0.4115537405014038, -0.3491583466529846, -0.28676295280456543, -0.22436752915382385, -0.16197210550308228, -0.09957671165466309, -0.0371813029050827, 0.02521410584449768, 0.08760951459407806, 0.15000492334365845, 0.21240031719207764, 0.2747957408428192, 0.3371911644935608, 0.39958655834198, 0.46198195219039917, 0.5243773460388184, 0.5867727994918823, 0.6491681933403015, 0.7115635871887207, 0.7739590406417847, 0.8363544344902039, 0.898749828338623, 0.9611452221870422, 1.0235406160354614, 1.0859360694885254, 1.1483314037322998, 1.2107268571853638, 1.2731223106384277, 1.3355176448822021, 1.3979130983352661]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 6.0, 13.0, 20.0, 21.0, 28.0, 48.0, 43.0, 82.0, 85.0, 83.0, 86.0, 109.0, 82.0, 74.0, 62.0, 49.0, 36.0, 28.0, 14.0, 17.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5845205783843994, -1.5264019966125488, -1.4682832956314087, -1.410164713859558, -1.3520461320877075, -1.2939274311065674, -1.2358088493347168, -1.1776902675628662, -1.1195716857910156, -1.061453104019165, -1.003334403038025, -0.9452158212661743, -0.8870972394943237, -0.8289785981178284, -0.770859956741333, -0.7127413749694824, -0.6546227335929871, -0.5965040922164917, -0.5383855104446411, -0.48026686906814575, -0.42214828729629517, -0.3640296459197998, -0.30591103434562683, -0.24779242277145386, -0.18967381119728088, -0.1315551996231079, -0.07343658059835434, -0.015317961573600769, 0.042800650000572205, 0.10091927647590637, 0.15903788805007935, 0.21715649962425232, 0.2752751111984253, 0.33339372277259827, 0.39151233434677124, 0.4496309757232666, 0.5077495574951172, 0.5658681988716125, 0.6239868402481079, 0.6821054220199585, 0.7402240037918091, 0.7983426451683044, 0.856461226940155, 0.9145798683166504, 0.972698450088501, 1.0308170318603516, 1.0889357328414917, 1.1470543146133423, 1.2051730155944824, 1.263291597366333, 1.3214102983474731, 1.3795288801193237, 1.4376474618911743, 1.4957661628723145, 1.553884744644165, 1.6120033264160156, 1.6701219081878662, 1.7282404899597168, 1.786359190940857, 1.8444777727127075, 1.902596354484558, 1.9607150554656982, 2.018833637237549, 2.0769522190093994, 2.13507080078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 11.0, 6.0, 14.0, 29.0, 23.0, 66.0, 122.0, 300.0, 713.0, 2503.0, 14757.0, 542655.0, 470117.0, 13576.0, 2426.0, 679.0, 297.0, 125.0, 59.0, 28.0, 16.0, 10.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.469970703125, -0.4531745910644531, -0.43637847900390625, -0.4195823669433594, -0.4027862548828125, -0.3859901428222656, -0.36919403076171875, -0.3523979187011719, -0.335601806640625, -0.3188056945800781, -0.30200958251953125, -0.2852134704589844, -0.2684173583984375, -0.2516212463378906, -0.23482513427734375, -0.21802902221679688, -0.20123291015625, -0.18443679809570312, -0.16764068603515625, -0.15084457397460938, -0.1340484619140625, -0.11725234985351562, -0.10045623779296875, -0.08366012573242188, -0.066864013671875, -0.050067901611328125, -0.03327178955078125, -0.016475677490234375, 0.0003204345703125, 0.017116546630859375, 0.03391265869140625, 0.050708770751953125, 0.0675048828125, 0.08430099487304688, 0.10109710693359375, 0.11789321899414062, 0.1346893310546875, 0.15148544311523438, 0.16828155517578125, 0.18507766723632812, 0.201873779296875, 0.21866989135742188, 0.23546600341796875, 0.2522621154785156, 0.2690582275390625, 0.2858543395996094, 0.30265045166015625, 0.3194465637207031, 0.33624267578125, 0.3530387878417969, 0.36983489990234375, 0.3866310119628906, 0.4034271240234375, 0.4202232360839844, 0.43701934814453125, 0.4538154602050781, 0.470611572265625, 0.4874076843261719, 0.5042037963867188, 0.5209999084472656, 0.5377960205078125, 0.5545921325683594, 0.5713882446289062, 0.5881843566894531, 0.60498046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 11.0, 14.0, 20.0, 27.0, 47.0, 54.0, 82.0, 114.0, 111.0, 106.0, 127.0, 90.0, 71.0, 41.0, 35.0, 20.0, 16.0, 6.0, 10.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.146484375, -1.105682373046875, -1.06488037109375, -1.024078369140625, -0.9832763671875, -0.942474365234375, -0.90167236328125, -0.860870361328125, -0.820068359375, -0.779266357421875, -0.73846435546875, -0.697662353515625, -0.6568603515625, -0.616058349609375, -0.57525634765625, -0.534454345703125, -0.49365234375, -0.452850341796875, -0.41204833984375, -0.371246337890625, -0.3304443359375, -0.289642333984375, -0.24884033203125, -0.208038330078125, -0.167236328125, -0.126434326171875, -0.08563232421875, -0.044830322265625, -0.0040283203125, 0.036773681640625, 0.07757568359375, 0.118377685546875, 0.1591796875, 0.199981689453125, 0.24078369140625, 0.281585693359375, 0.3223876953125, 0.363189697265625, 0.40399169921875, 0.444793701171875, 0.485595703125, 0.526397705078125, 0.56719970703125, 0.608001708984375, 0.6488037109375, 0.689605712890625, 0.73040771484375, 0.771209716796875, 0.81201171875, 0.852813720703125, 0.89361572265625, 0.934417724609375, 0.9752197265625, 1.016021728515625, 1.05682373046875, 1.097625732421875, 1.138427734375, 1.179229736328125, 1.22003173828125, 1.260833740234375, 1.3016357421875, 1.342437744140625, 1.38323974609375, 1.424041748046875, 1.46484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 5.0, 3.0, 8.0, 16.0, 12.0, 23.0, 43.0, 50.0, 91.0, 97.0, 199.0, 261.0, 405.0, 630.0, 1007.0, 1581.0, 2558.0, 4186.0, 7174.0, 12524.0, 23036.0, 43273.0, 84930.0, 164890.0, 250346.0, 209257.0, 114942.0, 58044.0, 29956.0, 16157.0, 9174.0, 5333.0, 3151.0, 1876.0, 1186.0, 766.0, 440.0, 309.0, 201.0, 139.0, 77.0, 67.0, 46.0, 27.0, 23.0, 14.0, 13.0, 6.0, 8.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.059417724609375, -0.05765581130981445, -0.055893898010253906, -0.05413198471069336, -0.05237007141113281, -0.050608158111572266, -0.04884624481201172, -0.04708433151245117, -0.045322418212890625, -0.04356050491333008, -0.04179859161376953, -0.040036678314208984, -0.03827476501464844, -0.03651285171508789, -0.034750938415527344, -0.0329890251159668, -0.03122711181640625, -0.029465198516845703, -0.027703285217285156, -0.02594137191772461, -0.024179458618164062, -0.022417545318603516, -0.02065563201904297, -0.018893718719482422, -0.017131805419921875, -0.015369892120361328, -0.013607978820800781, -0.011846065521240234, -0.010084152221679688, -0.00832223892211914, -0.006560325622558594, -0.004798412322998047, -0.0030364990234375, -0.0012745857238769531, 0.00048732757568359375, 0.0022492408752441406, 0.0040111541748046875, 0.005773067474365234, 0.007534980773925781, 0.009296894073486328, 0.011058807373046875, 0.012820720672607422, 0.014582633972167969, 0.016344547271728516, 0.018106460571289062, 0.01986837387084961, 0.021630287170410156, 0.023392200469970703, 0.02515411376953125, 0.026916027069091797, 0.028677940368652344, 0.03043985366821289, 0.03220176696777344, 0.033963680267333984, 0.03572559356689453, 0.03748750686645508, 0.039249420166015625, 0.04101133346557617, 0.04277324676513672, 0.044535160064697266, 0.04629707336425781, 0.04805898666381836, 0.049820899963378906, 0.05158281326293945, 0.0533447265625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 4.0, 11.0, 11.0, 9.0, 7.0, 15.0, 22.0, 15.0, 17.0, 14.0, 23.0, 22.0, 36.0, 38.0, 33.0, 35.0, 49.0, 51.0, 41.0, 52.0, 55.0, 38.0, 38.0, 45.0, 47.0, 33.0, 29.0, 29.0, 28.0, 21.0, 21.0, 20.0, 14.0, 9.0, 15.0, 6.0, 7.0, 9.0, 7.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.93603515625, -0.908416748046875, -0.88079833984375, -0.853179931640625, -0.8255615234375, -0.797943115234375, -0.77032470703125, -0.742706298828125, -0.715087890625, -0.687469482421875, -0.65985107421875, -0.632232666015625, -0.6046142578125, -0.576995849609375, -0.54937744140625, -0.521759033203125, -0.494140625, -0.466522216796875, -0.43890380859375, -0.411285400390625, -0.3836669921875, -0.356048583984375, -0.32843017578125, -0.300811767578125, -0.273193359375, -0.245574951171875, -0.21795654296875, -0.190338134765625, -0.1627197265625, -0.135101318359375, -0.10748291015625, -0.079864501953125, -0.05224609375, -0.024627685546875, 0.00299072265625, 0.030609130859375, 0.0582275390625, 0.085845947265625, 0.11346435546875, 0.141082763671875, 0.168701171875, 0.196319580078125, 0.22393798828125, 0.251556396484375, 0.2791748046875, 0.306793212890625, 0.33441162109375, 0.362030029296875, 0.3896484375, 0.417266845703125, 0.44488525390625, 0.472503662109375, 0.5001220703125, 0.527740478515625, 0.55535888671875, 0.582977294921875, 0.610595703125, 0.638214111328125, 0.66583251953125, 0.693450927734375, 0.7210693359375, 0.748687744140625, 0.77630615234375, 0.803924560546875, 0.83154296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 9.0, 10.0, 18.0, 21.0, 27.0, 56.0, 62.0, 135.0, 245.0, 439.0, 875.0, 2136.0, 5578.0, 19902.0, 144196.0, 737115.0, 113185.0, 16576.0, 4664.0, 1713.0, 756.0, 354.0, 169.0, 124.0, 62.0, 37.0, 22.0, 10.0, 15.0, 15.0, 8.0, 8.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.018096923828125, -0.017539262771606445, -0.01698160171508789, -0.016423940658569336, -0.01586627960205078, -0.015308618545532227, -0.014750957489013672, -0.014193296432495117, -0.013635635375976562, -0.013077974319458008, -0.012520313262939453, -0.011962652206420898, -0.011404991149902344, -0.010847330093383789, -0.010289669036865234, -0.00973200798034668, -0.009174346923828125, -0.00861668586730957, -0.008059024810791016, -0.007501363754272461, -0.006943702697753906, -0.0063860416412353516, -0.005828380584716797, -0.005270719528198242, -0.0047130584716796875, -0.004155397415161133, -0.003597736358642578, -0.0030400753021240234, -0.0024824142456054688, -0.001924753189086914, -0.0013670921325683594, -0.0008094310760498047, -0.00025177001953125, 0.0003058910369873047, 0.0008635520935058594, 0.001421213150024414, 0.0019788742065429688, 0.0025365352630615234, 0.003094196319580078, 0.003651857376098633, 0.0042095184326171875, 0.004767179489135742, 0.005324840545654297, 0.0058825016021728516, 0.006440162658691406, 0.006997823715209961, 0.007555484771728516, 0.00811314582824707, 0.008670806884765625, 0.00922846794128418, 0.009786128997802734, 0.010343790054321289, 0.010901451110839844, 0.011459112167358398, 0.012016773223876953, 0.012574434280395508, 0.013132095336914062, 0.013689756393432617, 0.014247417449951172, 0.014805078506469727, 0.015362739562988281, 0.015920400619506836, 0.01647806167602539, 0.017035722732543945, 0.0175933837890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 10.0, 14.0, 18.0, 30.0, 44.0, 51.0, 70.0, 102.0, 118.0, 123.0, 99.0, 92.0, 72.0, 56.0, 20.0, 17.0, 16.0, 12.0, 10.0, 4.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1398067474365234e-05, -2.0693987607955933e-05, -1.998990774154663e-05, -1.928582787513733e-05, -1.8581748008728027e-05, -1.7877668142318726e-05, -1.7173588275909424e-05, -1.6469508409500122e-05, -1.576542854309082e-05, -1.5061348676681519e-05, -1.4357268810272217e-05, -1.3653188943862915e-05, -1.2949109077453613e-05, -1.2245029211044312e-05, -1.154094934463501e-05, -1.0836869478225708e-05, -1.0132789611816406e-05, -9.428709745407104e-06, -8.724629878997803e-06, -8.020550012588501e-06, -7.316470146179199e-06, -6.6123902797698975e-06, -5.908310413360596e-06, -5.204230546951294e-06, -4.500150680541992e-06, -3.7960708141326904e-06, -3.0919909477233887e-06, -2.387911081314087e-06, -1.6838312149047852e-06, -9.797513484954834e-07, -2.7567148208618164e-07, 4.284083843231201e-07, 1.1324882507324219e-06, 1.8365681171417236e-06, 2.5406479835510254e-06, 3.244727849960327e-06, 3.948807716369629e-06, 4.652887582778931e-06, 5.356967449188232e-06, 6.061047315597534e-06, 6.765127182006836e-06, 7.469207048416138e-06, 8.17328691482544e-06, 8.877366781234741e-06, 9.581446647644043e-06, 1.0285526514053345e-05, 1.0989606380462646e-05, 1.1693686246871948e-05, 1.239776611328125e-05, 1.3101845979690552e-05, 1.3805925846099854e-05, 1.4510005712509155e-05, 1.5214085578918457e-05, 1.591816544532776e-05, 1.662224531173706e-05, 1.7326325178146362e-05, 1.8030405044555664e-05, 1.8734484910964966e-05, 1.9438564777374268e-05, 2.014264464378357e-05, 2.084672451019287e-05, 2.1550804376602173e-05, 2.2254884243011475e-05, 2.2958964109420776e-05, 2.3663043975830078e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 5.0, 7.0, 7.0, 16.0, 24.0, 35.0, 66.0, 116.0, 216.0, 476.0, 1063.0, 2599.0, 7869.0, 37423.0, 535249.0, 420558.0, 31575.0, 6997.0, 2360.0, 924.0, 426.0, 215.0, 113.0, 67.0, 43.0, 26.0, 18.0, 9.0, 8.0, 5.0, 8.0, 1.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.02435302734375, -0.0236358642578125, -0.022918701171875, -0.0222015380859375, -0.021484375, -0.0207672119140625, -0.020050048828125, -0.0193328857421875, -0.01861572265625, -0.0178985595703125, -0.017181396484375, -0.0164642333984375, -0.0157470703125, -0.0150299072265625, -0.014312744140625, -0.0135955810546875, -0.01287841796875, -0.0121612548828125, -0.011444091796875, -0.0107269287109375, -0.010009765625, -0.0092926025390625, -0.008575439453125, -0.0078582763671875, -0.00714111328125, -0.0064239501953125, -0.005706787109375, -0.0049896240234375, -0.0042724609375, -0.0035552978515625, -0.002838134765625, -0.0021209716796875, -0.00140380859375, -0.0006866455078125, 3.0517578125e-05, 0.0007476806640625, 0.00146484375, 0.0021820068359375, 0.002899169921875, 0.0036163330078125, 0.00433349609375, 0.0050506591796875, 0.005767822265625, 0.0064849853515625, 0.0072021484375, 0.0079193115234375, 0.008636474609375, 0.0093536376953125, 0.01007080078125, 0.0107879638671875, 0.011505126953125, 0.0122222900390625, 0.012939453125, 0.0136566162109375, 0.014373779296875, 0.0150909423828125, 0.01580810546875, 0.0165252685546875, 0.017242431640625, 0.0179595947265625, 0.0186767578125, 0.0193939208984375, 0.020111083984375, 0.0208282470703125, 0.02154541015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 9.0, 6.0, 6.0, 6.0, 13.0, 9.0, 14.0, 15.0, 23.0, 31.0, 45.0, 71.0, 117.0, 143.0, 113.0, 106.0, 69.0, 54.0, 37.0, 25.0, 18.0, 16.0, 9.0, 6.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00540924072265625, -0.005258440971374512, -0.0051076412200927734, -0.004956841468811035, -0.004806041717529297, -0.004655241966247559, -0.00450444221496582, -0.004353642463684082, -0.004202842712402344, -0.0040520429611206055, -0.003901243209838867, -0.003750443458557129, -0.0035996437072753906, -0.0034488439559936523, -0.003298044204711914, -0.0031472444534301758, -0.0029964447021484375, -0.0028456449508666992, -0.002694845199584961, -0.0025440454483032227, -0.0023932456970214844, -0.002242445945739746, -0.002091646194458008, -0.0019408464431762695, -0.0017900466918945312, -0.001639246940612793, -0.0014884471893310547, -0.0013376474380493164, -0.0011868476867675781, -0.0010360479354858398, -0.0008852481842041016, -0.0007344484329223633, -0.000583648681640625, -0.0004328489303588867, -0.00028204917907714844, -0.00013124942779541016, 1.9550323486328125e-05, 0.0001703500747680664, 0.0003211498260498047, 0.00047194957733154297, 0.0006227493286132812, 0.0007735490798950195, 0.0009243488311767578, 0.001075148582458496, 0.0012259483337402344, 0.0013767480850219727, 0.001527547836303711, 0.0016783475875854492, 0.0018291473388671875, 0.0019799470901489258, 0.002130746841430664, 0.0022815465927124023, 0.0024323463439941406, 0.002583146095275879, 0.002733945846557617, 0.0028847455978393555, 0.0030355453491210938, 0.003186345100402832, 0.0033371448516845703, 0.0034879446029663086, 0.003638744354248047, 0.003789544105529785, 0.0039403438568115234, 0.004091143608093262, 0.004241943359375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 15.0, 19.0, 26.0, 65.0, 123.0, 203.0, 187.0, 141.0, 115.0, 55.0, 15.0, 9.0, 10.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8624801635742188, -1.8193453550338745, -1.7762105464935303, -1.733075737953186, -1.6899409294128418, -1.646806240081787, -1.6036713123321533, -1.5605366230010986, -1.5174018144607544, -1.4742670059204102, -1.431132197380066, -1.3879973888397217, -1.3448625802993774, -1.3017277717590332, -1.2585930824279785, -1.2154582738876343, -1.17232346534729, -1.1291886568069458, -1.0860538482666016, -1.0429190397262573, -0.9997842907905579, -0.9566494822502136, -0.9135146737098694, -0.8703799247741699, -0.8272449970245361, -0.7841101884841919, -0.7409753799438477, -0.6978405714035034, -0.654705822467804, -0.6115710139274597, -0.5684362053871155, -0.525301456451416, -0.4821666479110718, -0.43903183937072754, -0.3958970606327057, -0.35276225209236145, -0.3096274733543396, -0.26649266481399536, -0.22335785627365112, -0.18022307753562927, -0.13708826899528503, -0.09395347535610199, -0.05081867426633835, -0.007683873176574707, 0.03545092046260834, 0.07858571410179138, 0.12172052264213562, 0.16485530138015747, 0.2079901099205017, 0.25112491846084595, 0.2942596971988678, 0.33739450573921204, 0.3805292844772339, 0.4236640930175781, 0.46679890155792236, 0.5099337100982666, 0.5530685186386108, 0.5962033271789551, 0.6393381357192993, 0.6824729442596436, 0.725607693195343, 0.7687425017356873, 0.8118773102760315, 0.855012059211731, 0.8981468677520752]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 7.0, 12.0, 11.0, 22.0, 33.0, 42.0, 61.0, 84.0, 104.0, 104.0, 123.0, 107.0, 89.0, 65.0, 54.0, 38.0, 15.0, 16.0, 8.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0613079071044922, -1.0220942497253418, -0.9828804731369019, -0.9436667561531067, -0.9044530391693115, -0.8652393221855164, -0.8260256052017212, -0.786811888217926, -0.7475981712341309, -0.7083844542503357, -0.6691707372665405, -0.6299570202827454, -0.5907433032989502, -0.551529586315155, -0.5123158693313599, -0.4731021523475647, -0.43388843536376953, -0.39467471837997437, -0.3554610013961792, -0.31624728441238403, -0.27703356742858887, -0.2378198504447937, -0.19860613346099854, -0.15939241647720337, -0.1201786994934082, -0.08096498250961304, -0.04175126552581787, -0.002537548542022705, 0.03667616844177246, 0.07588988542556763, 0.11510360240936279, 0.15431731939315796, 0.19353115558624268, 0.23274487257003784, 0.271958589553833, 0.3111723065376282, 0.35038602352142334, 0.3895997405052185, 0.42881345748901367, 0.46802717447280884, 0.507240891456604, 0.5464546084403992, 0.5856683254241943, 0.6248820424079895, 0.6640957593917847, 0.7033094763755798, 0.742523193359375, 0.7817369103431702, 0.8209506273269653, 0.8601643443107605, 0.8993780612945557, 0.9385917782783508, 0.977805495262146, 1.017019271850586, 1.0562329292297363, 1.0954465866088867, 1.1346603631973267, 1.1738741397857666, 1.213087797164917, 1.2523014545440674, 1.2915152311325073, 1.3307290077209473, 1.3699426651000977, 1.409156322479248, 1.448370099067688]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 6.0, 2.0, 12.0, 2.0, 15.0, 27.0, 29.0, 45.0, 74.0, 124.0, 218.0, 374.0, 696.0, 1290.0, 2806.0, 6597.0, 18216.0, 78246.0, 714453.0, 179801.0, 28717.0, 9239.0, 3781.0, 1751.0, 862.0, 479.0, 282.0, 155.0, 88.0, 49.0, 36.0, 26.0, 15.0, 11.0, 10.0, 3.0, 4.0, 1.0, 3.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6748046875, -0.6541595458984375, -0.633514404296875, -0.6128692626953125, -0.59222412109375, -0.5715789794921875, -0.550933837890625, -0.5302886962890625, -0.5096435546875, -0.4889984130859375, -0.468353271484375, -0.4477081298828125, -0.42706298828125, -0.4064178466796875, -0.385772705078125, -0.3651275634765625, -0.344482421875, -0.3238372802734375, -0.303192138671875, -0.2825469970703125, -0.26190185546875, -0.2412567138671875, -0.220611572265625, -0.1999664306640625, -0.1793212890625, -0.1586761474609375, -0.138031005859375, -0.1173858642578125, -0.09674072265625, -0.0760955810546875, -0.055450439453125, -0.0348052978515625, -0.01416015625, 0.0064849853515625, 0.027130126953125, 0.0477752685546875, 0.06842041015625, 0.0890655517578125, 0.109710693359375, 0.1303558349609375, 0.1510009765625, 0.1716461181640625, 0.192291259765625, 0.2129364013671875, 0.23358154296875, 0.2542266845703125, 0.274871826171875, 0.2955169677734375, 0.316162109375, 0.3368072509765625, 0.357452392578125, 0.3780975341796875, 0.39874267578125, 0.4193878173828125, 0.440032958984375, 0.4606781005859375, 0.4813232421875, 0.5019683837890625, 0.522613525390625, 0.5432586669921875, 0.56390380859375, 0.5845489501953125, 0.605194091796875, 0.6258392333984375, 0.646484375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 12.0, 5.0, 17.0, 18.0, 21.0, 43.0, 46.0, 73.0, 82.0, 95.0, 106.0, 95.0, 95.0, 83.0, 67.0, 50.0, 26.0, 14.0, 19.0, 15.0, 7.0, 10.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.04296875, -1.966400146484375, -1.88983154296875, -1.813262939453125, -1.7366943359375, -1.660125732421875, -1.58355712890625, -1.506988525390625, -1.430419921875, -1.353851318359375, -1.27728271484375, -1.200714111328125, -1.1241455078125, -1.047576904296875, -0.97100830078125, -0.894439697265625, -0.81787109375, -0.741302490234375, -0.66473388671875, -0.588165283203125, -0.5115966796875, -0.435028076171875, -0.35845947265625, -0.281890869140625, -0.205322265625, -0.128753662109375, -0.05218505859375, 0.024383544921875, 0.1009521484375, 0.177520751953125, 0.25408935546875, 0.330657958984375, 0.4072265625, 0.483795166015625, 0.56036376953125, 0.636932373046875, 0.7135009765625, 0.790069580078125, 0.86663818359375, 0.943206787109375, 1.019775390625, 1.096343994140625, 1.17291259765625, 1.249481201171875, 1.3260498046875, 1.402618408203125, 1.47918701171875, 1.555755615234375, 1.63232421875, 1.708892822265625, 1.78546142578125, 1.862030029296875, 1.9385986328125, 2.015167236328125, 2.09173583984375, 2.168304443359375, 2.244873046875, 2.321441650390625, 2.39801025390625, 2.474578857421875, 2.5511474609375, 2.627716064453125, 2.70428466796875, 2.780853271484375, 2.857421875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 3.0, 12.0, 12.0, 15.0, 14.0, 14.0, 23.0, 29.0, 41.0, 35.0, 56.0, 83.0, 139.0, 1296.0, 1036538.0, 9634.0, 204.0, 88.0, 48.0, 53.0, 44.0, 41.0, 28.0, 21.0, 15.0, 13.0, 8.0, 12.0, 6.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.30078125, -5.115966796875, -4.93115234375, -4.746337890625, -4.5615234375, -4.376708984375, -4.19189453125, -4.007080078125, -3.822265625, -3.637451171875, -3.45263671875, -3.267822265625, -3.0830078125, -2.898193359375, -2.71337890625, -2.528564453125, -2.34375, -2.158935546875, -1.97412109375, -1.789306640625, -1.6044921875, -1.419677734375, -1.23486328125, -1.050048828125, -0.865234375, -0.680419921875, -0.49560546875, -0.310791015625, -0.1259765625, 0.058837890625, 0.24365234375, 0.428466796875, 0.61328125, 0.798095703125, 0.98291015625, 1.167724609375, 1.3525390625, 1.537353515625, 1.72216796875, 1.906982421875, 2.091796875, 2.276611328125, 2.46142578125, 2.646240234375, 2.8310546875, 3.015869140625, 3.20068359375, 3.385498046875, 3.5703125, 3.755126953125, 3.93994140625, 4.124755859375, 4.3095703125, 4.494384765625, 4.67919921875, 4.864013671875, 5.048828125, 5.233642578125, 5.41845703125, 5.603271484375, 5.7880859375, 5.972900390625, 6.15771484375, 6.342529296875, 6.52734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 8.0, 4.0, 17.0, 16.0, 18.0, 20.0, 25.0, 45.0, 38.0, 52.0, 69.0, 67.0, 71.0, 81.0, 68.0, 49.0, 63.0, 57.0, 56.0, 45.0, 27.0, 27.0, 19.0, 13.0, 10.0, 8.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9638671875, -1.9016265869140625, -1.839385986328125, -1.7771453857421875, -1.71490478515625, -1.6526641845703125, -1.590423583984375, -1.5281829833984375, -1.4659423828125, -1.4037017822265625, -1.341461181640625, -1.2792205810546875, -1.21697998046875, -1.1547393798828125, -1.092498779296875, -1.0302581787109375, -0.968017578125, -0.9057769775390625, -0.843536376953125, -0.7812957763671875, -0.71905517578125, -0.6568145751953125, -0.594573974609375, -0.5323333740234375, -0.4700927734375, -0.4078521728515625, -0.345611572265625, -0.2833709716796875, -0.22113037109375, -0.1588897705078125, -0.096649169921875, -0.0344085693359375, 0.02783203125, 0.0900726318359375, 0.152313232421875, 0.2145538330078125, 0.27679443359375, 0.3390350341796875, 0.401275634765625, 0.4635162353515625, 0.5257568359375, 0.5879974365234375, 0.650238037109375, 0.7124786376953125, 0.77471923828125, 0.8369598388671875, 0.899200439453125, 0.9614410400390625, 1.023681640625, 1.0859222412109375, 1.148162841796875, 1.2104034423828125, 1.27264404296875, 1.3348846435546875, 1.397125244140625, 1.4593658447265625, 1.5216064453125, 1.5838470458984375, 1.646087646484375, 1.7083282470703125, 1.77056884765625, 1.8328094482421875, 1.895050048828125, 1.9572906494140625, 2.01953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 5.0, 4.0, 9.0, 22.0, 16.0, 30.0, 45.0, 69.0, 144.0, 320.0, 753.0, 2474.0, 9356.0, 56278.0, 837545.0, 121031.0, 15031.0, 3548.0, 1067.0, 388.0, 164.0, 95.0, 51.0, 34.0, 18.0, 12.0, 17.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24169921875, -0.23451614379882812, -0.22733306884765625, -0.22014999389648438, -0.2129669189453125, -0.20578384399414062, -0.19860076904296875, -0.19141769409179688, -0.184234619140625, -0.17705154418945312, -0.16986846923828125, -0.16268539428710938, -0.1555023193359375, -0.14831924438476562, -0.14113616943359375, -0.13395309448242188, -0.12677001953125, -0.11958694458007812, -0.11240386962890625, -0.10522079467773438, -0.0980377197265625, -0.09085464477539062, -0.08367156982421875, -0.07648849487304688, -0.069305419921875, -0.062122344970703125, -0.05493927001953125, -0.047756195068359375, -0.0405731201171875, -0.033390045166015625, -0.02620697021484375, -0.019023895263671875, -0.0118408203125, -0.004657745361328125, 0.00252532958984375, 0.009708404541015625, 0.0168914794921875, 0.024074554443359375, 0.03125762939453125, 0.038440704345703125, 0.045623779296875, 0.052806854248046875, 0.05998992919921875, 0.06717300415039062, 0.0743560791015625, 0.08153915405273438, 0.08872222900390625, 0.09590530395507812, 0.10308837890625, 0.11027145385742188, 0.11745452880859375, 0.12463760375976562, 0.1318206787109375, 0.13900375366210938, 0.14618682861328125, 0.15336990356445312, 0.160552978515625, 0.16773605346679688, 0.17491912841796875, 0.18210220336914062, 0.1892852783203125, 0.19646835327148438, 0.20365142822265625, 0.21083450317382812, 0.218017578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 2.0, 5.0, 10.0, 17.0, 9.0, 15.0, 24.0, 43.0, 66.0, 86.0, 158.0, 180.0, 121.0, 80.0, 42.0, 33.0, 36.0, 17.0, 18.0, 4.0, 9.0, 6.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.6941299438476562e-05, -2.6129186153411865e-05, -2.5317072868347168e-05, -2.450495958328247e-05, -2.3692846298217773e-05, -2.2880733013153076e-05, -2.206861972808838e-05, -2.125650644302368e-05, -2.0444393157958984e-05, -1.9632279872894287e-05, -1.882016658782959e-05, -1.8008053302764893e-05, -1.7195940017700195e-05, -1.6383826732635498e-05, -1.55717134475708e-05, -1.4759600162506104e-05, -1.3947486877441406e-05, -1.3135373592376709e-05, -1.2323260307312012e-05, -1.1511147022247314e-05, -1.0699033737182617e-05, -9.88692045211792e-06, -9.074807167053223e-06, -8.262693881988525e-06, -7.450580596923828e-06, -6.638467311859131e-06, -5.826354026794434e-06, -5.014240741729736e-06, -4.202127456665039e-06, -3.390014171600342e-06, -2.5779008865356445e-06, -1.7657876014709473e-06, -9.5367431640625e-07, -1.4156103134155273e-07, 6.705522537231445e-07, 1.4826655387878418e-06, 2.294778823852539e-06, 3.1068921089172363e-06, 3.919005393981934e-06, 4.731118679046631e-06, 5.543231964111328e-06, 6.355345249176025e-06, 7.167458534240723e-06, 7.97957181930542e-06, 8.791685104370117e-06, 9.603798389434814e-06, 1.0415911674499512e-05, 1.1228024959564209e-05, 1.2040138244628906e-05, 1.2852251529693604e-05, 1.36643648147583e-05, 1.4476478099822998e-05, 1.5288591384887695e-05, 1.6100704669952393e-05, 1.691281795501709e-05, 1.7724931240081787e-05, 1.8537044525146484e-05, 1.934915781021118e-05, 2.016127109527588e-05, 2.0973384380340576e-05, 2.1785497665405273e-05, 2.259761095046997e-05, 2.3409724235534668e-05, 2.4221837520599365e-05, 2.5033950805664062e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 6.0, 5.0, 9.0, 11.0, 15.0, 18.0, 45.0, 76.0, 143.0, 327.0, 1014.0, 3743.0, 18564.0, 203784.0, 773544.0, 38339.0, 6361.0, 1603.0, 482.0, 233.0, 104.0, 58.0, 22.0, 21.0, 6.0, 10.0, 6.0, 7.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25537109375, -0.2474365234375, -0.239501953125, -0.2315673828125, -0.2236328125, -0.2156982421875, -0.207763671875, -0.1998291015625, -0.19189453125, -0.1839599609375, -0.176025390625, -0.1680908203125, -0.16015625, -0.1522216796875, -0.144287109375, -0.1363525390625, -0.12841796875, -0.1204833984375, -0.112548828125, -0.1046142578125, -0.0966796875, -0.0887451171875, -0.080810546875, -0.0728759765625, -0.06494140625, -0.0570068359375, -0.049072265625, -0.0411376953125, -0.033203125, -0.0252685546875, -0.017333984375, -0.0093994140625, -0.00146484375, 0.0064697265625, 0.014404296875, 0.0223388671875, 0.0302734375, 0.0382080078125, 0.046142578125, 0.0540771484375, 0.06201171875, 0.0699462890625, 0.077880859375, 0.0858154296875, 0.09375, 0.1016845703125, 0.109619140625, 0.1175537109375, 0.12548828125, 0.1334228515625, 0.141357421875, 0.1492919921875, 0.1572265625, 0.1651611328125, 0.173095703125, 0.1810302734375, 0.18896484375, 0.1968994140625, 0.204833984375, 0.2127685546875, 0.220703125, 0.2286376953125, 0.236572265625, 0.2445068359375, 0.25244140625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 1.0, 3.0, 6.0, 15.0, 11.0, 10.0, 10.0, 18.0, 30.0, 31.0, 63.0, 78.0, 163.0, 247.0, 87.0, 68.0, 56.0, 27.0, 24.0, 16.0, 9.0, 5.0, 4.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0655517578125, -0.06272697448730469, -0.059902191162109375, -0.05707740783691406, -0.05425262451171875, -0.05142784118652344, -0.048603057861328125, -0.04577827453613281, -0.0429534912109375, -0.04012870788574219, -0.037303924560546875, -0.03447914123535156, -0.03165435791015625, -0.028829574584960938, -0.026004791259765625, -0.023180007934570312, -0.020355224609375, -0.017530441284179688, -0.014705657958984375, -0.011880874633789062, -0.00905609130859375, -0.0062313079833984375, -0.003406524658203125, -0.0005817413330078125, 0.0022430419921875, 0.0050678253173828125, 0.007892608642578125, 0.010717391967773438, 0.01354217529296875, 0.016366958618164062, 0.019191741943359375, 0.022016525268554688, 0.02484130859375, 0.027666091918945312, 0.030490875244140625, 0.03331565856933594, 0.03614044189453125, 0.03896522521972656, 0.041790008544921875, 0.04461479187011719, 0.0474395751953125, 0.05026435852050781, 0.053089141845703125, 0.05591392517089844, 0.05873870849609375, 0.06156349182128906, 0.06438827514648438, 0.06721305847167969, 0.070037841796875, 0.07286262512207031, 0.07568740844726562, 0.07851219177246094, 0.08133697509765625, 0.08416175842285156, 0.08698654174804688, 0.08981132507324219, 0.0926361083984375, 0.09546089172363281, 0.09828567504882812, 0.10111045837402344, 0.10393524169921875, 0.10676002502441406, 0.10958480834960938, 0.11240959167480469, 0.115234375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 28.0, 271.0, 610.0, 87.0, 12.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5170936584472656, -3.1729419231414795, -2.8287901878356934, -2.4846386909484863, -2.1404869556427, -1.796335220336914, -1.452183723449707, -1.108031988143921, -0.7638802528381348, -0.4197285771369934, -0.07557690143585205, 0.26857471466064453, 0.6127264499664307, 0.9568781852722168, 1.3010296821594238, 1.64518141746521, 1.989333152770996, 2.3334848880767822, 2.6776366233825684, 3.0217881202697754, 3.3659398555755615, 3.7100915908813477, 4.054243087768555, 4.398394584655762, 4.742546558380127, 5.086698055267334, 5.430850028991699, 5.775001525878906, 6.119153022766113, 6.4633049964904785, 6.8074564933776855, 7.151608467102051, 7.495759963989258, 7.839911460876465, 8.184062957763672, 8.528215408325195, 8.872366905212402, 9.21651840209961, 9.560669898986816, 9.904821395874023, 10.248973846435547, 10.593125343322754, 10.937276840209961, 11.281429290771484, 11.625580787658691, 11.969732284545898, 12.313883781433105, 12.658035278320312, 13.00218677520752, 13.346338272094727, 13.690489768981934, 14.03464126586914, 14.378793716430664, 14.722945213317871, 15.067096710205078, 15.411248207092285, 15.755399703979492, 16.099552154541016, 16.443702697753906, 16.78785514831543, 17.13200569152832, 17.476158142089844, 17.820308685302734, 18.164461135864258, 18.50861358642578]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 4.0, 11.0, 17.0, 23.0, 26.0, 34.0, 41.0, 50.0, 60.0, 57.0, 65.0, 71.0, 74.0, 69.0, 80.0, 80.0, 51.0, 52.0, 29.0, 31.0, 30.0, 15.0, 12.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.926835060119629, -3.7965807914733887, -3.6663265228271484, -3.536072015762329, -3.405817747116089, -3.2755634784698486, -3.1453089714050293, -3.015054702758789, -2.884800434112549, -2.7545461654663086, -2.6242918968200684, -2.494037389755249, -2.363783121109009, -2.2335288524627686, -2.103274345397949, -1.973020076751709, -1.8427658081054688, -1.7125115394592285, -1.5822571516036987, -1.452002763748169, -1.3217484951019287, -1.1914942264556885, -1.0612398386001587, -0.9309855103492737, -0.8007311820983887, -0.6704768538475037, -0.5402225255966187, -0.40996819734573364, -0.27971386909484863, -0.14945954084396362, -0.019205212593078613, 0.1110491156578064, 0.2413034439086914, 0.3715577721595764, 0.5018121004104614, 0.6320664286613464, 0.7623207569122314, 0.8925750851631165, 1.0228294134140015, 1.1530838012695312, 1.2833380699157715, 1.4135923385620117, 1.5438467264175415, 1.6741011142730713, 1.8043553829193115, 1.9346096515655518, 2.064864158630371, 2.1951184272766113, 2.3253726959228516, 2.455626964569092, 2.585881233215332, 2.7161357402801514, 2.8463900089263916, 2.976644277572632, 3.106898784637451, 3.2371530532836914, 3.3674073219299316, 3.497661590576172, 3.627915859222412, 3.7581703662872314, 3.8884246349334717, 4.018679141998291, 4.148933410644531, 4.2791876792907715, 4.409441947937012]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 5.0, 13.0, 20.0, 12.0, 19.0, 25.0, 48.0, 68.0, 105.0, 151.0, 333.0, 857.0, 1790.0, 3265.0, 7884.0, 32347.0, 438218.0, 3196758.0, 452159.0, 44461.0, 10407.0, 3155.0, 1138.0, 449.0, 202.0, 126.0, 91.0, 50.0, 32.0, 35.0, 15.0, 14.0, 12.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.537109375, -1.4883270263671875, -1.439544677734375, -1.3907623291015625, -1.34197998046875, -1.2931976318359375, -1.244415283203125, -1.1956329345703125, -1.1468505859375, -1.0980682373046875, -1.049285888671875, -1.0005035400390625, -0.95172119140625, -0.9029388427734375, -0.854156494140625, -0.8053741455078125, -0.756591796875, -0.7078094482421875, -0.659027099609375, -0.6102447509765625, -0.56146240234375, -0.5126800537109375, -0.463897705078125, -0.4151153564453125, -0.3663330078125, -0.3175506591796875, -0.268768310546875, -0.2199859619140625, -0.17120361328125, -0.1224212646484375, -0.073638916015625, -0.0248565673828125, 0.02392578125, 0.0727081298828125, 0.121490478515625, 0.1702728271484375, 0.21905517578125, 0.2678375244140625, 0.316619873046875, 0.3654022216796875, 0.4141845703125, 0.4629669189453125, 0.511749267578125, 0.5605316162109375, 0.60931396484375, 0.6580963134765625, 0.706878662109375, 0.7556610107421875, 0.804443359375, 0.8532257080078125, 0.902008056640625, 0.9507904052734375, 0.99957275390625, 1.0483551025390625, 1.097137451171875, 1.1459197998046875, 1.1947021484375, 1.2434844970703125, 1.292266845703125, 1.3410491943359375, 1.38983154296875, 1.4386138916015625, 1.487396240234375, 1.5361785888671875, 1.5849609375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 13.0, 17.0, 29.0, 37.0, 58.0, 94.0, 111.0, 142.0, 132.0, 107.0, 92.0, 58.0, 40.0, 29.0, 17.0, 10.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6025390625, -1.5428924560546875, -1.483245849609375, -1.4235992431640625, -1.36395263671875, -1.3043060302734375, -1.244659423828125, -1.1850128173828125, -1.1253662109375, -1.0657196044921875, -1.006072998046875, -0.9464263916015625, -0.88677978515625, -0.8271331787109375, -0.767486572265625, -0.7078399658203125, -0.648193359375, -0.5885467529296875, -0.528900146484375, -0.4692535400390625, -0.40960693359375, -0.3499603271484375, -0.290313720703125, -0.2306671142578125, -0.1710205078125, -0.1113739013671875, -0.051727294921875, 0.0079193115234375, 0.06756591796875, 0.1272125244140625, 0.186859130859375, 0.2465057373046875, 0.30615234375, 0.3657989501953125, 0.425445556640625, 0.4850921630859375, 0.54473876953125, 0.6043853759765625, 0.664031982421875, 0.7236785888671875, 0.7833251953125, 0.8429718017578125, 0.902618408203125, 0.9622650146484375, 1.02191162109375, 1.0815582275390625, 1.141204833984375, 1.2008514404296875, 1.260498046875, 1.3201446533203125, 1.379791259765625, 1.4394378662109375, 1.49908447265625, 1.5587310791015625, 1.618377685546875, 1.6780242919921875, 1.7376708984375, 1.7973175048828125, 1.856964111328125, 1.9166107177734375, 1.97625732421875, 2.0359039306640625, 2.095550537109375, 2.1551971435546875, 2.21484375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 10.0, 13.0, 34.0, 51.0, 113.0, 432.0, 12282.0, 4177914.0, 3015.0, 249.0, 75.0, 38.0, 25.0, 18.0, 5.0, 7.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6171875, -10.34051513671875, -10.0638427734375, -9.78717041015625, -9.510498046875, -9.23382568359375, -8.9571533203125, -8.68048095703125, -8.40380859375, -8.12713623046875, -7.8504638671875, -7.57379150390625, -7.297119140625, -7.02044677734375, -6.7437744140625, -6.46710205078125, -6.1904296875, -5.91375732421875, -5.6370849609375, -5.36041259765625, -5.083740234375, -4.80706787109375, -4.5303955078125, -4.25372314453125, -3.97705078125, -3.70037841796875, -3.4237060546875, -3.14703369140625, -2.870361328125, -2.59368896484375, -2.3170166015625, -2.04034423828125, -1.763671875, -1.48699951171875, -1.2103271484375, -0.93365478515625, -0.656982421875, -0.38031005859375, -0.1036376953125, 0.17303466796875, 0.44970703125, 0.72637939453125, 1.0030517578125, 1.27972412109375, 1.556396484375, 1.83306884765625, 2.1097412109375, 2.38641357421875, 2.6630859375, 2.93975830078125, 3.2164306640625, 3.49310302734375, 3.769775390625, 4.04644775390625, 4.3231201171875, 4.59979248046875, 4.87646484375, 5.15313720703125, 5.4298095703125, 5.70648193359375, 5.983154296875, 6.25982666015625, 6.5364990234375, 6.81317138671875, 7.08984375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 4.0, 6.0, 6.0, 18.0, 21.0, 47.0, 87.0, 203.0, 803.0, 1809.0, 675.0, 196.0, 98.0, 41.0, 28.0, 17.0, 7.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.431396484375, -0.4051551818847656, -0.37891387939453125, -0.3526725769042969, -0.3264312744140625, -0.3001899719238281, -0.27394866943359375, -0.24770736694335938, -0.221466064453125, -0.19522476196289062, -0.16898345947265625, -0.14274215698242188, -0.1165008544921875, -0.09025955200195312, -0.06401824951171875, -0.037776947021484375, -0.01153564453125, 0.014705657958984375, 0.04094696044921875, 0.06718826293945312, 0.0934295654296875, 0.11967086791992188, 0.14591217041015625, 0.17215347290039062, 0.198394775390625, 0.22463607788085938, 0.25087738037109375, 0.2771186828613281, 0.3033599853515625, 0.3296012878417969, 0.35584259033203125, 0.3820838928222656, 0.4083251953125, 0.4345664978027344, 0.46080780029296875, 0.4870491027832031, 0.5132904052734375, 0.5395317077636719, 0.5657730102539062, 0.5920143127441406, 0.618255615234375, 0.6444969177246094, 0.6707382202148438, 0.6969795227050781, 0.7232208251953125, 0.7494621276855469, 0.7757034301757812, 0.8019447326660156, 0.82818603515625, 0.8544273376464844, 0.8806686401367188, 0.9069099426269531, 0.9331512451171875, 0.9593925476074219, 0.9856338500976562, 1.0118751525878906, 1.038116455078125, 1.0643577575683594, 1.0905990600585938, 1.1168403625488281, 1.1430816650390625, 1.1693229675292969, 1.1955642700195312, 1.2218055725097656, 1.248046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 10.0, 8.0, 18.0, 30.0, 47.0, 102.0, 133.0, 175.0, 172.0, 115.0, 89.0, 39.0, 31.0, 14.0, 9.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.270559310913086, -2.2086055278778076, -2.1466519832611084, -2.08469820022583, -2.0227444171905518, -1.960790753364563, -1.8988370895385742, -1.836883306503296, -1.7749296426773071, -1.7129759788513184, -1.65102219581604, -1.5890685319900513, -1.5271148681640625, -1.4651610851287842, -1.4032074213027954, -1.3412537574768066, -1.2792999744415283, -1.2173463106155396, -1.1553925275802612, -1.0934388637542725, -1.0314850807189941, -0.9695314168930054, -0.9075777530670166, -0.8456240296363831, -0.7836703062057495, -0.721716582775116, -0.6597628593444824, -0.5978091955184937, -0.5358554720878601, -0.47390174865722656, -0.4119480550289154, -0.34999436140060425, -0.28804051876068115, -0.2260868102312088, -0.16413310170173645, -0.1021793931722641, -0.04022568464279175, 0.021728038787841797, 0.08368173241615295, 0.1456354260444641, 0.20758914947509766, 0.2695428729057312, 0.33149656653404236, 0.3934502601623535, 0.45540398359298706, 0.5173577070236206, 0.5793113708496094, 0.6412650942802429, 0.7032188177108765, 0.76517254114151, 0.8271262645721436, 0.8890799283981323, 0.9510336518287659, 1.0129873752593994, 1.0749410390853882, 1.136894702911377, 1.1988484859466553, 1.260802149772644, 1.3227559328079224, 1.3847095966339111, 1.4466633796691895, 1.5086170434951782, 1.570570707321167, 1.6325244903564453, 1.694478154182434]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 10.0, 18.0, 21.0, 40.0, 37.0, 68.0, 88.0, 94.0, 98.0, 116.0, 106.0, 94.0, 83.0, 51.0, 36.0, 17.0, 14.0, 10.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9360918998718262, -1.8711392879486084, -1.8061866760253906, -1.7412341833114624, -1.6762815713882446, -1.6113289594650269, -1.5463764667510986, -1.4814238548278809, -1.416471242904663, -1.3515186309814453, -1.2865660190582275, -1.2216135263442993, -1.1566609144210815, -1.0917083024978638, -1.0267558097839355, -0.9618031978607178, -0.8968505859375, -0.8318979740142822, -0.7669454216957092, -0.7019928693771362, -0.6370402574539185, -0.5720876455307007, -0.5071350932121277, -0.4421825110912323, -0.3772299289703369, -0.31227734684944153, -0.24732476472854614, -0.18237218260765076, -0.11741960048675537, -0.052467018365859985, 0.0124855637550354, 0.07743814587593079, 0.14239048957824707, 0.20734307169914246, 0.27229565382003784, 0.3372482359409332, 0.4022008180618286, 0.467153400182724, 0.5321059823036194, 0.5970585346221924, 0.6620111465454102, 0.7269637584686279, 0.7919163107872009, 0.8568688631057739, 0.9218214750289917, 0.9867740869522095, 1.0517265796661377, 1.1166791915893555, 1.1816318035125732, 1.246584415435791, 1.3115370273590088, 1.376489520072937, 1.4414421319961548, 1.5063947439193726, 1.5713472366333008, 1.6362998485565186, 1.7012524604797363, 1.766205072402954, 1.8311576843261719, 1.8961101770401, 1.9610627889633179, 2.026015281677246, 2.090967893600464, 2.1559205055236816, 2.2208731174468994]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 6.0, 9.0, 25.0, 37.0, 36.0, 63.0, 118.0, 236.0, 488.0, 1304.0, 6091.0, 71351.0, 843979.0, 113699.0, 8302.0, 1678.0, 570.0, 250.0, 119.0, 83.0, 38.0, 21.0, 19.0, 9.0, 7.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.387939453125, -0.3756523132324219, -0.36336517333984375, -0.3510780334472656, -0.3387908935546875, -0.3265037536621094, -0.31421661376953125, -0.3019294738769531, -0.289642333984375, -0.2773551940917969, -0.26506805419921875, -0.2527809143066406, -0.2404937744140625, -0.22820663452148438, -0.21591949462890625, -0.20363235473632812, -0.19134521484375, -0.17905807495117188, -0.16677093505859375, -0.15448379516601562, -0.1421966552734375, -0.12990951538085938, -0.11762237548828125, -0.10533523559570312, -0.093048095703125, -0.08076095581054688, -0.06847381591796875, -0.056186676025390625, -0.0438995361328125, -0.031612396240234375, -0.01932525634765625, -0.007038116455078125, 0.0052490234375, 0.017536163330078125, 0.02982330322265625, 0.042110443115234375, 0.0543975830078125, 0.06668472290039062, 0.07897186279296875, 0.09125900268554688, 0.103546142578125, 0.11583328247070312, 0.12812042236328125, 0.14040756225585938, 0.1526947021484375, 0.16498184204101562, 0.17726898193359375, 0.18955612182617188, 0.20184326171875, 0.21413040161132812, 0.22641754150390625, 0.23870468139648438, 0.2509918212890625, 0.2632789611816406, 0.27556610107421875, 0.2878532409667969, 0.300140380859375, 0.3124275207519531, 0.32471466064453125, 0.3370018005371094, 0.3492889404296875, 0.3615760803222656, 0.37386322021484375, 0.3861503601074219, 0.3984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 17.0, 28.0, 45.0, 72.0, 122.0, 124.0, 145.0, 140.0, 126.0, 83.0, 40.0, 23.0, 14.0, 9.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3876953125, -1.3372039794921875, -1.286712646484375, -1.2362213134765625, -1.18572998046875, -1.1352386474609375, -1.084747314453125, -1.0342559814453125, -0.9837646484375, -0.9332733154296875, -0.882781982421875, -0.8322906494140625, -0.78179931640625, -0.7313079833984375, -0.680816650390625, -0.6303253173828125, -0.579833984375, -0.5293426513671875, -0.478851318359375, -0.4283599853515625, -0.37786865234375, -0.3273773193359375, -0.276885986328125, -0.2263946533203125, -0.1759033203125, -0.1254119873046875, -0.074920654296875, -0.0244293212890625, 0.02606201171875, 0.0765533447265625, 0.127044677734375, 0.1775360107421875, 0.22802734375, 0.2785186767578125, 0.329010009765625, 0.3795013427734375, 0.42999267578125, 0.4804840087890625, 0.530975341796875, 0.5814666748046875, 0.6319580078125, 0.6824493408203125, 0.732940673828125, 0.7834320068359375, 0.83392333984375, 0.8844146728515625, 0.934906005859375, 0.9853973388671875, 1.035888671875, 1.0863800048828125, 1.136871337890625, 1.1873626708984375, 1.23785400390625, 1.2883453369140625, 1.338836669921875, 1.3893280029296875, 1.4398193359375, 1.4903106689453125, 1.540802001953125, 1.5912933349609375, 1.64178466796875, 1.6922760009765625, 1.742767333984375, 1.7932586669921875, 1.84375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 8.0, 9.0, 19.0, 24.0, 40.0, 42.0, 81.0, 124.0, 206.0, 323.0, 485.0, 917.0, 1540.0, 2731.0, 4795.0, 9133.0, 17311.0, 34440.0, 72370.0, 153170.0, 264890.0, 239609.0, 125796.0, 59572.0, 28544.0, 14592.0, 7650.0, 4099.0, 2447.0, 1354.0, 820.0, 499.0, 311.0, 207.0, 146.0, 83.0, 63.0, 29.0, 19.0, 20.0, 11.0, 7.0, 9.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.056976318359375, -0.055002689361572266, -0.05302906036376953, -0.0510554313659668, -0.04908180236816406, -0.04710817337036133, -0.045134544372558594, -0.04316091537475586, -0.041187286376953125, -0.03921365737915039, -0.037240028381347656, -0.03526639938354492, -0.03329277038574219, -0.03131914138793945, -0.02934551239013672, -0.027371883392333984, -0.02539825439453125, -0.023424625396728516, -0.02145099639892578, -0.019477367401123047, -0.017503738403320312, -0.015530109405517578, -0.013556480407714844, -0.01158285140991211, -0.009609222412109375, -0.007635593414306641, -0.005661964416503906, -0.003688335418701172, -0.0017147064208984375, 0.0002589225769042969, 0.0022325515747070312, 0.004206180572509766, 0.0061798095703125, 0.008153438568115234, 0.010127067565917969, 0.012100696563720703, 0.014074325561523438, 0.016047954559326172, 0.018021583557128906, 0.01999521255493164, 0.021968841552734375, 0.02394247055053711, 0.025916099548339844, 0.027889728546142578, 0.029863357543945312, 0.03183698654174805, 0.03381061553955078, 0.035784244537353516, 0.03775787353515625, 0.039731502532958984, 0.04170513153076172, 0.04367876052856445, 0.04565238952636719, 0.04762601852416992, 0.049599647521972656, 0.05157327651977539, 0.053546905517578125, 0.05552053451538086, 0.057494163513183594, 0.05946779251098633, 0.06144142150878906, 0.0634150505065918, 0.06538867950439453, 0.06736230850219727, 0.0693359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 8.0, 3.0, 0.0, 8.0, 5.0, 7.0, 9.0, 16.0, 16.0, 24.0, 16.0, 22.0, 34.0, 27.0, 34.0, 32.0, 47.0, 30.0, 43.0, 42.0, 43.0, 44.0, 42.0, 45.0, 32.0, 48.0, 38.0, 43.0, 29.0, 25.0, 22.0, 25.0, 22.0, 20.0, 17.0, 16.0, 13.0, 10.0, 9.0, 4.0, 7.0, 8.0, 4.0, 9.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.76806640625, -0.7406692504882812, -0.7132720947265625, -0.6858749389648438, -0.658477783203125, -0.6310806274414062, -0.6036834716796875, -0.5762863159179688, -0.54888916015625, -0.5214920043945312, -0.4940948486328125, -0.46669769287109375, -0.439300537109375, -0.41190338134765625, -0.3845062255859375, -0.35710906982421875, -0.3297119140625, -0.30231475830078125, -0.2749176025390625, -0.24752044677734375, -0.220123291015625, -0.19272613525390625, -0.1653289794921875, -0.13793182373046875, -0.11053466796875, -0.08313751220703125, -0.0557403564453125, -0.02834320068359375, -0.000946044921875, 0.02645111083984375, 0.0538482666015625, 0.08124542236328125, 0.108642578125, 0.13603973388671875, 0.1634368896484375, 0.19083404541015625, 0.218231201171875, 0.24562835693359375, 0.2730255126953125, 0.30042266845703125, 0.32781982421875, 0.35521697998046875, 0.3826141357421875, 0.41001129150390625, 0.437408447265625, 0.46480560302734375, 0.4922027587890625, 0.5195999145507812, 0.5469970703125, 0.5743942260742188, 0.6017913818359375, 0.6291885375976562, 0.656585693359375, 0.6839828491210938, 0.7113800048828125, 0.7387771606445312, 0.76617431640625, 0.7935714721679688, 0.8209686279296875, 0.8483657836914062, 0.875762939453125, 0.9031600952148438, 0.9305572509765625, 0.9579544067382812, 0.9853515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 15.0, 9.0, 18.0, 19.0, 32.0, 65.0, 98.0, 142.0, 318.0, 941.0, 4181.0, 30022.0, 649942.0, 340422.0, 17873.0, 2999.0, 777.0, 290.0, 124.0, 91.0, 49.0, 45.0, 30.0, 14.0, 15.0, 7.0, 7.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0192718505859375, -0.01866745948791504, -0.018063068389892578, -0.017458677291870117, -0.016854286193847656, -0.016249895095825195, -0.015645503997802734, -0.015041112899780273, -0.014436721801757812, -0.013832330703735352, -0.01322793960571289, -0.01262354850769043, -0.012019157409667969, -0.011414766311645508, -0.010810375213623047, -0.010205984115600586, -0.009601593017578125, -0.008997201919555664, -0.008392810821533203, -0.007788419723510742, -0.007184028625488281, -0.00657963752746582, -0.005975246429443359, -0.0053708553314208984, -0.0047664642333984375, -0.0041620731353759766, -0.0035576820373535156, -0.0029532909393310547, -0.0023488998413085938, -0.0017445087432861328, -0.0011401176452636719, -0.0005357265472412109, 6.866455078125e-05, 0.0006730556488037109, 0.0012774467468261719, 0.0018818378448486328, 0.0024862289428710938, 0.0030906200408935547, 0.0036950111389160156, 0.0042994022369384766, 0.0049037933349609375, 0.0055081844329833984, 0.006112575531005859, 0.00671696662902832, 0.007321357727050781, 0.007925748825073242, 0.008530139923095703, 0.009134531021118164, 0.009738922119140625, 0.010343313217163086, 0.010947704315185547, 0.011552095413208008, 0.012156486511230469, 0.01276087760925293, 0.01336526870727539, 0.013969659805297852, 0.014574050903320312, 0.015178442001342773, 0.015782833099365234, 0.016387224197387695, 0.016991615295410156, 0.017596006393432617, 0.018200397491455078, 0.01880478858947754, 0.0194091796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 18.0, 23.0, 56.0, 104.0, 152.0, 178.0, 159.0, 134.0, 87.0, 50.0, 16.0, 16.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5299530029296875e-05, -4.433281719684601e-05, -4.336610436439514e-05, -4.2399391531944275e-05, -4.143267869949341e-05, -4.046596586704254e-05, -3.9499253034591675e-05, -3.853254020214081e-05, -3.756582736968994e-05, -3.6599114537239075e-05, -3.563240170478821e-05, -3.466568887233734e-05, -3.3698976039886475e-05, -3.273226320743561e-05, -3.176555037498474e-05, -3.0798837542533875e-05, -2.9832124710083008e-05, -2.886541187763214e-05, -2.7898699045181274e-05, -2.6931986212730408e-05, -2.596527338027954e-05, -2.4998560547828674e-05, -2.4031847715377808e-05, -2.306513488292694e-05, -2.2098422050476074e-05, -2.1131709218025208e-05, -2.016499638557434e-05, -1.9198283553123474e-05, -1.8231570720672607e-05, -1.726485788822174e-05, -1.6298145055770874e-05, -1.5331432223320007e-05, -1.436471939086914e-05, -1.3398006558418274e-05, -1.2431293725967407e-05, -1.146458089351654e-05, -1.0497868061065674e-05, -9.531155228614807e-06, -8.56444239616394e-06, -7.597729563713074e-06, -6.631016731262207e-06, -5.66430389881134e-06, -4.697591066360474e-06, -3.730878233909607e-06, -2.7641654014587402e-06, -1.7974525690078735e-06, -8.307397365570068e-07, 1.3597309589385986e-07, 1.1026859283447266e-06, 2.0693987607955933e-06, 3.03611159324646e-06, 4.002824425697327e-06, 4.969537258148193e-06, 5.93625009059906e-06, 6.902962923049927e-06, 7.869675755500793e-06, 8.83638858795166e-06, 9.803101420402527e-06, 1.0769814252853394e-05, 1.173652708530426e-05, 1.2703239917755127e-05, 1.3669952750205994e-05, 1.463666558265686e-05, 1.5603378415107727e-05, 1.6570091247558594e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 10.0, 13.0, 17.0, 23.0, 42.0, 66.0, 126.0, 273.0, 623.0, 1565.0, 4488.0, 17930.0, 117746.0, 734925.0, 142551.0, 20459.0, 4809.0, 1602.0, 655.0, 259.0, 145.0, 72.0, 46.0, 31.0, 18.0, 9.0, 11.0, 1.0, 4.0, 5.0, 6.0, 0.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01439666748046875, -0.013940215110778809, -0.013483762741088867, -0.013027310371398926, -0.012570858001708984, -0.012114405632019043, -0.011657953262329102, -0.01120150089263916, -0.010745048522949219, -0.010288596153259277, -0.009832143783569336, -0.009375691413879395, -0.008919239044189453, -0.008462786674499512, -0.00800633430480957, -0.007549881935119629, -0.0070934295654296875, -0.006636977195739746, -0.006180524826049805, -0.005724072456359863, -0.005267620086669922, -0.0048111677169799805, -0.004354715347290039, -0.0038982629776000977, -0.0034418106079101562, -0.002985358238220215, -0.0025289058685302734, -0.002072453498840332, -0.0016160011291503906, -0.0011595487594604492, -0.0007030963897705078, -0.0002466440200805664, 0.000209808349609375, 0.0006662607192993164, 0.0011227130889892578, 0.0015791654586791992, 0.0020356178283691406, 0.002492070198059082, 0.0029485225677490234, 0.003404974937438965, 0.0038614273071289062, 0.004317879676818848, 0.004774332046508789, 0.0052307844161987305, 0.005687236785888672, 0.006143689155578613, 0.006600141525268555, 0.007056593894958496, 0.0075130462646484375, 0.007969498634338379, 0.00842595100402832, 0.008882403373718262, 0.009338855743408203, 0.009795308113098145, 0.010251760482788086, 0.010708212852478027, 0.011164665222167969, 0.01162111759185791, 0.012077569961547852, 0.012534022331237793, 0.012990474700927734, 0.013446927070617676, 0.013903379440307617, 0.014359831809997559, 0.0148162841796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 11.0, 3.0, 14.0, 9.0, 11.0, 10.0, 27.0, 43.0, 54.0, 68.0, 92.0, 116.0, 131.0, 121.0, 74.0, 51.0, 33.0, 24.0, 24.0, 18.0, 18.0, 9.0, 9.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0037364959716796875, -0.0036273598670959473, -0.003518223762512207, -0.003409087657928467, -0.0032999515533447266, -0.0031908154487609863, -0.003081679344177246, -0.002972543239593506, -0.0028634071350097656, -0.0027542710304260254, -0.002645134925842285, -0.002535998821258545, -0.0024268627166748047, -0.0023177266120910645, -0.0022085905075073242, -0.002099454402923584, -0.0019903182983398438, -0.0018811821937561035, -0.0017720460891723633, -0.001662909984588623, -0.0015537738800048828, -0.0014446377754211426, -0.0013355016708374023, -0.0012263655662536621, -0.0011172294616699219, -0.0010080933570861816, -0.0008989572525024414, -0.0007898211479187012, -0.0006806850433349609, -0.0005715489387512207, -0.00046241283416748047, -0.00035327672958374023, -0.000244140625, -0.00013500452041625977, -2.586841583251953e-05, 8.32676887512207e-05, 0.00019240379333496094, 0.00030153989791870117, 0.0004106760025024414, 0.0005198121070861816, 0.0006289482116699219, 0.0007380843162536621, 0.0008472204208374023, 0.0009563565254211426, 0.0010654926300048828, 0.001174628734588623, 0.0012837648391723633, 0.0013929009437561035, 0.0015020370483398438, 0.001611173152923584, 0.0017203092575073242, 0.0018294453620910645, 0.0019385814666748047, 0.002047717571258545, 0.002156853675842285, 0.0022659897804260254, 0.0023751258850097656, 0.002484261989593506, 0.002593398094177246, 0.0027025341987609863, 0.0028116703033447266, 0.002920806407928467, 0.003029942512512207, 0.0031390786170959473, 0.0032482147216796875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 5.0, 13.0, 27.0, 48.0, 119.0, 232.0, 264.0, 158.0, 73.0, 30.0, 16.0, 12.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8071820735931396, -1.7527223825454712, -1.6982625722885132, -1.6438028812408447, -1.5893431901931763, -1.5348834991455078, -1.4804236888885498, -1.4259639978408813, -1.371504306793213, -1.3170446157455444, -1.2625848054885864, -1.208125114440918, -1.1536654233932495, -1.099205732345581, -1.044745922088623, -0.9902862310409546, -0.9358264207839966, -0.8813666701316833, -0.8269069790840149, -0.7724472284317017, -0.7179875373840332, -0.66352778673172, -0.6090680360794067, -0.5546083450317383, -0.500148594379425, -0.4456888735294342, -0.39122915267944336, -0.3367694020271301, -0.2823096811771393, -0.22784996032714844, -0.1733902096748352, -0.11893048882484436, -0.06447076797485352, -0.010011039674282074, 0.04444868862628937, 0.0989084243774414, 0.15336814522743225, 0.2078278660774231, 0.26228761672973633, 0.3167473375797272, 0.371207058429718, 0.42566677927970886, 0.4801265001296997, 0.5345862507820129, 0.5890460014343262, 0.6435056924819946, 0.6979654431343079, 0.7524251937866211, 0.8068848848342896, 0.8613446354866028, 0.9158043265342712, 0.9702640771865845, 1.024723768234253, 1.079183578491211, 1.1336432695388794, 1.1881029605865479, 1.2425627708435059, 1.2970224618911743, 1.3514822721481323, 1.4059419631958008, 1.4604016542434692, 1.5148613452911377, 1.5693211555480957, 1.6237808465957642, 1.6782405376434326]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 10.0, 15.0, 24.0, 44.0, 48.0, 95.0, 122.0, 125.0, 151.0, 124.0, 104.0, 60.0, 40.0, 16.0, 13.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.363757848739624, -1.3166872262954712, -1.269616723060608, -1.222546100616455, -1.1754755973815918, -1.128404974937439, -1.0813343524932861, -1.0342638492584229, -0.9871932864189148, -0.9401227235794067, -0.8930521607398987, -0.8459815979003906, -0.7989109754562378, -0.7518404722213745, -0.7047698497772217, -0.6576992869377136, -0.6106287240982056, -0.5635581612586975, -0.5164875984191895, -0.469417005777359, -0.42234644293785095, -0.3752758800983429, -0.32820528745651245, -0.2811347246170044, -0.23406416177749634, -0.18699359893798828, -0.13992302119731903, -0.09285244345664978, -0.045781880617141724, 0.001288682222366333, 0.04835927486419678, 0.09542983770370483, 0.14250051975250244, 0.1895710825920105, 0.23664166033267975, 0.283712238073349, 0.33078280091285706, 0.3778533637523651, 0.42492395639419556, 0.4719945192337036, 0.5190650820732117, 0.5661356449127197, 0.6132062077522278, 0.6602767705917358, 0.7073473930358887, 0.754417896270752, 0.8014885187149048, 0.8485590815544128, 0.8956296443939209, 0.942700207233429, 0.989770770072937, 1.0368413925170898, 1.0839118957519531, 1.130982518196106, 1.1780531406402588, 1.225123643875122, 1.2721941471099854, 1.3192647695541382, 1.3663352727890015, 1.4134058952331543, 1.4604763984680176, 1.5075470209121704, 1.5546176433563232, 1.6016881465911865, 1.6487587690353394]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 2.0, 6.0, 4.0, 14.0, 9.0, 14.0, 30.0, 39.0, 74.0, 117.0, 288.0, 713.0, 2284.0, 10565.0, 112659.0, 848459.0, 62684.0, 7498.0, 1828.0, 679.0, 251.0, 135.0, 75.0, 40.0, 28.0, 20.0, 6.0, 6.0, 4.0, 3.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1416015625, -1.1040496826171875, -1.066497802734375, -1.0289459228515625, -0.99139404296875, -0.9538421630859375, -0.916290283203125, -0.8787384033203125, -0.8411865234375, -0.8036346435546875, -0.766082763671875, -0.7285308837890625, -0.69097900390625, -0.6534271240234375, -0.615875244140625, -0.5783233642578125, -0.540771484375, -0.5032196044921875, -0.465667724609375, -0.4281158447265625, -0.39056396484375, -0.3530120849609375, -0.315460205078125, -0.2779083251953125, -0.2403564453125, -0.2028045654296875, -0.165252685546875, -0.1277008056640625, -0.09014892578125, -0.0525970458984375, -0.015045166015625, 0.0225067138671875, 0.06005859375, 0.0976104736328125, 0.135162353515625, 0.1727142333984375, 0.21026611328125, 0.2478179931640625, 0.285369873046875, 0.3229217529296875, 0.3604736328125, 0.3980255126953125, 0.435577392578125, 0.4731292724609375, 0.51068115234375, 0.5482330322265625, 0.585784912109375, 0.6233367919921875, 0.660888671875, 0.6984405517578125, 0.735992431640625, 0.7735443115234375, 0.81109619140625, 0.8486480712890625, 0.886199951171875, 0.9237518310546875, 0.9613037109375, 0.9988555908203125, 1.036407470703125, 1.0739593505859375, 1.11151123046875, 1.1490631103515625, 1.186614990234375, 1.2241668701171875, 1.26171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 10.0, 11.0, 26.0, 32.0, 36.0, 58.0, 105.0, 97.0, 120.0, 115.0, 108.0, 92.0, 72.0, 46.0, 29.0, 20.0, 10.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.341796875, -2.26361083984375, -2.1854248046875, -2.10723876953125, -2.029052734375, -1.95086669921875, -1.8726806640625, -1.79449462890625, -1.71630859375, -1.63812255859375, -1.5599365234375, -1.48175048828125, -1.403564453125, -1.32537841796875, -1.2471923828125, -1.16900634765625, -1.0908203125, -1.01263427734375, -0.9344482421875, -0.85626220703125, -0.778076171875, -0.69989013671875, -0.6217041015625, -0.54351806640625, -0.46533203125, -0.38714599609375, -0.3089599609375, -0.23077392578125, -0.152587890625, -0.07440185546875, 0.0037841796875, 0.08197021484375, 0.16015625, 0.23834228515625, 0.3165283203125, 0.39471435546875, 0.472900390625, 0.55108642578125, 0.6292724609375, 0.70745849609375, 0.78564453125, 0.86383056640625, 0.9420166015625, 1.02020263671875, 1.098388671875, 1.17657470703125, 1.2547607421875, 1.33294677734375, 1.4111328125, 1.48931884765625, 1.5675048828125, 1.64569091796875, 1.723876953125, 1.80206298828125, 1.8802490234375, 1.95843505859375, 2.03662109375, 2.11480712890625, 2.1929931640625, 2.27117919921875, 2.349365234375, 2.42755126953125, 2.5057373046875, 2.58392333984375, 2.662109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 10.0, 12.0, 17.0, 27.0, 23.0, 40.0, 56.0, 94.0, 121.0, 218.0, 786.0, 61048.0, 982025.0, 3254.0, 297.0, 156.0, 105.0, 76.0, 58.0, 42.0, 20.0, 23.0, 11.0, 12.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.296875, -3.203277587890625, -3.10968017578125, -3.016082763671875, -2.9224853515625, -2.828887939453125, -2.73529052734375, -2.641693115234375, -2.548095703125, -2.454498291015625, -2.36090087890625, -2.267303466796875, -2.1737060546875, -2.080108642578125, -1.98651123046875, -1.892913818359375, -1.79931640625, -1.705718994140625, -1.61212158203125, -1.518524169921875, -1.4249267578125, -1.331329345703125, -1.23773193359375, -1.144134521484375, -1.050537109375, -0.956939697265625, -0.86334228515625, -0.769744873046875, -0.6761474609375, -0.582550048828125, -0.48895263671875, -0.395355224609375, -0.3017578125, -0.208160400390625, -0.11456298828125, -0.020965576171875, 0.0726318359375, 0.166229248046875, 0.25982666015625, 0.353424072265625, 0.447021484375, 0.540618896484375, 0.63421630859375, 0.727813720703125, 0.8214111328125, 0.915008544921875, 1.00860595703125, 1.102203369140625, 1.19580078125, 1.289398193359375, 1.38299560546875, 1.476593017578125, 1.5701904296875, 1.663787841796875, 1.75738525390625, 1.850982666015625, 1.944580078125, 2.038177490234375, 2.13177490234375, 2.225372314453125, 2.3189697265625, 2.412567138671875, 2.50616455078125, 2.599761962890625, 2.693359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 4.0, 1.0, 5.0, 7.0, 12.0, 9.0, 15.0, 22.0, 25.0, 37.0, 55.0, 50.0, 65.0, 74.0, 101.0, 91.0, 89.0, 64.0, 67.0, 51.0, 45.0, 37.0, 30.0, 16.0, 13.0, 7.0, 7.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.490234375, -2.42120361328125, -2.3521728515625, -2.28314208984375, -2.214111328125, -2.14508056640625, -2.0760498046875, -2.00701904296875, -1.93798828125, -1.86895751953125, -1.7999267578125, -1.73089599609375, -1.661865234375, -1.59283447265625, -1.5238037109375, -1.45477294921875, -1.3857421875, -1.31671142578125, -1.2476806640625, -1.17864990234375, -1.109619140625, -1.04058837890625, -0.9715576171875, -0.90252685546875, -0.83349609375, -0.76446533203125, -0.6954345703125, -0.62640380859375, -0.557373046875, -0.48834228515625, -0.4193115234375, -0.35028076171875, -0.28125, -0.21221923828125, -0.1431884765625, -0.07415771484375, -0.005126953125, 0.06390380859375, 0.1329345703125, 0.20196533203125, 0.27099609375, 0.34002685546875, 0.4090576171875, 0.47808837890625, 0.547119140625, 0.61614990234375, 0.6851806640625, 0.75421142578125, 0.8232421875, 0.89227294921875, 0.9613037109375, 1.03033447265625, 1.099365234375, 1.16839599609375, 1.2374267578125, 1.30645751953125, 1.37548828125, 1.44451904296875, 1.5135498046875, 1.58258056640625, 1.651611328125, 1.72064208984375, 1.7896728515625, 1.85870361328125, 1.927734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 6.0, 9.0, 24.0, 28.0, 46.0, 102.0, 226.0, 530.0, 1278.0, 3440.0, 11360.0, 48071.0, 532105.0, 395225.0, 41049.0, 9941.0, 3098.0, 1124.0, 450.0, 195.0, 97.0, 62.0, 29.0, 16.0, 12.0, 12.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.204833984375, -0.1984233856201172, -0.19201278686523438, -0.18560218811035156, -0.17919158935546875, -0.17278099060058594, -0.16637039184570312, -0.1599597930908203, -0.1535491943359375, -0.1471385955810547, -0.14072799682617188, -0.13431739807128906, -0.12790679931640625, -0.12149620056152344, -0.11508560180664062, -0.10867500305175781, -0.102264404296875, -0.09585380554199219, -0.08944320678710938, -0.08303260803222656, -0.07662200927734375, -0.07021141052246094, -0.06380081176757812, -0.05739021301269531, -0.0509796142578125, -0.04456901550292969, -0.038158416748046875, -0.03174781799316406, -0.02533721923828125, -0.018926620483398438, -0.012516021728515625, -0.0061054229736328125, 0.00030517578125, 0.0067157745361328125, 0.013126373291015625, 0.019536972045898438, 0.02594757080078125, 0.03235816955566406, 0.038768768310546875, 0.04517936706542969, 0.0515899658203125, 0.05800056457519531, 0.06441116333007812, 0.07082176208496094, 0.07723236083984375, 0.08364295959472656, 0.09005355834960938, 0.09646415710449219, 0.102874755859375, 0.10928535461425781, 0.11569595336914062, 0.12210655212402344, 0.12851715087890625, 0.13492774963378906, 0.14133834838867188, 0.1477489471435547, 0.1541595458984375, 0.1605701446533203, 0.16698074340820312, 0.17339134216308594, 0.17980194091796875, 0.18621253967285156, 0.19262313842773438, 0.1990337371826172, 0.2054443359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 6.0, 2.0, 4.0, 4.0, 9.0, 16.0, 23.0, 21.0, 29.0, 43.0, 50.0, 88.0, 116.0, 128.0, 144.0, 86.0, 61.0, 31.0, 36.0, 26.0, 21.0, 18.0, 8.0, 4.0, 4.0, 9.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.0159950256347656e-05, -2.9357150197029114e-05, -2.855435013771057e-05, -2.775155007839203e-05, -2.6948750019073486e-05, -2.6145949959754944e-05, -2.53431499004364e-05, -2.454034984111786e-05, -2.3737549781799316e-05, -2.2934749722480774e-05, -2.213194966316223e-05, -2.132914960384369e-05, -2.0526349544525146e-05, -1.9723549485206604e-05, -1.892074942588806e-05, -1.811794936656952e-05, -1.7315149307250977e-05, -1.6512349247932434e-05, -1.570954918861389e-05, -1.4906749129295349e-05, -1.4103949069976807e-05, -1.3301149010658264e-05, -1.2498348951339722e-05, -1.169554889202118e-05, -1.0892748832702637e-05, -1.0089948773384094e-05, -9.287148714065552e-06, -8.48434865474701e-06, -7.681548595428467e-06, -6.878748536109924e-06, -6.075948476791382e-06, -5.273148417472839e-06, -4.470348358154297e-06, -3.6675482988357544e-06, -2.864748239517212e-06, -2.0619481801986694e-06, -1.259148120880127e-06, -4.5634806156158447e-07, 3.46451997756958e-07, 1.1492520570755005e-06, 1.952052116394043e-06, 2.7548521757125854e-06, 3.557652235031128e-06, 4.36045229434967e-06, 5.163252353668213e-06, 5.966052412986755e-06, 6.768852472305298e-06, 7.57165253162384e-06, 8.374452590942383e-06, 9.177252650260925e-06, 9.980052709579468e-06, 1.078285276889801e-05, 1.1585652828216553e-05, 1.2388452887535095e-05, 1.3191252946853638e-05, 1.399405300617218e-05, 1.4796853065490723e-05, 1.5599653124809265e-05, 1.6402453184127808e-05, 1.720525324344635e-05, 1.8008053302764893e-05, 1.8810853362083435e-05, 1.9613653421401978e-05, 2.041645348072052e-05, 2.1219253540039062e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 14.0, 12.0, 28.0, 35.0, 51.0, 121.0, 295.0, 632.0, 1602.0, 4396.0, 14660.0, 73019.0, 747421.0, 170268.0, 25332.0, 6845.0, 2196.0, 841.0, 379.0, 189.0, 92.0, 49.0, 24.0, 9.0, 13.0, 6.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240234375, -0.2324066162109375, -0.224578857421875, -0.2167510986328125, -0.20892333984375, -0.2010955810546875, -0.193267822265625, -0.1854400634765625, -0.1776123046875, -0.1697845458984375, -0.161956787109375, -0.1541290283203125, -0.14630126953125, -0.1384735107421875, -0.130645751953125, -0.1228179931640625, -0.114990234375, -0.1071624755859375, -0.099334716796875, -0.0915069580078125, -0.08367919921875, -0.0758514404296875, -0.068023681640625, -0.0601959228515625, -0.0523681640625, -0.0445404052734375, -0.036712646484375, -0.0288848876953125, -0.02105712890625, -0.0132293701171875, -0.005401611328125, 0.0024261474609375, 0.01025390625, 0.0180816650390625, 0.025909423828125, 0.0337371826171875, 0.04156494140625, 0.0493927001953125, 0.057220458984375, 0.0650482177734375, 0.0728759765625, 0.0807037353515625, 0.088531494140625, 0.0963592529296875, 0.10418701171875, 0.1120147705078125, 0.119842529296875, 0.1276702880859375, 0.135498046875, 0.1433258056640625, 0.151153564453125, 0.1589813232421875, 0.16680908203125, 0.1746368408203125, 0.182464599609375, 0.1902923583984375, 0.1981201171875, 0.2059478759765625, 0.213775634765625, 0.2216033935546875, 0.22943115234375, 0.2372589111328125, 0.245086669921875, 0.2529144287109375, 0.2607421875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 5.0, 6.0, 6.0, 11.0, 15.0, 19.0, 16.0, 35.0, 41.0, 50.0, 80.0, 135.0, 159.0, 110.0, 87.0, 61.0, 42.0, 22.0, 17.0, 14.0, 16.0, 9.0, 7.0, 7.0, 4.0, 6.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0904541015625, -0.08758068084716797, -0.08470726013183594, -0.0818338394165039, -0.07896041870117188, -0.07608699798583984, -0.07321357727050781, -0.07034015655517578, -0.06746673583984375, -0.06459331512451172, -0.06171989440917969, -0.058846473693847656, -0.055973052978515625, -0.053099632263183594, -0.05022621154785156, -0.04735279083251953, -0.0444793701171875, -0.04160594940185547, -0.03873252868652344, -0.035859107971191406, -0.032985687255859375, -0.030112266540527344, -0.027238845825195312, -0.02436542510986328, -0.02149200439453125, -0.01861858367919922, -0.015745162963867188, -0.012871742248535156, -0.009998321533203125, -0.007124900817871094, -0.0042514801025390625, -0.0013780593872070312, 0.001495361328125, 0.004368782043457031, 0.0072422027587890625, 0.010115623474121094, 0.012989044189453125, 0.015862464904785156, 0.018735885620117188, 0.02160930633544922, 0.02448272705078125, 0.02735614776611328, 0.030229568481445312, 0.033102989196777344, 0.035976409912109375, 0.038849830627441406, 0.04172325134277344, 0.04459667205810547, 0.0474700927734375, 0.05034351348876953, 0.05321693420410156, 0.056090354919433594, 0.058963775634765625, 0.061837196350097656, 0.06471061706542969, 0.06758403778076172, 0.07045745849609375, 0.07333087921142578, 0.07620429992675781, 0.07907772064208984, 0.08195114135742188, 0.0848245620727539, 0.08769798278808594, 0.09057140350341797, 0.09344482421875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 11.0, 41.0, 228.0, 482.0, 197.0, 40.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.427452564239502, -3.205850124359131, -2.984247922897339, -2.7626454830169678, -2.541043281555176, -2.3194408416748047, -2.0978384017944336, -1.876236081123352, -1.6546337604522705, -1.433031439781189, -1.2114291191101074, -0.9898266792297363, -0.7682243585586548, -0.5466220378875732, -0.32501959800720215, -0.1034172773361206, 0.11818504333496094, 0.33978739380836487, 0.5613897442817688, 0.7829921245574951, 1.0045944452285767, 1.2261967658996582, 1.4477992057800293, 1.6694015264511108, 1.8910038471221924, 2.1126062870025635, 2.3342084884643555, 2.5558109283447266, 2.7774133682250977, 2.9990155696868896, 3.2206180095672607, 3.4422202110290527, 3.6638221740722656, 3.8854246139526367, 4.107027053833008, 4.328629493713379, 4.550231456756592, 4.771833896636963, 4.993436336517334, 5.215038776397705, 5.436640739440918, 5.658243179321289, 5.87984561920166, 6.101448059082031, 6.323050022125244, 6.544652462005615, 6.766254901885986, 6.987857341766357, 7.2094597816467285, 7.4310622215271, 7.652664661407471, 7.874266624450684, 8.095869064331055, 8.317471504211426, 8.539073944091797, 8.760676383972168, 8.982278823852539, 9.20388126373291, 9.425483703613281, 9.647086143493652, 9.868688583374023, 10.090290069580078, 10.311893463134766, 10.53349494934082, 10.755097389221191]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 11.0, 13.0, 33.0, 27.0, 55.0, 64.0, 77.0, 87.0, 86.0, 96.0, 87.0, 89.0, 84.0, 59.0, 43.0, 35.0, 19.0, 15.0, 10.0, 9.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.889156341552734, -4.727077960968018, -4.564999580383301, -4.402920722961426, -4.240842342376709, -4.078763961791992, -3.9166853427886963, -3.7546067237854004, -3.5925283432006836, -3.430449962615967, -3.268371343612671, -3.106292724609375, -2.944214344024658, -2.7821359634399414, -2.6200573444366455, -2.4579787254333496, -2.295900344848633, -2.133821964263916, -1.9717433452606201, -1.8096648454666138, -1.6475863456726074, -1.485507845878601, -1.3234293460845947, -1.1613508462905884, -0.999272346496582, -0.8371938467025757, -0.6751153469085693, -0.513036847114563, -0.35095834732055664, -0.1888798475265503, -0.026801347732543945, 0.1352771520614624, 0.29735517501831055, 0.4594336748123169, 0.6215121746063232, 0.7835906744003296, 0.9456691741943359, 1.1077476739883423, 1.2698261737823486, 1.431904673576355, 1.5939831733703613, 1.7560616731643677, 1.918140172958374, 2.08021879196167, 2.2422971725463867, 2.4043755531311035, 2.5664541721343994, 2.7285327911376953, 2.890611171722412, 3.052689552307129, 3.214768171310425, 3.3768467903137207, 3.5389251708984375, 3.7010035514831543, 3.86308217048645, 4.025160789489746, 4.187239170074463, 4.34931755065918, 4.511396408081055, 4.6734747886657715, 4.835553169250488, 4.997631549835205, 5.159709930419922, 5.321788787841797, 5.483867168426514]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 5.0, 3.0, 9.0, 23.0, 24.0, 38.0, 56.0, 82.0, 138.0, 210.0, 394.0, 814.0, 1493.0, 2908.0, 6371.0, 21676.0, 130752.0, 2303809.0, 1590697.0, 104849.0, 18756.0, 5916.0, 2511.0, 1289.0, 629.0, 324.0, 174.0, 124.0, 50.0, 42.0, 31.0, 19.0, 13.0, 17.0, 7.0, 7.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3642578125, -1.3228302001953125, -1.281402587890625, -1.2399749755859375, -1.19854736328125, -1.1571197509765625, -1.115692138671875, -1.0742645263671875, -1.0328369140625, -0.9914093017578125, -0.949981689453125, -0.9085540771484375, -0.86712646484375, -0.8256988525390625, -0.784271240234375, -0.7428436279296875, -0.701416015625, -0.6599884033203125, -0.618560791015625, -0.5771331787109375, -0.53570556640625, -0.4942779541015625, -0.452850341796875, -0.4114227294921875, -0.3699951171875, -0.3285675048828125, -0.287139892578125, -0.2457122802734375, -0.20428466796875, -0.1628570556640625, -0.121429443359375, -0.0800018310546875, -0.03857421875, 0.0028533935546875, 0.044281005859375, 0.0857086181640625, 0.12713623046875, 0.1685638427734375, 0.209991455078125, 0.2514190673828125, 0.2928466796875, 0.3342742919921875, 0.375701904296875, 0.4171295166015625, 0.45855712890625, 0.4999847412109375, 0.541412353515625, 0.5828399658203125, 0.624267578125, 0.6656951904296875, 0.707122802734375, 0.7485504150390625, 0.78997802734375, 0.8314056396484375, 0.872833251953125, 0.9142608642578125, 0.9556884765625, 0.9971160888671875, 1.038543701171875, 1.0799713134765625, 1.12139892578125, 1.1628265380859375, 1.204254150390625, 1.2456817626953125, 1.287109375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 13.0, 19.0, 20.0, 52.0, 74.0, 124.0, 161.0, 137.0, 128.0, 121.0, 78.0, 33.0, 19.0, 10.0, 8.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05078125, -1.98516845703125, -1.9195556640625, -1.85394287109375, -1.788330078125, -1.72271728515625, -1.6571044921875, -1.59149169921875, -1.52587890625, -1.46026611328125, -1.3946533203125, -1.32904052734375, -1.263427734375, -1.19781494140625, -1.1322021484375, -1.06658935546875, -1.0009765625, -0.93536376953125, -0.8697509765625, -0.80413818359375, -0.738525390625, -0.67291259765625, -0.6072998046875, -0.54168701171875, -0.47607421875, -0.41046142578125, -0.3448486328125, -0.27923583984375, -0.213623046875, -0.14801025390625, -0.0823974609375, -0.01678466796875, 0.048828125, 0.11444091796875, 0.1800537109375, 0.24566650390625, 0.311279296875, 0.37689208984375, 0.4425048828125, 0.50811767578125, 0.57373046875, 0.63934326171875, 0.7049560546875, 0.77056884765625, 0.836181640625, 0.90179443359375, 0.9674072265625, 1.03302001953125, 1.0986328125, 1.16424560546875, 1.2298583984375, 1.29547119140625, 1.361083984375, 1.42669677734375, 1.4923095703125, 1.55792236328125, 1.62353515625, 1.68914794921875, 1.7547607421875, 1.82037353515625, 1.885986328125, 1.95159912109375, 2.0172119140625, 2.08282470703125, 2.1484375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 9.0, 12.0, 10.0, 19.0, 53.0, 108.0, 203.0, 590.0, 3444.0, 2452305.0, 1733394.0, 3217.0, 567.0, 162.0, 91.0, 52.0, 24.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.578125, -4.42547607421875, -4.2728271484375, -4.12017822265625, -3.967529296875, -3.81488037109375, -3.6622314453125, -3.50958251953125, -3.35693359375, -3.20428466796875, -3.0516357421875, -2.89898681640625, -2.746337890625, -2.59368896484375, -2.4410400390625, -2.28839111328125, -2.1357421875, -1.98309326171875, -1.8304443359375, -1.67779541015625, -1.525146484375, -1.37249755859375, -1.2198486328125, -1.06719970703125, -0.91455078125, -0.76190185546875, -0.6092529296875, -0.45660400390625, -0.303955078125, -0.15130615234375, 0.0013427734375, 0.15399169921875, 0.306640625, 0.45928955078125, 0.6119384765625, 0.76458740234375, 0.917236328125, 1.06988525390625, 1.2225341796875, 1.37518310546875, 1.52783203125, 1.68048095703125, 1.8331298828125, 1.98577880859375, 2.138427734375, 2.29107666015625, 2.4437255859375, 2.59637451171875, 2.7490234375, 2.90167236328125, 3.0543212890625, 3.20697021484375, 3.359619140625, 3.51226806640625, 3.6649169921875, 3.81756591796875, 3.97021484375, 4.12286376953125, 4.2755126953125, 4.42816162109375, 4.580810546875, 4.73345947265625, 4.8861083984375, 5.03875732421875, 5.19140625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 13.0, 28.0, 28.0, 79.0, 117.0, 386.0, 1364.0, 1354.0, 382.0, 146.0, 64.0, 42.0, 24.0, 7.0, 8.0, 5.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7177734375, -0.6966781616210938, -0.6755828857421875, -0.6544876098632812, -0.633392333984375, -0.6122970581054688, -0.5912017822265625, -0.5701065063476562, -0.54901123046875, -0.5279159545898438, -0.5068206787109375, -0.48572540283203125, -0.464630126953125, -0.44353485107421875, -0.4224395751953125, -0.40134429931640625, -0.3802490234375, -0.35915374755859375, -0.3380584716796875, -0.31696319580078125, -0.295867919921875, -0.27477264404296875, -0.2536773681640625, -0.23258209228515625, -0.21148681640625, -0.19039154052734375, -0.1692962646484375, -0.14820098876953125, -0.127105712890625, -0.10601043701171875, -0.0849151611328125, -0.06381988525390625, -0.042724609375, -0.02162933349609375, -0.0005340576171875, 0.02056121826171875, 0.041656494140625, 0.06275177001953125, 0.0838470458984375, 0.10494232177734375, 0.12603759765625, 0.14713287353515625, 0.1682281494140625, 0.18932342529296875, 0.210418701171875, 0.23151397705078125, 0.2526092529296875, 0.27370452880859375, 0.2947998046875, 0.31589508056640625, 0.3369903564453125, 0.35808563232421875, 0.379180908203125, 0.40027618408203125, 0.4213714599609375, 0.44246673583984375, 0.46356201171875, 0.48465728759765625, 0.5057525634765625, 0.5268478393554688, 0.547943115234375, 0.5690383911132812, 0.5901336669921875, 0.6112289428710938, 0.63232421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 13.0, 14.0, 22.0, 47.0, 105.0, 236.0, 224.0, 154.0, 107.0, 39.0, 20.0, 11.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.651780605316162, -2.5764214992523193, -2.5010623931884766, -2.425703525543213, -2.35034441947937, -2.2749853134155273, -2.1996264457702637, -2.124267339706421, -2.048908233642578, -1.9735491275787354, -1.8981901407241821, -1.822831153869629, -1.7474720478057861, -1.6721129417419434, -1.5967539548873901, -1.521394968032837, -1.4460358619689941, -1.3706767559051514, -1.2953177690505981, -1.219958782196045, -1.1445996761322021, -1.0692405700683594, -0.9938815832138062, -0.9185225367546082, -0.8431634902954102, -0.7678044438362122, -0.6924453973770142, -0.6170863509178162, -0.5417273044586182, -0.46636825799942017, -0.39100921154022217, -0.31565016508102417, -0.24029135704040527, -0.16493231058120728, -0.08957326412200928, -0.01421421766281128, 0.06114482879638672, 0.13650387525558472, 0.21186292171478271, 0.2872219681739807, 0.3625810146331787, 0.4379400610923767, 0.5132991075515747, 0.5886581540107727, 0.6640172004699707, 0.7393762469291687, 0.8147352933883667, 0.8900943398475647, 0.9654533863067627, 1.0408124923706055, 1.1161714792251587, 1.191530466079712, 1.2668895721435547, 1.3422486782073975, 1.4176076650619507, 1.492966651916504, 1.5683257579803467, 1.6436848640441895, 1.7190438508987427, 1.794402837753296, 1.8697619438171387, 1.9451210498809814, 2.020480155944824, 2.095839023590088, 2.1711981296539307]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 13.0, 15.0, 18.0, 38.0, 40.0, 71.0, 116.0, 119.0, 107.0, 123.0, 115.0, 87.0, 52.0, 43.0, 28.0, 14.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9467259645462036, -1.8782237768173218, -1.8097214698791504, -1.7412192821502686, -1.6727169752120972, -1.6042147874832153, -1.535712480545044, -1.467210292816162, -1.3987081050872803, -1.3302059173583984, -1.261703610420227, -1.1932014226913452, -1.1246991157531738, -1.056196928024292, -0.9876946806907654, -0.9191924333572388, -0.8506901264190674, -0.7821878790855408, -0.7136856317520142, -0.6451834440231323, -0.5766811370849609, -0.5081789493560791, -0.4396767020225525, -0.3711744546890259, -0.30267220735549927, -0.23416996002197266, -0.16566772758960724, -0.09716549515724182, -0.02866324782371521, 0.0398389995098114, 0.10834121704101562, 0.17684346437454224, 0.2453458309173584, 0.313848078250885, 0.3823503255844116, 0.45085254311561584, 0.5193548202514648, 0.5878570079803467, 0.6563592553138733, 0.7248615026473999, 0.7933637499809265, 0.8618659973144531, 0.9303682446479797, 0.9988704919815063, 1.0673726797103882, 1.1358749866485596, 1.2043771743774414, 1.2728793621063232, 1.3413816690444946, 1.4098838567733765, 1.4783861637115479, 1.5468883514404297, 1.615390658378601, 1.683892846107483, 1.7523951530456543, 1.8208973407745361, 1.889399528503418, 1.9579017162322998, 2.0264039039611816, 2.0949063301086426, 2.1634085178375244, 2.2319107055664062, 2.300412893295288, 2.36891508102417, 2.437417507171631]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 15.0, 15.0, 14.0, 25.0, 31.0, 66.0, 84.0, 138.0, 285.0, 493.0, 1153.0, 3413.0, 14386.0, 104432.0, 709971.0, 185243.0, 21352.0, 4572.0, 1431.0, 621.0, 307.0, 186.0, 104.0, 64.0, 42.0, 33.0, 17.0, 14.0, 9.0, 8.0, 9.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.286865234375, -0.2783317565917969, -0.26979827880859375, -0.2612648010253906, -0.2527313232421875, -0.24419784545898438, -0.23566436767578125, -0.22713088989257812, -0.218597412109375, -0.21006393432617188, -0.20153045654296875, -0.19299697875976562, -0.1844635009765625, -0.17593002319335938, -0.16739654541015625, -0.15886306762695312, -0.15032958984375, -0.14179611206054688, -0.13326263427734375, -0.12472915649414062, -0.1161956787109375, -0.10766220092773438, -0.09912872314453125, -0.09059524536132812, -0.082061767578125, -0.07352828979492188, -0.06499481201171875, -0.056461334228515625, -0.0479278564453125, -0.039394378662109375, -0.03086090087890625, -0.022327423095703125, -0.0137939453125, -0.005260467529296875, 0.00327301025390625, 0.011806488037109375, 0.0203399658203125, 0.028873443603515625, 0.03740692138671875, 0.045940399169921875, 0.054473876953125, 0.06300735473632812, 0.07154083251953125, 0.08007431030273438, 0.0886077880859375, 0.09714126586914062, 0.10567474365234375, 0.11420822143554688, 0.12274169921875, 0.13127517700195312, 0.13980865478515625, 0.14834213256835938, 0.1568756103515625, 0.16540908813476562, 0.17394256591796875, 0.18247604370117188, 0.191009521484375, 0.19954299926757812, 0.20807647705078125, 0.21660995483398438, 0.2251434326171875, 0.23367691040039062, 0.24221038818359375, 0.2507438659667969, 0.25927734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 10.0, 4.0, 14.0, 33.0, 30.0, 68.0, 96.0, 126.0, 123.0, 121.0, 138.0, 102.0, 59.0, 35.0, 25.0, 12.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21484375, -1.167938232421875, -1.12103271484375, -1.074127197265625, -1.0272216796875, -0.980316162109375, -0.93341064453125, -0.886505126953125, -0.839599609375, -0.792694091796875, -0.74578857421875, -0.698883056640625, -0.6519775390625, -0.605072021484375, -0.55816650390625, -0.511260986328125, -0.46435546875, -0.417449951171875, -0.37054443359375, -0.323638916015625, -0.2767333984375, -0.229827880859375, -0.18292236328125, -0.136016845703125, -0.089111328125, -0.042205810546875, 0.00469970703125, 0.051605224609375, 0.0985107421875, 0.145416259765625, 0.19232177734375, 0.239227294921875, 0.2861328125, 0.333038330078125, 0.37994384765625, 0.426849365234375, 0.4737548828125, 0.520660400390625, 0.56756591796875, 0.614471435546875, 0.661376953125, 0.708282470703125, 0.75518798828125, 0.802093505859375, 0.8489990234375, 0.895904541015625, 0.94281005859375, 0.989715576171875, 1.03662109375, 1.083526611328125, 1.13043212890625, 1.177337646484375, 1.2242431640625, 1.271148681640625, 1.31805419921875, 1.364959716796875, 1.411865234375, 1.458770751953125, 1.50567626953125, 1.552581787109375, 1.5994873046875, 1.646392822265625, 1.69329833984375, 1.740203857421875, 1.787109375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 9.0, 5.0, 15.0, 15.0, 22.0, 37.0, 40.0, 82.0, 96.0, 200.0, 322.0, 638.0, 1142.0, 2543.0, 5834.0, 14326.0, 39461.0, 120339.0, 343809.0, 337947.0, 117985.0, 38466.0, 14076.0, 5861.0, 2512.0, 1245.0, 597.0, 348.0, 173.0, 118.0, 95.0, 59.0, 36.0, 25.0, 17.0, 15.0, 10.0, 10.0, 10.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1002197265625, -0.09676265716552734, -0.09330558776855469, -0.08984851837158203, -0.08639144897460938, -0.08293437957763672, -0.07947731018066406, -0.0760202407836914, -0.07256317138671875, -0.0691061019897461, -0.06564903259277344, -0.06219196319580078, -0.058734893798828125, -0.05527782440185547, -0.05182075500488281, -0.048363685607910156, -0.0449066162109375, -0.041449546813964844, -0.03799247741699219, -0.03453540802001953, -0.031078338623046875, -0.02762126922607422, -0.024164199829101562, -0.020707130432128906, -0.01725006103515625, -0.013792991638183594, -0.010335922241210938, -0.006878852844238281, -0.003421783447265625, 3.528594970703125e-05, 0.0034923553466796875, 0.006949424743652344, 0.010406494140625, 0.013863563537597656, 0.017320632934570312, 0.02077770233154297, 0.024234771728515625, 0.02769184112548828, 0.031148910522460938, 0.034605979919433594, 0.03806304931640625, 0.041520118713378906, 0.04497718811035156, 0.04843425750732422, 0.051891326904296875, 0.05534839630126953, 0.05880546569824219, 0.062262535095214844, 0.0657196044921875, 0.06917667388916016, 0.07263374328613281, 0.07609081268310547, 0.07954788208007812, 0.08300495147705078, 0.08646202087402344, 0.0899190902709961, 0.09337615966796875, 0.0968332290649414, 0.10029029846191406, 0.10374736785888672, 0.10720443725585938, 0.11066150665283203, 0.11411857604980469, 0.11757564544677734, 0.12103271484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 13.0, 19.0, 27.0, 35.0, 33.0, 53.0, 65.0, 62.0, 63.0, 69.0, 79.0, 82.0, 75.0, 62.0, 63.0, 38.0, 41.0, 35.0, 16.0, 17.0, 14.0, 11.0, 6.0, 7.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3115234375, -1.2532501220703125, -1.194976806640625, -1.1367034912109375, -1.07843017578125, -1.0201568603515625, -0.961883544921875, -0.9036102294921875, -0.8453369140625, -0.7870635986328125, -0.728790283203125, -0.6705169677734375, -0.61224365234375, -0.5539703369140625, -0.495697021484375, -0.4374237060546875, -0.379150390625, -0.3208770751953125, -0.262603759765625, -0.2043304443359375, -0.14605712890625, -0.0877838134765625, -0.029510498046875, 0.0287628173828125, 0.0870361328125, 0.1453094482421875, 0.203582763671875, 0.2618560791015625, 0.32012939453125, 0.3784027099609375, 0.436676025390625, 0.4949493408203125, 0.55322265625, 0.6114959716796875, 0.669769287109375, 0.7280426025390625, 0.78631591796875, 0.8445892333984375, 0.902862548828125, 0.9611358642578125, 1.0194091796875, 1.0776824951171875, 1.135955810546875, 1.1942291259765625, 1.25250244140625, 1.3107757568359375, 1.369049072265625, 1.4273223876953125, 1.485595703125, 1.5438690185546875, 1.602142333984375, 1.6604156494140625, 1.71868896484375, 1.7769622802734375, 1.835235595703125, 1.8935089111328125, 1.9517822265625, 2.0100555419921875, 2.068328857421875, 2.1266021728515625, 2.18487548828125, 2.2431488037109375, 2.301422119140625, 2.3596954345703125, 2.41796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 20.0, 32.0, 45.0, 60.0, 79.0, 176.0, 341.0, 678.0, 1814.0, 6485.0, 37403.0, 497178.0, 460248.0, 34766.0, 6139.0, 1705.0, 600.0, 309.0, 170.0, 105.0, 66.0, 43.0, 25.0, 17.0, 10.0, 10.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0211639404296875, -0.020480871200561523, -0.019797801971435547, -0.01911473274230957, -0.018431663513183594, -0.017748594284057617, -0.01706552505493164, -0.016382455825805664, -0.015699386596679688, -0.015016317367553711, -0.014333248138427734, -0.013650178909301758, -0.012967109680175781, -0.012284040451049805, -0.011600971221923828, -0.010917901992797852, -0.010234832763671875, -0.009551763534545898, -0.008868694305419922, -0.008185625076293945, -0.007502555847167969, -0.006819486618041992, -0.006136417388916016, -0.005453348159790039, -0.0047702789306640625, -0.004087209701538086, -0.0034041404724121094, -0.002721071243286133, -0.0020380020141601562, -0.0013549327850341797, -0.0006718635559082031, 1.1205673217773438e-05, 0.00069427490234375, 0.0013773441314697266, 0.002060413360595703, 0.0027434825897216797, 0.0034265518188476562, 0.004109621047973633, 0.004792690277099609, 0.005475759506225586, 0.0061588287353515625, 0.006841897964477539, 0.007524967193603516, 0.008208036422729492, 0.008891105651855469, 0.009574174880981445, 0.010257244110107422, 0.010940313339233398, 0.011623382568359375, 0.012306451797485352, 0.012989521026611328, 0.013672590255737305, 0.014355659484863281, 0.015038728713989258, 0.015721797943115234, 0.01640486717224121, 0.017087936401367188, 0.017771005630493164, 0.01845407485961914, 0.019137144088745117, 0.019820213317871094, 0.02050328254699707, 0.021186351776123047, 0.021869421005249023, 0.022552490234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 10.0, 18.0, 21.0, 35.0, 64.0, 68.0, 123.0, 120.0, 127.0, 118.0, 78.0, 68.0, 57.0, 28.0, 19.0, 16.0, 7.0, 5.0, 7.0, 7.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.415346145629883e-05, -3.323797136545181e-05, -3.23224812746048e-05, -3.140699118375778e-05, -3.0491501092910767e-05, -2.957601100206375e-05, -2.8660520911216736e-05, -2.774503082036972e-05, -2.6829540729522705e-05, -2.591405063867569e-05, -2.4998560547828674e-05, -2.408307045698166e-05, -2.3167580366134644e-05, -2.2252090275287628e-05, -2.1336600184440613e-05, -2.0421110093593597e-05, -1.9505620002746582e-05, -1.8590129911899567e-05, -1.767463982105255e-05, -1.6759149730205536e-05, -1.584365963935852e-05, -1.4928169548511505e-05, -1.401267945766449e-05, -1.3097189366817474e-05, -1.2181699275970459e-05, -1.1266209185123444e-05, -1.0350719094276428e-05, -9.435229003429413e-06, -8.519738912582397e-06, -7.604248821735382e-06, -6.688758730888367e-06, -5.773268640041351e-06, -4.857778549194336e-06, -3.9422884583473206e-06, -3.026798367500305e-06, -2.11130827665329e-06, -1.1958181858062744e-06, -2.8032809495925903e-07, 6.351619958877563e-07, 1.5506520867347717e-06, 2.466142177581787e-06, 3.3816322684288025e-06, 4.297122359275818e-06, 5.212612450122833e-06, 6.128102540969849e-06, 7.043592631816864e-06, 7.95908272266388e-06, 8.874572813510895e-06, 9.79006290435791e-06, 1.0705552995204926e-05, 1.1621043086051941e-05, 1.2536533176898956e-05, 1.3452023267745972e-05, 1.4367513358592987e-05, 1.5283003449440002e-05, 1.6198493540287018e-05, 1.7113983631134033e-05, 1.802947372198105e-05, 1.8944963812828064e-05, 1.986045390367508e-05, 2.0775943994522095e-05, 2.169143408536911e-05, 2.2606924176216125e-05, 2.352241426706314e-05, 2.4437904357910156e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 6.0, 8.0, 8.0, 12.0, 17.0, 20.0, 33.0, 45.0, 60.0, 143.0, 431.0, 1126.0, 3886.0, 17398.0, 145028.0, 785686.0, 78266.0, 11970.0, 2876.0, 881.0, 302.0, 143.0, 69.0, 42.0, 26.0, 19.0, 12.0, 13.0, 7.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026519775390625, -0.025700807571411133, -0.024881839752197266, -0.0240628719329834, -0.02324390411376953, -0.022424936294555664, -0.021605968475341797, -0.02078700065612793, -0.019968032836914062, -0.019149065017700195, -0.018330097198486328, -0.01751112937927246, -0.016692161560058594, -0.015873193740844727, -0.01505422592163086, -0.014235258102416992, -0.013416290283203125, -0.012597322463989258, -0.01177835464477539, -0.010959386825561523, -0.010140419006347656, -0.009321451187133789, -0.008502483367919922, -0.007683515548706055, -0.0068645477294921875, -0.00604557991027832, -0.005226612091064453, -0.004407644271850586, -0.0035886764526367188, -0.0027697086334228516, -0.0019507408142089844, -0.0011317729949951172, -0.00031280517578125, 0.0005061626434326172, 0.0013251304626464844, 0.0021440982818603516, 0.0029630661010742188, 0.003782033920288086, 0.004601001739501953, 0.00541996955871582, 0.0062389373779296875, 0.007057905197143555, 0.007876873016357422, 0.008695840835571289, 0.009514808654785156, 0.010333776473999023, 0.01115274429321289, 0.011971712112426758, 0.012790679931640625, 0.013609647750854492, 0.01442861557006836, 0.015247583389282227, 0.016066551208496094, 0.01688551902770996, 0.017704486846923828, 0.018523454666137695, 0.019342422485351562, 0.02016139030456543, 0.020980358123779297, 0.021799325942993164, 0.02261829376220703, 0.0234372615814209, 0.024256229400634766, 0.025075197219848633, 0.0258941650390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 4.0, 9.0, 8.0, 14.0, 19.0, 20.0, 33.0, 34.0, 62.0, 73.0, 131.0, 155.0, 113.0, 79.0, 56.0, 44.0, 26.0, 17.0, 21.0, 15.0, 12.0, 14.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005298614501953125, -0.005112886428833008, -0.004927158355712891, -0.0047414302825927734, -0.004555702209472656, -0.004369974136352539, -0.004184246063232422, -0.003998517990112305, -0.0038127899169921875, -0.0036270618438720703, -0.003441333770751953, -0.003255605697631836, -0.0030698776245117188, -0.0028841495513916016, -0.0026984214782714844, -0.002512693405151367, -0.00232696533203125, -0.002141237258911133, -0.0019555091857910156, -0.0017697811126708984, -0.0015840530395507812, -0.001398324966430664, -0.0012125968933105469, -0.0010268688201904297, -0.0008411407470703125, -0.0006554126739501953, -0.0004696846008300781, -0.00028395652770996094, -9.822845458984375e-05, 8.749961853027344e-05, 0.0002732276916503906, 0.0004589557647705078, 0.000644683837890625, 0.0008304119110107422, 0.0010161399841308594, 0.0012018680572509766, 0.0013875961303710938, 0.001573324203491211, 0.0017590522766113281, 0.0019447803497314453, 0.0021305084228515625, 0.0023162364959716797, 0.002501964569091797, 0.002687692642211914, 0.0028734207153320312, 0.0030591487884521484, 0.0032448768615722656, 0.003430604934692383, 0.0036163330078125, 0.003802061080932617, 0.003987789154052734, 0.0041735172271728516, 0.004359245300292969, 0.004544973373413086, 0.004730701446533203, 0.00491642951965332, 0.0051021575927734375, 0.005287885665893555, 0.005473613739013672, 0.005659341812133789, 0.005845069885253906, 0.0060307979583740234, 0.006216526031494141, 0.006402254104614258, 0.006587982177734375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 11.0, 22.0, 46.0, 128.0, 321.0, 278.0, 132.0, 36.0, 20.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9554336071014404, -1.8900532722473145, -1.824673056602478, -1.759292721748352, -1.6939125061035156, -1.6285321712493896, -1.5631518363952637, -1.4977716207504272, -1.4323914051055908, -1.3670110702514648, -1.3016308546066284, -1.2362505197525024, -1.170870304107666, -1.10548996925354, -1.040109634399414, -0.9747294187545776, -0.9093490839004517, -0.8439688086509705, -0.7785885334014893, -0.7132081985473633, -0.6478279829025269, -0.5824476480484009, -0.5170673727989197, -0.4516870975494385, -0.3863068222999573, -0.3209265470504761, -0.2555462718009949, -0.19016596674919128, -0.12478569149971008, -0.05940541625022888, 0.005974888801574707, 0.07135516405105591, 0.1367354393005371, 0.2021157145500183, 0.2674959897994995, 0.3328762948513031, 0.3982565701007843, 0.4636368453502655, 0.5290171504020691, 0.5943974256515503, 0.6597777009010315, 0.7251579761505127, 0.7905382513999939, 0.8559185266494751, 0.9212988615036011, 0.9866790771484375, 1.0520594120025635, 1.1174397468566895, 1.1828199625015259, 1.2482002973556519, 1.3135805130004883, 1.3789608478546143, 1.4443410634994507, 1.5097213983535767, 1.575101613998413, 1.640481948852539, 1.705862283706665, 1.771242618560791, 1.8366228342056274, 1.9020031690597534, 1.9673833847045898, 2.032763719558716, 2.098144054412842, 2.1635241508483887, 2.2289044857025146]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 15.0, 19.0, 24.0, 47.0, 75.0, 131.0, 156.0, 131.0, 153.0, 108.0, 66.0, 42.0, 24.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4211900234222412, -1.3691729307174683, -1.3171558380126953, -1.2651387453079224, -1.2131216526031494, -1.161104679107666, -1.109087586402893, -1.0570704936981201, -1.0050534009933472, -0.9530363082885742, -0.9010192155838013, -0.8490021824836731, -0.7969850897789001, -0.7449679970741272, -0.692950963973999, -0.6409338712692261, -0.5889167785644531, -0.5368996858596802, -0.4848826229572296, -0.43286556005477905, -0.3808484673500061, -0.32883137464523315, -0.2768143117427826, -0.22479724884033203, -0.17278015613555908, -0.12076307833194733, -0.06874600052833557, -0.016728922724723816, 0.03528815507888794, 0.08730524778366089, 0.13932231068611145, 0.191339373588562, 0.2433563470840454, 0.29537343978881836, 0.3473905026912689, 0.3994075655937195, 0.45142465829849243, 0.5034417510032654, 0.5554587841033936, 0.6074758768081665, 0.6594929695129395, 0.7115100622177124, 0.7635271549224854, 0.8155441880226135, 0.8675612807273865, 0.9195783734321594, 0.9715954065322876, 1.0236124992370605, 1.0756295919418335, 1.1276466846466064, 1.1796637773513794, 1.2316808700561523, 1.2836978435516357, 1.3357150554656982, 1.3877320289611816, 1.4397491216659546, 1.4917662143707275, 1.5437833070755005, 1.5958003997802734, 1.6478174924850464, 1.6998345851898193, 1.7518515586853027, 1.8038686513900757, 1.8558857440948486, 1.9079028367996216]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 13.0, 16.0, 16.0, 34.0, 53.0, 118.0, 185.0, 444.0, 1364.0, 5221.0, 24958.0, 303964.0, 663611.0, 38453.0, 7186.0, 1825.0, 617.0, 201.0, 92.0, 67.0, 35.0, 22.0, 11.0, 8.0, 5.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81787109375, -0.7887802124023438, -0.7596893310546875, -0.7305984497070312, -0.701507568359375, -0.6724166870117188, -0.6433258056640625, -0.6142349243164062, -0.58514404296875, -0.5560531616210938, -0.5269622802734375, -0.49787139892578125, -0.468780517578125, -0.43968963623046875, -0.4105987548828125, -0.38150787353515625, -0.3524169921875, -0.32332611083984375, -0.2942352294921875, -0.26514434814453125, -0.236053466796875, -0.20696258544921875, -0.1778717041015625, -0.14878082275390625, -0.11968994140625, -0.09059906005859375, -0.0615081787109375, -0.03241729736328125, -0.003326416015625, 0.02576446533203125, 0.0548553466796875, 0.08394622802734375, 0.113037109375, 0.14212799072265625, 0.1712188720703125, 0.20030975341796875, 0.229400634765625, 0.25849151611328125, 0.2875823974609375, 0.31667327880859375, 0.34576416015625, 0.37485504150390625, 0.4039459228515625, 0.43303680419921875, 0.462127685546875, 0.49121856689453125, 0.5203094482421875, 0.5494003295898438, 0.5784912109375, 0.6075820922851562, 0.6366729736328125, 0.6657638549804688, 0.694854736328125, 0.7239456176757812, 0.7530364990234375, 0.7821273803710938, 0.81121826171875, 0.8403091430664062, 0.8694000244140625, 0.8984909057617188, 0.927581787109375, 0.9566726684570312, 0.9857635498046875, 1.0148544311523438, 1.0439453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 9.0, 13.0, 22.0, 30.0, 43.0, 72.0, 108.0, 129.0, 112.0, 119.0, 122.0, 80.0, 59.0, 34.0, 24.0, 16.0, 5.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.02734375, -1.941558837890625, -1.85577392578125, -1.769989013671875, -1.6842041015625, -1.598419189453125, -1.51263427734375, -1.426849365234375, -1.341064453125, -1.255279541015625, -1.16949462890625, -1.083709716796875, -0.9979248046875, -0.912139892578125, -0.82635498046875, -0.740570068359375, -0.65478515625, -0.569000244140625, -0.48321533203125, -0.397430419921875, -0.3116455078125, -0.225860595703125, -0.14007568359375, -0.054290771484375, 0.031494140625, 0.117279052734375, 0.20306396484375, 0.288848876953125, 0.3746337890625, 0.460418701171875, 0.54620361328125, 0.631988525390625, 0.7177734375, 0.803558349609375, 0.88934326171875, 0.975128173828125, 1.0609130859375, 1.146697998046875, 1.23248291015625, 1.318267822265625, 1.404052734375, 1.489837646484375, 1.57562255859375, 1.661407470703125, 1.7471923828125, 1.832977294921875, 1.91876220703125, 2.004547119140625, 2.09033203125, 2.176116943359375, 2.26190185546875, 2.347686767578125, 2.4334716796875, 2.519256591796875, 2.60504150390625, 2.690826416015625, 2.776611328125, 2.862396240234375, 2.94818115234375, 3.033966064453125, 3.1197509765625, 3.205535888671875, 3.29132080078125, 3.377105712890625, 3.462890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 11.0, 13.0, 11.0, 19.0, 21.0, 35.0, 29.0, 38.0, 65.0, 106.0, 217.0, 692.0, 7183.0, 668326.0, 365317.0, 5404.0, 543.0, 199.0, 97.0, 50.0, 40.0, 28.0, 18.0, 23.0, 17.0, 13.0, 6.0, 3.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6435546875, -1.5921173095703125, -1.540679931640625, -1.4892425537109375, -1.43780517578125, -1.3863677978515625, -1.334930419921875, -1.2834930419921875, -1.2320556640625, -1.1806182861328125, -1.129180908203125, -1.0777435302734375, -1.02630615234375, -0.9748687744140625, -0.923431396484375, -0.8719940185546875, -0.820556640625, -0.7691192626953125, -0.717681884765625, -0.6662445068359375, -0.61480712890625, -0.5633697509765625, -0.511932373046875, -0.4604949951171875, -0.4090576171875, -0.3576202392578125, -0.306182861328125, -0.2547454833984375, -0.20330810546875, -0.1518707275390625, -0.100433349609375, -0.0489959716796875, 0.00244140625, 0.0538787841796875, 0.105316162109375, 0.1567535400390625, 0.20819091796875, 0.2596282958984375, 0.311065673828125, 0.3625030517578125, 0.4139404296875, 0.4653778076171875, 0.516815185546875, 0.5682525634765625, 0.61968994140625, 0.6711273193359375, 0.722564697265625, 0.7740020751953125, 0.825439453125, 0.8768768310546875, 0.928314208984375, 0.9797515869140625, 1.03118896484375, 1.0826263427734375, 1.134063720703125, 1.1855010986328125, 1.2369384765625, 1.2883758544921875, 1.339813232421875, 1.3912506103515625, 1.44268798828125, 1.4941253662109375, 1.545562744140625, 1.5970001220703125, 1.6484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 4.0, 7.0, 11.0, 13.0, 15.0, 19.0, 28.0, 26.0, 23.0, 43.0, 45.0, 70.0, 53.0, 72.0, 59.0, 83.0, 62.0, 65.0, 51.0, 58.0, 39.0, 29.0, 26.0, 15.0, 19.0, 17.0, 9.0, 11.0, 5.0, 8.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.001953125, -1.93804931640625, -1.8741455078125, -1.81024169921875, -1.746337890625, -1.68243408203125, -1.6185302734375, -1.55462646484375, -1.49072265625, -1.42681884765625, -1.3629150390625, -1.29901123046875, -1.235107421875, -1.17120361328125, -1.1072998046875, -1.04339599609375, -0.9794921875, -0.91558837890625, -0.8516845703125, -0.78778076171875, -0.723876953125, -0.65997314453125, -0.5960693359375, -0.53216552734375, -0.46826171875, -0.40435791015625, -0.3404541015625, -0.27655029296875, -0.212646484375, -0.14874267578125, -0.0848388671875, -0.02093505859375, 0.04296875, 0.10687255859375, 0.1707763671875, 0.23468017578125, 0.298583984375, 0.36248779296875, 0.4263916015625, 0.49029541015625, 0.55419921875, 0.61810302734375, 0.6820068359375, 0.74591064453125, 0.809814453125, 0.87371826171875, 0.9376220703125, 1.00152587890625, 1.0654296875, 1.12933349609375, 1.1932373046875, 1.25714111328125, 1.321044921875, 1.38494873046875, 1.4488525390625, 1.51275634765625, 1.57666015625, 1.64056396484375, 1.7044677734375, 1.76837158203125, 1.832275390625, 1.89617919921875, 1.9600830078125, 2.02398681640625, 2.087890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 4.0, 7.0, 12.0, 28.0, 23.0, 30.0, 56.0, 84.0, 111.0, 207.0, 377.0, 704.0, 1286.0, 2472.0, 5959.0, 16980.0, 80506.0, 716549.0, 180527.0, 27223.0, 8342.0, 3338.0, 1614.0, 893.0, 468.0, 278.0, 182.0, 95.0, 50.0, 30.0, 33.0, 21.0, 14.0, 13.0, 7.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1668701171875, -0.16160202026367188, -0.15633392333984375, -0.15106582641601562, -0.1457977294921875, -0.14052963256835938, -0.13526153564453125, -0.12999343872070312, -0.124725341796875, -0.11945724487304688, -0.11418914794921875, -0.10892105102539062, -0.1036529541015625, -0.09838485717773438, -0.09311676025390625, -0.08784866333007812, -0.08258056640625, -0.07731246948242188, -0.07204437255859375, -0.06677627563476562, -0.0615081787109375, -0.056240081787109375, -0.05097198486328125, -0.045703887939453125, -0.040435791015625, -0.035167694091796875, -0.02989959716796875, -0.024631500244140625, -0.0193634033203125, -0.014095306396484375, -0.00882720947265625, -0.003559112548828125, 0.001708984375, 0.006977081298828125, 0.01224517822265625, 0.017513275146484375, 0.0227813720703125, 0.028049468994140625, 0.03331756591796875, 0.038585662841796875, 0.043853759765625, 0.049121856689453125, 0.05438995361328125, 0.059658050537109375, 0.0649261474609375, 0.07019424438476562, 0.07546234130859375, 0.08073043823242188, 0.08599853515625, 0.09126663208007812, 0.09653472900390625, 0.10180282592773438, 0.1070709228515625, 0.11233901977539062, 0.11760711669921875, 0.12287521362304688, 0.128143310546875, 0.13341140747070312, 0.13867950439453125, 0.14394760131835938, 0.1492156982421875, 0.15448379516601562, 0.15975189208984375, 0.16501998901367188, 0.1702880859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 8.0, 3.0, 4.0, 6.0, 12.0, 13.0, 16.0, 29.0, 48.0, 82.0, 128.0, 197.0, 178.0, 96.0, 69.0, 24.0, 24.0, 16.0, 16.0, 6.0, 13.0, 1.0, 8.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.676248550415039e-05, -2.5920569896697998e-05, -2.5078654289245605e-05, -2.4236738681793213e-05, -2.339482307434082e-05, -2.2552907466888428e-05, -2.1710991859436035e-05, -2.0869076251983643e-05, -2.002716064453125e-05, -1.9185245037078857e-05, -1.8343329429626465e-05, -1.7501413822174072e-05, -1.665949821472168e-05, -1.5817582607269287e-05, -1.4975666999816895e-05, -1.4133751392364502e-05, -1.329183578491211e-05, -1.2449920177459717e-05, -1.1608004570007324e-05, -1.0766088962554932e-05, -9.924173355102539e-06, -9.082257747650146e-06, -8.240342140197754e-06, -7.398426532745361e-06, -6.556510925292969e-06, -5.714595317840576e-06, -4.872679710388184e-06, -4.030764102935791e-06, -3.1888484954833984e-06, -2.346932888031006e-06, -1.5050172805786133e-06, -6.631016731262207e-07, 1.7881393432617188e-07, 1.0207295417785645e-06, 1.862645149230957e-06, 2.7045607566833496e-06, 3.546476364135742e-06, 4.388391971588135e-06, 5.230307579040527e-06, 6.07222318649292e-06, 6.9141387939453125e-06, 7.756054401397705e-06, 8.597970008850098e-06, 9.43988561630249e-06, 1.0281801223754883e-05, 1.1123716831207275e-05, 1.1965632438659668e-05, 1.280754804611206e-05, 1.3649463653564453e-05, 1.4491379261016846e-05, 1.5333294868469238e-05, 1.617521047592163e-05, 1.7017126083374023e-05, 1.7859041690826416e-05, 1.870095729827881e-05, 1.95428729057312e-05, 2.0384788513183594e-05, 2.1226704120635986e-05, 2.206861972808838e-05, 2.291053533554077e-05, 2.3752450942993164e-05, 2.4594366550445557e-05, 2.543628215789795e-05, 2.6278197765350342e-05, 2.7120113372802734e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 8.0, 6.0, 13.0, 17.0, 20.0, 23.0, 35.0, 71.0, 115.0, 218.0, 404.0, 748.0, 1646.0, 3468.0, 8448.0, 26969.0, 198615.0, 714904.0, 67718.0, 14863.0, 5490.0, 2351.0, 1099.0, 570.0, 309.0, 155.0, 102.0, 54.0, 35.0, 24.0, 16.0, 16.0, 8.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.230224609375, -0.22350692749023438, -0.21678924560546875, -0.21007156372070312, -0.2033538818359375, -0.19663619995117188, -0.18991851806640625, -0.18320083618164062, -0.176483154296875, -0.16976547241210938, -0.16304779052734375, -0.15633010864257812, -0.1496124267578125, -0.14289474487304688, -0.13617706298828125, -0.12945938110351562, -0.12274169921875, -0.11602401733398438, -0.10930633544921875, -0.10258865356445312, -0.0958709716796875, -0.08915328979492188, -0.08243560791015625, -0.07571792602539062, -0.069000244140625, -0.062282562255859375, -0.05556488037109375, -0.048847198486328125, -0.0421295166015625, -0.035411834716796875, -0.02869415283203125, -0.021976470947265625, -0.0152587890625, -0.008541107177734375, -0.00182342529296875, 0.004894256591796875, 0.0116119384765625, 0.018329620361328125, 0.02504730224609375, 0.031764984130859375, 0.038482666015625, 0.045200347900390625, 0.05191802978515625, 0.058635711669921875, 0.0653533935546875, 0.07207107543945312, 0.07878875732421875, 0.08550643920898438, 0.09222412109375, 0.09894180297851562, 0.10565948486328125, 0.11237716674804688, 0.1190948486328125, 0.12581253051757812, 0.13253021240234375, 0.13924789428710938, 0.145965576171875, 0.15268325805664062, 0.15940093994140625, 0.16611862182617188, 0.1728363037109375, 0.17955398559570312, 0.18627166748046875, 0.19298934936523438, 0.19970703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 13.0, 4.0, 12.0, 22.0, 37.0, 32.0, 47.0, 66.0, 109.0, 137.0, 154.0, 93.0, 64.0, 59.0, 34.0, 29.0, 19.0, 6.0, 5.0, 11.0, 8.0, 6.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1068115234375, -0.1036691665649414, -0.10052680969238281, -0.09738445281982422, -0.09424209594726562, -0.09109973907470703, -0.08795738220214844, -0.08481502532958984, -0.08167266845703125, -0.07853031158447266, -0.07538795471191406, -0.07224559783935547, -0.06910324096679688, -0.06596088409423828, -0.06281852722167969, -0.059676170349121094, -0.0565338134765625, -0.053391456604003906, -0.05024909973144531, -0.04710674285888672, -0.043964385986328125, -0.04082202911376953, -0.03767967224121094, -0.034537315368652344, -0.03139495849609375, -0.028252601623535156, -0.025110244750976562, -0.02196788787841797, -0.018825531005859375, -0.01568317413330078, -0.012540817260742188, -0.009398460388183594, -0.006256103515625, -0.0031137466430664062, 2.86102294921875e-05, 0.0031709671020507812, 0.006313323974609375, 0.009455680847167969, 0.012598037719726562, 0.015740394592285156, 0.01888275146484375, 0.022025108337402344, 0.025167465209960938, 0.02830982208251953, 0.031452178955078125, 0.03459453582763672, 0.03773689270019531, 0.040879249572753906, 0.0440216064453125, 0.047163963317871094, 0.05030632019042969, 0.05344867706298828, 0.056591033935546875, 0.05973339080810547, 0.06287574768066406, 0.06601810455322266, 0.06916046142578125, 0.07230281829833984, 0.07544517517089844, 0.07858753204345703, 0.08172988891601562, 0.08487224578857422, 0.08801460266113281, 0.0911569595336914, 0.09429931640625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 15.0, 33.0, 149.0, 373.0, 308.0, 89.0, 27.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.718236923217773, -4.548639297485352, -4.37904167175293, -4.209444046020508, -4.039846420288086, -3.870248794555664, -3.700650930404663, -3.531053304672241, -3.3614556789398193, -3.1918580532073975, -3.0222604274749756, -2.8526625633239746, -2.6830649375915527, -2.513467311859131, -2.343869686126709, -2.174272060394287, -2.0046744346618652, -1.8350768089294434, -1.6654791831970215, -1.49588143825531, -1.3262838125228882, -1.1566861867904663, -0.9870884418487549, -0.817490816116333, -0.6478931903839111, -0.47829553484916687, -0.3086978793144226, -0.13910019397735596, 0.030497431755065918, 0.2000950574874878, 0.3696928024291992, 0.5392904281616211, 0.7088885307312012, 0.878486156463623, 1.048083782196045, 1.2176815271377563, 1.3872791528701782, 1.5568767786026, 1.7264745235443115, 1.8960721492767334, 2.0656697750091553, 2.235267400741577, 2.404865026473999, 2.574462890625, 2.744060516357422, 2.9136581420898438, 3.0832557678222656, 3.2528533935546875, 3.4224510192871094, 3.5920486450195312, 3.761646270751953, 3.931243896484375, 4.100841522216797, 4.270439147949219, 4.440036773681641, 4.6096343994140625, 4.779232025146484, 4.948829650878906, 5.118427276611328, 5.28802490234375, 5.457622528076172, 5.627220153808594, 5.796817779541016, 5.9664154052734375, 6.136013507843018]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 12.0, 23.0, 21.0, 34.0, 33.0, 47.0, 49.0, 65.0, 78.0, 91.0, 80.0, 78.0, 65.0, 78.0, 64.0, 43.0, 38.0, 39.0, 19.0, 11.0, 13.0, 10.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.293010711669922, -5.124783515930176, -4.95655632019043, -4.788329124450684, -4.6201019287109375, -4.45187520980835, -4.2836480140686035, -4.115420818328857, -3.9471936225891113, -3.7789664268493652, -3.610739231109619, -3.442512273788452, -3.274285078048706, -3.10605788230896, -2.937830924987793, -2.769603729248047, -2.601376533508301, -2.4331493377685547, -2.2649221420288086, -2.0966951847076416, -1.9284679889678955, -1.7602407932281494, -1.5920137166976929, -1.4237866401672363, -1.2555594444274902, -1.0873322486877441, -0.9191051721572876, -0.7508780360221863, -0.582650899887085, -0.41442376375198364, -0.24619662761688232, -0.07796955108642578, 0.09025812149047852, 0.25848525762557983, 0.42671239376068115, 0.5949395298957825, 0.7631666660308838, 0.9313938021659851, 1.0996209383010864, 1.267848014831543, 1.436075210571289, 1.6043024063110352, 1.7725294828414917, 1.9407565593719482, 2.1089837551116943, 2.2772109508514404, 2.4454379081726074, 2.6136651039123535, 2.7818922996520996, 2.9501194953918457, 3.118346691131592, 3.286573648452759, 3.454800844192505, 3.623028039932251, 3.791254997253418, 3.959482192993164, 4.12770938873291, 4.295936584472656, 4.464163780212402, 4.632390975952148, 4.8006181716918945, 4.968844890594482, 5.1370720863342285, 5.305299282073975, 5.473526477813721]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 10.0, 13.0, 25.0, 19.0, 42.0, 59.0, 105.0, 207.0, 522.0, 1208.0, 2416.0, 5452.0, 23905.0, 492411.0, 3515226.0, 134427.0, 12108.0, 3650.0, 1298.0, 514.0, 271.0, 142.0, 86.0, 61.0, 28.0, 29.0, 9.0, 13.0, 10.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7314453125, -1.676177978515625, -1.62091064453125, -1.565643310546875, -1.5103759765625, -1.455108642578125, -1.39984130859375, -1.344573974609375, -1.289306640625, -1.234039306640625, -1.17877197265625, -1.123504638671875, -1.0682373046875, -1.012969970703125, -0.95770263671875, -0.902435302734375, -0.84716796875, -0.791900634765625, -0.73663330078125, -0.681365966796875, -0.6260986328125, -0.570831298828125, -0.51556396484375, -0.460296630859375, -0.405029296875, -0.349761962890625, -0.29449462890625, -0.239227294921875, -0.1839599609375, -0.128692626953125, -0.07342529296875, -0.018157958984375, 0.037109375, 0.092376708984375, 0.14764404296875, 0.202911376953125, 0.2581787109375, 0.313446044921875, 0.36871337890625, 0.423980712890625, 0.479248046875, 0.534515380859375, 0.58978271484375, 0.645050048828125, 0.7003173828125, 0.755584716796875, 0.81085205078125, 0.866119384765625, 0.92138671875, 0.976654052734375, 1.03192138671875, 1.087188720703125, 1.1424560546875, 1.197723388671875, 1.25299072265625, 1.308258056640625, 1.363525390625, 1.418792724609375, 1.47406005859375, 1.529327392578125, 1.5845947265625, 1.639862060546875, 1.69512939453125, 1.750396728515625, 1.8056640625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 8.0, 23.0, 22.0, 42.0, 74.0, 122.0, 132.0, 179.0, 139.0, 113.0, 66.0, 43.0, 26.0, 7.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6298828125, -1.5679779052734375, -1.506072998046875, -1.4441680908203125, -1.38226318359375, -1.3203582763671875, -1.258453369140625, -1.1965484619140625, -1.1346435546875, -1.0727386474609375, -1.010833740234375, -0.9489288330078125, -0.88702392578125, -0.8251190185546875, -0.763214111328125, -0.7013092041015625, -0.639404296875, -0.5774993896484375, -0.515594482421875, -0.4536895751953125, -0.39178466796875, -0.3298797607421875, -0.267974853515625, -0.2060699462890625, -0.1441650390625, -0.0822601318359375, -0.020355224609375, 0.0415496826171875, 0.10345458984375, 0.1653594970703125, 0.227264404296875, 0.2891693115234375, 0.35107421875, 0.4129791259765625, 0.474884033203125, 0.5367889404296875, 0.59869384765625, 0.6605987548828125, 0.722503662109375, 0.7844085693359375, 0.8463134765625, 0.9082183837890625, 0.970123291015625, 1.0320281982421875, 1.09393310546875, 1.1558380126953125, 1.217742919921875, 1.2796478271484375, 1.341552734375, 1.4034576416015625, 1.465362548828125, 1.5272674560546875, 1.58917236328125, 1.6510772705078125, 1.712982177734375, 1.7748870849609375, 1.8367919921875, 1.8986968994140625, 1.960601806640625, 2.0225067138671875, 2.08441162109375, 2.1463165283203125, 2.208221435546875, 2.2701263427734375, 2.33203125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 12.0, 11.0, 20.0, 46.0, 88.0, 182.0, 481.0, 2330.0, 49978.0, 4105606.0, 33059.0, 1797.0, 384.0, 120.0, 77.0, 44.0, 27.0, 9.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.46875, -4.36590576171875, -4.2630615234375, -4.16021728515625, -4.057373046875, -3.95452880859375, -3.8516845703125, -3.74884033203125, -3.64599609375, -3.54315185546875, -3.4403076171875, -3.33746337890625, -3.234619140625, -3.13177490234375, -3.0289306640625, -2.92608642578125, -2.8232421875, -2.72039794921875, -2.6175537109375, -2.51470947265625, -2.411865234375, -2.30902099609375, -2.2061767578125, -2.10333251953125, -2.00048828125, -1.89764404296875, -1.7947998046875, -1.69195556640625, -1.589111328125, -1.48626708984375, -1.3834228515625, -1.28057861328125, -1.177734375, -1.07489013671875, -0.9720458984375, -0.86920166015625, -0.766357421875, -0.66351318359375, -0.5606689453125, -0.45782470703125, -0.35498046875, -0.25213623046875, -0.1492919921875, -0.04644775390625, 0.056396484375, 0.15924072265625, 0.2620849609375, 0.36492919921875, 0.4677734375, 0.57061767578125, 0.6734619140625, 0.77630615234375, 0.879150390625, 0.98199462890625, 1.0848388671875, 1.18768310546875, 1.29052734375, 1.39337158203125, 1.4962158203125, 1.59906005859375, 1.701904296875, 1.80474853515625, 1.9075927734375, 2.01043701171875, 2.11328125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 10.0, 12.0, 30.0, 48.0, 103.0, 391.0, 1960.0, 1164.0, 204.0, 83.0, 35.0, 18.0, 13.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4892578125, -0.4617767333984375, -0.434295654296875, -0.4068145751953125, -0.37933349609375, -0.3518524169921875, -0.324371337890625, -0.2968902587890625, -0.2694091796875, -0.2419281005859375, -0.214447021484375, -0.1869659423828125, -0.15948486328125, -0.1320037841796875, -0.104522705078125, -0.0770416259765625, -0.049560546875, -0.0220794677734375, 0.005401611328125, 0.0328826904296875, 0.06036376953125, 0.0878448486328125, 0.115325927734375, 0.1428070068359375, 0.1702880859375, 0.1977691650390625, 0.225250244140625, 0.2527313232421875, 0.28021240234375, 0.3076934814453125, 0.335174560546875, 0.3626556396484375, 0.39013671875, 0.4176177978515625, 0.445098876953125, 0.4725799560546875, 0.50006103515625, 0.5275421142578125, 0.555023193359375, 0.5825042724609375, 0.6099853515625, 0.6374664306640625, 0.664947509765625, 0.6924285888671875, 0.71990966796875, 0.7473907470703125, 0.774871826171875, 0.8023529052734375, 0.829833984375, 0.8573150634765625, 0.884796142578125, 0.9122772216796875, 0.93975830078125, 0.9672393798828125, 0.994720458984375, 1.0222015380859375, 1.0496826171875, 1.0771636962890625, 1.104644775390625, 1.1321258544921875, 1.15960693359375, 1.1870880126953125, 1.214569091796875, 1.2420501708984375, 1.26953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 11.0, 14.0, 27.0, 76.0, 176.0, 246.0, 210.0, 128.0, 65.0, 31.0, 9.0, 10.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5147783756256104, -2.43587589263916, -2.35697340965271, -2.2780709266662598, -2.1991684436798096, -2.1202659606933594, -2.04136323928833, -1.9624607563018799, -1.8835582733154297, -1.8046557903289795, -1.7257533073425293, -1.646850824356079, -1.5679482221603394, -1.4890457391738892, -1.410143256187439, -1.3312406539916992, -1.2523382902145386, -1.1734358072280884, -1.0945333242416382, -1.0156307220458984, -0.9367282390594482, -0.857825756072998, -0.7789232730865479, -0.7000207304954529, -0.6211182475090027, -0.5422157645225525, -0.4633132219314575, -0.3844107389450073, -0.30550822615623474, -0.22660571336746216, -0.14770323038101196, -0.06880068778991699, 0.010101795196533203, 0.08900430053472519, 0.16790680587291718, 0.24680930376052856, 0.32571181654930115, 0.40461432933807373, 0.4835168123245239, 0.5624193549156189, 0.6413218379020691, 0.7202243208885193, 0.7991268634796143, 0.8780293464660645, 0.9569318294525146, 1.0358343124389648, 1.114736795425415, 1.1936393976211548, 1.272541880607605, 1.3514443635940552, 1.4303468465805054, 1.5092494487762451, 1.5881519317626953, 1.6670544147491455, 1.7459568977355957, 1.824859380722046, 1.903761863708496, 1.9826643466949463, 2.0615668296813965, 2.1404693126678467, 2.219371795654297, 2.298274517059326, 2.3771767616271973, 2.4560794830322266, 2.5349819660186768]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 9.0, 11.0, 24.0, 37.0, 65.0, 91.0, 106.0, 136.0, 133.0, 127.0, 91.0, 68.0, 46.0, 32.0, 13.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.85817289352417, -1.7943387031555176, -1.7305046319961548, -1.6666704416275024, -1.6028363704681396, -1.5390021800994873, -1.475167989730835, -1.4113337993621826, -1.3474997282028198, -1.2836655378341675, -1.2198314666748047, -1.1559972763061523, -1.0921630859375, -1.0283290147781372, -0.9644948244094849, -0.9006606936454773, -0.8368265628814697, -0.7729924321174622, -0.7091583013534546, -0.6453241109848022, -0.5814899802207947, -0.5176558494567871, -0.45382168889045715, -0.3899875283241272, -0.32615339756011963, -0.26231926679611206, -0.1984851062297821, -0.13465096056461334, -0.07081681489944458, -0.006982684135437012, 0.056851476430892944, 0.1206856369972229, 0.18451952934265137, 0.24835367500782013, 0.3121878206729889, 0.37602198123931885, 0.4398561120033264, 0.503690242767334, 0.5675244331359863, 0.6313585638999939, 0.6951926946640015, 0.759026825428009, 0.8228609561920166, 0.886695146560669, 0.9505292773246765, 1.014363408088684, 1.0781975984573364, 1.1420316696166992, 1.2058658599853516, 1.269700050354004, 1.3335341215133667, 1.397368311882019, 1.4612023830413818, 1.5250365734100342, 1.5888707637786865, 1.6527049541473389, 1.7165390253067017, 1.780373215675354, 1.8442072868347168, 1.9080414772033691, 1.9718756675720215, 2.035709857940674, 2.099543809890747, 2.1633780002593994, 2.2272121906280518]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 11.0, 11.0, 19.0, 16.0, 20.0, 23.0, 37.0, 68.0, 73.0, 120.0, 179.0, 396.0, 1031.0, 3425.0, 17772.0, 177893.0, 738714.0, 93355.0, 11285.0, 2463.0, 791.0, 341.0, 164.0, 84.0, 66.0, 50.0, 46.0, 18.0, 29.0, 13.0, 14.0, 5.0, 2.0, 4.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2420654296875, -0.23435020446777344, -0.22663497924804688, -0.2189197540283203, -0.21120452880859375, -0.2034893035888672, -0.19577407836914062, -0.18805885314941406, -0.1803436279296875, -0.17262840270996094, -0.16491317749023438, -0.1571979522705078, -0.14948272705078125, -0.1417675018310547, -0.13405227661132812, -0.12633705139160156, -0.118621826171875, -0.11090660095214844, -0.10319137573242188, -0.09547615051269531, -0.08776092529296875, -0.08004570007324219, -0.07233047485351562, -0.06461524963378906, -0.0569000244140625, -0.04918479919433594, -0.041469573974609375, -0.03375434875488281, -0.02603912353515625, -0.018323898315429688, -0.010608673095703125, -0.0028934478759765625, 0.00482177734375, 0.012537002563476562, 0.020252227783203125, 0.027967453002929688, 0.03568267822265625, 0.04339790344238281, 0.051113128662109375, 0.05882835388183594, 0.0665435791015625, 0.07425880432128906, 0.08197402954101562, 0.08968925476074219, 0.09740447998046875, 0.10511970520019531, 0.11283493041992188, 0.12055015563964844, 0.128265380859375, 0.13598060607910156, 0.14369583129882812, 0.1514110565185547, 0.15912628173828125, 0.1668415069580078, 0.17455673217773438, 0.18227195739746094, 0.1899871826171875, 0.19770240783691406, 0.20541763305664062, 0.2131328582763672, 0.22084808349609375, 0.2285633087158203, 0.23627853393554688, 0.24399375915527344, 0.251708984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 16.0, 13.0, 30.0, 59.0, 103.0, 154.0, 164.0, 186.0, 128.0, 69.0, 47.0, 19.0, 14.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.359375, -1.30853271484375, -1.2576904296875, -1.20684814453125, -1.156005859375, -1.10516357421875, -1.0543212890625, -1.00347900390625, -0.95263671875, -0.90179443359375, -0.8509521484375, -0.80010986328125, -0.749267578125, -0.69842529296875, -0.6475830078125, -0.59674072265625, -0.5458984375, -0.49505615234375, -0.4442138671875, -0.39337158203125, -0.342529296875, -0.29168701171875, -0.2408447265625, -0.19000244140625, -0.13916015625, -0.08831787109375, -0.0374755859375, 0.01336669921875, 0.064208984375, 0.11505126953125, 0.1658935546875, 0.21673583984375, 0.267578125, 0.31842041015625, 0.3692626953125, 0.42010498046875, 0.470947265625, 0.52178955078125, 0.5726318359375, 0.62347412109375, 0.67431640625, 0.72515869140625, 0.7760009765625, 0.82684326171875, 0.877685546875, 0.92852783203125, 0.9793701171875, 1.03021240234375, 1.0810546875, 1.13189697265625, 1.1827392578125, 1.23358154296875, 1.284423828125, 1.33526611328125, 1.3861083984375, 1.43695068359375, 1.48779296875, 1.53863525390625, 1.5894775390625, 1.64031982421875, 1.691162109375, 1.74200439453125, 1.7928466796875, 1.84368896484375, 1.89453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 11.0, 12.0, 21.0, 31.0, 43.0, 84.0, 126.0, 204.0, 339.0, 504.0, 949.0, 1598.0, 3039.0, 5669.0, 11462.0, 24427.0, 55847.0, 137515.0, 313008.0, 282488.0, 119046.0, 48925.0, 21586.0, 10207.0, 5149.0, 2680.0, 1460.0, 846.0, 526.0, 293.0, 168.0, 123.0, 52.0, 30.0, 41.0, 16.0, 11.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0819091796875, -0.0794210433959961, -0.07693290710449219, -0.07444477081298828, -0.07195663452148438, -0.06946849822998047, -0.06698036193847656, -0.06449222564697266, -0.06200408935546875, -0.059515953063964844, -0.05702781677246094, -0.05453968048095703, -0.052051544189453125, -0.04956340789794922, -0.04707527160644531, -0.044587135314941406, -0.0420989990234375, -0.039610862731933594, -0.03712272644042969, -0.03463459014892578, -0.032146453857421875, -0.02965831756591797, -0.027170181274414062, -0.024682044982910156, -0.02219390869140625, -0.019705772399902344, -0.017217636108398438, -0.014729499816894531, -0.012241363525390625, -0.009753227233886719, -0.0072650909423828125, -0.004776954650878906, -0.002288818359375, 0.00019931793212890625, 0.0026874542236328125, 0.005175590515136719, 0.007663726806640625, 0.010151863098144531, 0.012639999389648438, 0.015128135681152344, 0.01761627197265625, 0.020104408264160156, 0.022592544555664062, 0.02508068084716797, 0.027568817138671875, 0.03005695343017578, 0.03254508972167969, 0.035033226013183594, 0.0375213623046875, 0.040009498596191406, 0.04249763488769531, 0.04498577117919922, 0.047473907470703125, 0.04996204376220703, 0.05245018005371094, 0.054938316345214844, 0.05742645263671875, 0.059914588928222656, 0.06240272521972656, 0.06489086151123047, 0.06737899780273438, 0.06986713409423828, 0.07235527038574219, 0.0748434066772461, 0.07733154296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 6.0, 3.0, 4.0, 8.0, 11.0, 8.0, 18.0, 22.0, 21.0, 22.0, 25.0, 25.0, 29.0, 36.0, 46.0, 48.0, 52.0, 48.0, 52.0, 48.0, 50.0, 44.0, 52.0, 37.0, 43.0, 39.0, 25.0, 35.0, 21.0, 16.0, 20.0, 14.0, 14.0, 12.0, 8.0, 9.0, 4.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.1357421875, -1.101348876953125, -1.06695556640625, -1.032562255859375, -0.9981689453125, -0.963775634765625, -0.92938232421875, -0.894989013671875, -0.860595703125, -0.826202392578125, -0.79180908203125, -0.757415771484375, -0.7230224609375, -0.688629150390625, -0.65423583984375, -0.619842529296875, -0.58544921875, -0.551055908203125, -0.51666259765625, -0.482269287109375, -0.4478759765625, -0.413482666015625, -0.37908935546875, -0.344696044921875, -0.310302734375, -0.275909423828125, -0.24151611328125, -0.207122802734375, -0.1727294921875, -0.138336181640625, -0.10394287109375, -0.069549560546875, -0.03515625, -0.000762939453125, 0.03363037109375, 0.068023681640625, 0.1024169921875, 0.136810302734375, 0.17120361328125, 0.205596923828125, 0.239990234375, 0.274383544921875, 0.30877685546875, 0.343170166015625, 0.3775634765625, 0.411956787109375, 0.44635009765625, 0.480743408203125, 0.51513671875, 0.549530029296875, 0.58392333984375, 0.618316650390625, 0.6527099609375, 0.687103271484375, 0.72149658203125, 0.755889892578125, 0.790283203125, 0.824676513671875, 0.85906982421875, 0.893463134765625, 0.9278564453125, 0.962249755859375, 0.99664306640625, 1.031036376953125, 1.0654296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 3.0, 3.0, 4.0, 10.0, 11.0, 19.0, 32.0, 36.0, 53.0, 85.0, 138.0, 229.0, 445.0, 1124.0, 3246.0, 16700.0, 928606.0, 87491.0, 6910.0, 1917.0, 699.0, 318.0, 203.0, 119.0, 53.0, 29.0, 30.0, 19.0, 5.0, 10.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.044677734375, -0.04327058792114258, -0.041863441467285156, -0.040456295013427734, -0.03904914855957031, -0.03764200210571289, -0.03623485565185547, -0.03482770919799805, -0.033420562744140625, -0.0320134162902832, -0.03060626983642578, -0.02919912338256836, -0.027791976928710938, -0.026384830474853516, -0.024977684020996094, -0.023570537567138672, -0.02216339111328125, -0.020756244659423828, -0.019349098205566406, -0.017941951751708984, -0.016534805297851562, -0.01512765884399414, -0.013720512390136719, -0.012313365936279297, -0.010906219482421875, -0.009499073028564453, -0.008091926574707031, -0.006684780120849609, -0.0052776336669921875, -0.0038704872131347656, -0.0024633407592773438, -0.0010561943054199219, 0.0003509521484375, 0.0017580986022949219, 0.0031652450561523438, 0.004572391510009766, 0.0059795379638671875, 0.007386684417724609, 0.008793830871582031, 0.010200977325439453, 0.011608123779296875, 0.013015270233154297, 0.014422416687011719, 0.01582956314086914, 0.017236709594726562, 0.018643856048583984, 0.020051002502441406, 0.021458148956298828, 0.02286529541015625, 0.024272441864013672, 0.025679588317871094, 0.027086734771728516, 0.028493881225585938, 0.02990102767944336, 0.03130817413330078, 0.0327153205871582, 0.034122467041015625, 0.03552961349487305, 0.03693675994873047, 0.03834390640258789, 0.03975105285644531, 0.041158199310302734, 0.042565345764160156, 0.04397249221801758, 0.045379638671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 7.0, 10.0, 21.0, 40.0, 97.0, 166.0, 281.0, 172.0, 86.0, 45.0, 30.0, 16.0, 10.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.212690353393555e-05, -3.091525286436081e-05, -2.9703602194786072e-05, -2.8491951525211334e-05, -2.7280300855636597e-05, -2.606865018606186e-05, -2.485699951648712e-05, -2.3645348846912384e-05, -2.2433698177337646e-05, -2.122204750776291e-05, -2.001039683818817e-05, -1.8798746168613434e-05, -1.7587095499038696e-05, -1.637544482946396e-05, -1.5163794159889221e-05, -1.3952143490314484e-05, -1.2740492820739746e-05, -1.1528842151165009e-05, -1.0317191481590271e-05, -9.105540812015533e-06, -7.893890142440796e-06, -6.682239472866058e-06, -5.470588803291321e-06, -4.258938133716583e-06, -3.0472874641418457e-06, -1.8356367945671082e-06, -6.239861249923706e-07, 5.876645445823669e-07, 1.7993152141571045e-06, 3.010965883731842e-06, 4.22261655330658e-06, 5.434267222881317e-06, 6.645917892456055e-06, 7.857568562030792e-06, 9.06921923160553e-06, 1.0280869901180267e-05, 1.1492520570755005e-05, 1.2704171240329742e-05, 1.391582190990448e-05, 1.5127472579479218e-05, 1.6339123249053955e-05, 1.7550773918628693e-05, 1.876242458820343e-05, 1.9974075257778168e-05, 2.1185725927352905e-05, 2.2397376596927643e-05, 2.360902726650238e-05, 2.4820677936077118e-05, 2.6032328605651855e-05, 2.7243979275226593e-05, 2.845562994480133e-05, 2.9667280614376068e-05, 3.0878931283950806e-05, 3.209058195352554e-05, 3.330223262310028e-05, 3.451388329267502e-05, 3.5725533962249756e-05, 3.6937184631824493e-05, 3.814883530139923e-05, 3.936048597097397e-05, 4.0572136640548706e-05, 4.1783787310123444e-05, 4.299543797969818e-05, 4.420708864927292e-05, 4.5418739318847656e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 1.0, 6.0, 3.0, 7.0, 11.0, 33.0, 35.0, 66.0, 145.0, 269.0, 614.0, 1442.0, 3793.0, 16789.0, 921685.0, 92283.0, 7213.0, 2321.0, 951.0, 431.0, 213.0, 105.0, 53.0, 26.0, 22.0, 10.0, 5.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047149658203125, -0.045510292053222656, -0.04387092590332031, -0.04223155975341797, -0.040592193603515625, -0.03895282745361328, -0.03731346130371094, -0.035674095153808594, -0.03403472900390625, -0.032395362854003906, -0.030755996704101562, -0.02911663055419922, -0.027477264404296875, -0.02583789825439453, -0.024198532104492188, -0.022559165954589844, -0.0209197998046875, -0.019280433654785156, -0.017641067504882812, -0.01600170135498047, -0.014362335205078125, -0.012722969055175781, -0.011083602905273438, -0.009444236755371094, -0.00780487060546875, -0.006165504455566406, -0.0045261383056640625, -0.0028867721557617188, -0.001247406005859375, 0.00039196014404296875, 0.0020313262939453125, 0.0036706924438476562, 0.00531005859375, 0.006949424743652344, 0.008588790893554688, 0.010228157043457031, 0.011867523193359375, 0.013506889343261719, 0.015146255493164062, 0.016785621643066406, 0.01842498779296875, 0.020064353942871094, 0.021703720092773438, 0.02334308624267578, 0.024982452392578125, 0.02662181854248047, 0.028261184692382812, 0.029900550842285156, 0.0315399169921875, 0.033179283142089844, 0.03481864929199219, 0.03645801544189453, 0.038097381591796875, 0.03973674774169922, 0.04137611389160156, 0.043015480041503906, 0.04465484619140625, 0.046294212341308594, 0.04793357849121094, 0.04957294464111328, 0.051212310791015625, 0.05285167694091797, 0.05449104309082031, 0.056130409240722656, 0.057769775390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 8.0, 23.0, 50.0, 86.0, 288.0, 318.0, 82.0, 46.0, 20.0, 17.0, 12.0, 6.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.01313018798828125, -0.012755632400512695, -0.01238107681274414, -0.012006521224975586, -0.011631965637207031, -0.011257410049438477, -0.010882854461669922, -0.010508298873901367, -0.010133743286132812, -0.009759187698364258, -0.009384632110595703, -0.009010076522827148, -0.008635520935058594, -0.008260965347290039, -0.007886409759521484, -0.00751185417175293, -0.007137298583984375, -0.00676274299621582, -0.006388187408447266, -0.006013631820678711, -0.005639076232910156, -0.0052645206451416016, -0.004889965057373047, -0.004515409469604492, -0.0041408538818359375, -0.003766298294067383, -0.003391742706298828, -0.0030171871185302734, -0.0026426315307617188, -0.002268075942993164, -0.0018935203552246094, -0.0015189647674560547, -0.0011444091796875, -0.0007698535919189453, -0.0003952980041503906, -2.0742416381835938e-05, 0.00035381317138671875, 0.0007283687591552734, 0.0011029243469238281, 0.0014774799346923828, 0.0018520355224609375, 0.002226591110229492, 0.002601146697998047, 0.0029757022857666016, 0.0033502578735351562, 0.003724813461303711, 0.004099369049072266, 0.00447392463684082, 0.004848480224609375, 0.00522303581237793, 0.005597591400146484, 0.005972146987915039, 0.006346702575683594, 0.0067212581634521484, 0.007095813751220703, 0.007470369338989258, 0.007844924926757812, 0.008219480514526367, 0.008594036102294922, 0.008968591690063477, 0.009343147277832031, 0.009717702865600586, 0.01009225845336914, 0.010466814041137695, 0.01084136962890625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 15.0, 45.0, 169.0, 376.0, 246.0, 111.0, 20.0, 9.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8784151077270508, -1.8107056617736816, -1.742996096611023, -1.6752865314483643, -1.6075770854949951, -1.539867639541626, -1.4721580743789673, -1.4044485092163086, -1.3367390632629395, -1.2690296173095703, -1.2013200521469116, -1.133610486984253, -1.0659010410308838, -0.9981915354728699, -0.930482029914856, -0.862772524356842, -0.7950630187988281, -0.7273535132408142, -0.6596440076828003, -0.5919345021247864, -0.5242249965667725, -0.45651549100875854, -0.38880598545074463, -0.3210964798927307, -0.2533869743347168, -0.18567746877670288, -0.11796796321868896, -0.05025845766067505, 0.017451047897338867, 0.08516055345535278, 0.1528700590133667, 0.22057956457138062, 0.28828883171081543, 0.35599833726882935, 0.42370784282684326, 0.4914173483848572, 0.5591268539428711, 0.626836359500885, 0.6945458650588989, 0.7622553706169128, 0.8299648761749268, 0.8976743817329407, 0.9653838872909546, 1.0330934524536133, 1.1008028984069824, 1.1685123443603516, 1.2362219095230103, 1.303931474685669, 1.371640920639038, 1.4393503665924072, 1.507059931755066, 1.5747694969177246, 1.6424789428710938, 1.710188388824463, 1.7778979539871216, 1.8456075191497803, 1.9133169651031494, 1.9810264110565186, 2.048736095428467, 2.116445541381836, 2.184154987335205, 2.251864433288574, 2.3195738792419434, 2.3872835636138916, 2.4549930095672607]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 11.0, 21.0, 33.0, 74.0, 103.0, 154.0, 175.0, 159.0, 122.0, 68.0, 42.0, 24.0, 9.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.318250060081482, -1.270463466644287, -1.2226768732070923, -1.1748902797698975, -1.1271036863327026, -1.0793170928955078, -1.031530499458313, -0.9837439060211182, -0.9359573125839233, -0.8881707191467285, -0.8403841257095337, -0.7925975322723389, -0.744810938835144, -0.6970243453979492, -0.6492377519607544, -0.6014511585235596, -0.5536645650863647, -0.5058779716491699, -0.4580913782119751, -0.4103047847747803, -0.36251819133758545, -0.3147315979003906, -0.2669450044631958, -0.21915841102600098, -0.17137181758880615, -0.12358522415161133, -0.0757986307144165, -0.02801203727722168, 0.019774556159973145, 0.06756114959716797, 0.11534774303436279, 0.16313433647155762, 0.2109208106994629, 0.2587074041366577, 0.30649399757385254, 0.35428059101104736, 0.4020671844482422, 0.449853777885437, 0.49764037132263184, 0.5454269647598267, 0.5932135581970215, 0.6410001516342163, 0.6887867450714111, 0.736573338508606, 0.7843599319458008, 0.8321465253829956, 0.8799331188201904, 0.9277197122573853, 0.9755063056945801, 1.023292899131775, 1.0710794925689697, 1.1188660860061646, 1.1666526794433594, 1.2144392728805542, 1.262225866317749, 1.3100124597549438, 1.3577990531921387, 1.4055856466293335, 1.4533722400665283, 1.5011588335037231, 1.548945426940918, 1.5967320203781128, 1.6445186138153076, 1.6923052072525024, 1.7400918006896973]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 10.0, 10.0, 12.0, 14.0, 28.0, 42.0, 62.0, 94.0, 171.0, 292.0, 532.0, 1005.0, 2095.0, 4885.0, 13540.0, 62833.0, 725325.0, 199292.0, 24630.0, 7592.0, 3046.0, 1373.0, 710.0, 330.0, 202.0, 149.0, 87.0, 53.0, 36.0, 30.0, 19.0, 10.0, 9.0, 17.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.583984375, -0.568084716796875, -0.55218505859375, -0.536285400390625, -0.5203857421875, -0.504486083984375, -0.48858642578125, -0.472686767578125, -0.456787109375, -0.440887451171875, -0.42498779296875, -0.409088134765625, -0.3931884765625, -0.377288818359375, -0.36138916015625, -0.345489501953125, -0.32958984375, -0.313690185546875, -0.29779052734375, -0.281890869140625, -0.2659912109375, -0.250091552734375, -0.23419189453125, -0.218292236328125, -0.202392578125, -0.186492919921875, -0.17059326171875, -0.154693603515625, -0.1387939453125, -0.122894287109375, -0.10699462890625, -0.091094970703125, -0.0751953125, -0.059295654296875, -0.04339599609375, -0.027496337890625, -0.0115966796875, 0.004302978515625, 0.02020263671875, 0.036102294921875, 0.052001953125, 0.067901611328125, 0.08380126953125, 0.099700927734375, 0.1156005859375, 0.131500244140625, 0.14739990234375, 0.163299560546875, 0.17919921875, 0.195098876953125, 0.21099853515625, 0.226898193359375, 0.2427978515625, 0.258697509765625, 0.27459716796875, 0.290496826171875, 0.306396484375, 0.322296142578125, 0.33819580078125, 0.354095458984375, 0.3699951171875, 0.385894775390625, 0.40179443359375, 0.417694091796875, 0.43359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 11.0, 6.0, 9.0, 24.0, 33.0, 48.0, 63.0, 112.0, 104.0, 115.0, 132.0, 112.0, 77.0, 48.0, 33.0, 39.0, 20.0, 5.0, 10.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.373046875, -2.298126220703125, -2.22320556640625, -2.148284912109375, -2.0733642578125, -1.998443603515625, -1.92352294921875, -1.848602294921875, -1.773681640625, -1.698760986328125, -1.62384033203125, -1.548919677734375, -1.4739990234375, -1.399078369140625, -1.32415771484375, -1.249237060546875, -1.17431640625, -1.099395751953125, -1.02447509765625, -0.949554443359375, -0.8746337890625, -0.799713134765625, -0.72479248046875, -0.649871826171875, -0.574951171875, -0.500030517578125, -0.42510986328125, -0.350189208984375, -0.2752685546875, -0.200347900390625, -0.12542724609375, -0.050506591796875, 0.0244140625, 0.099334716796875, 0.17425537109375, 0.249176025390625, 0.3240966796875, 0.399017333984375, 0.47393798828125, 0.548858642578125, 0.623779296875, 0.698699951171875, 0.77362060546875, 0.848541259765625, 0.9234619140625, 0.998382568359375, 1.07330322265625, 1.148223876953125, 1.22314453125, 1.298065185546875, 1.37298583984375, 1.447906494140625, 1.5228271484375, 1.597747802734375, 1.67266845703125, 1.747589111328125, 1.822509765625, 1.897430419921875, 1.97235107421875, 2.047271728515625, 2.1221923828125, 2.197113037109375, 2.27203369140625, 2.346954345703125, 2.421875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 3.0, 6.0, 9.0, 5.0, 7.0, 11.0, 9.0, 22.0, 31.0, 40.0, 47.0, 62.0, 104.0, 143.0, 231.0, 556.0, 1984.0, 14640.0, 872857.0, 149806.0, 5831.0, 1138.0, 383.0, 210.0, 112.0, 91.0, 49.0, 44.0, 35.0, 26.0, 18.0, 10.0, 5.0, 11.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1103515625, -1.0775070190429688, -1.0446624755859375, -1.0118179321289062, -0.978973388671875, -0.9461288452148438, -0.9132843017578125, -0.8804397583007812, -0.84759521484375, -0.8147506713867188, -0.7819061279296875, -0.7490615844726562, -0.716217041015625, -0.6833724975585938, -0.6505279541015625, -0.6176834106445312, -0.5848388671875, -0.5519943237304688, -0.5191497802734375, -0.48630523681640625, -0.453460693359375, -0.42061614990234375, -0.3877716064453125, -0.35492706298828125, -0.32208251953125, -0.28923797607421875, -0.2563934326171875, -0.22354888916015625, -0.190704345703125, -0.15785980224609375, -0.1250152587890625, -0.09217071533203125, -0.059326171875, -0.02648162841796875, 0.0063629150390625, 0.03920745849609375, 0.072052001953125, 0.10489654541015625, 0.1377410888671875, 0.17058563232421875, 0.20343017578125, 0.23627471923828125, 0.2691192626953125, 0.30196380615234375, 0.334808349609375, 0.36765289306640625, 0.4004974365234375, 0.43334197998046875, 0.4661865234375, 0.49903106689453125, 0.5318756103515625, 0.5647201538085938, 0.597564697265625, 0.6304092407226562, 0.6632537841796875, 0.6960983276367188, 0.72894287109375, 0.7617874145507812, 0.7946319580078125, 0.8274765014648438, 0.860321044921875, 0.8931655883789062, 0.9260101318359375, 0.9588546752929688, 0.99169921875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 2.0, 7.0, 14.0, 15.0, 23.0, 20.0, 27.0, 37.0, 38.0, 47.0, 55.0, 77.0, 72.0, 68.0, 85.0, 79.0, 49.0, 46.0, 48.0, 37.0, 26.0, 29.0, 21.0, 18.0, 10.0, 8.0, 7.0, 6.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.984375, -1.922027587890625, -1.85968017578125, -1.797332763671875, -1.7349853515625, -1.672637939453125, -1.61029052734375, -1.547943115234375, -1.485595703125, -1.423248291015625, -1.36090087890625, -1.298553466796875, -1.2362060546875, -1.173858642578125, -1.11151123046875, -1.049163818359375, -0.98681640625, -0.924468994140625, -0.86212158203125, -0.799774169921875, -0.7374267578125, -0.675079345703125, -0.61273193359375, -0.550384521484375, -0.488037109375, -0.425689697265625, -0.36334228515625, -0.300994873046875, -0.2386474609375, -0.176300048828125, -0.11395263671875, -0.051605224609375, 0.0107421875, 0.073089599609375, 0.13543701171875, 0.197784423828125, 0.2601318359375, 0.322479248046875, 0.38482666015625, 0.447174072265625, 0.509521484375, 0.571868896484375, 0.63421630859375, 0.696563720703125, 0.7589111328125, 0.821258544921875, 0.88360595703125, 0.945953369140625, 1.00830078125, 1.070648193359375, 1.13299560546875, 1.195343017578125, 1.2576904296875, 1.320037841796875, 1.38238525390625, 1.444732666015625, 1.507080078125, 1.569427490234375, 1.63177490234375, 1.694122314453125, 1.7564697265625, 1.818817138671875, 1.88116455078125, 1.943511962890625, 2.005859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 7.0, 5.0, 7.0, 10.0, 12.0, 18.0, 15.0, 26.0, 68.0, 140.0, 317.0, 831.0, 2530.0, 10796.0, 165684.0, 837320.0, 24458.0, 4136.0, 1224.0, 475.0, 245.0, 115.0, 43.0, 24.0, 11.0, 18.0, 7.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.36474609375, -0.3554401397705078, -0.3461341857910156, -0.33682823181152344, -0.32752227783203125, -0.31821632385253906, -0.3089103698730469, -0.2996044158935547, -0.2902984619140625, -0.2809925079345703, -0.2716865539550781, -0.26238059997558594, -0.25307464599609375, -0.24376869201660156, -0.23446273803710938, -0.2251567840576172, -0.215850830078125, -0.2065448760986328, -0.19723892211914062, -0.18793296813964844, -0.17862701416015625, -0.16932106018066406, -0.16001510620117188, -0.1507091522216797, -0.1414031982421875, -0.1320972442626953, -0.12279129028320312, -0.11348533630371094, -0.10417938232421875, -0.09487342834472656, -0.08556747436523438, -0.07626152038574219, -0.06695556640625, -0.05764961242675781, -0.048343658447265625, -0.03903770446777344, -0.02973175048828125, -0.020425796508789062, -0.011119842529296875, -0.0018138885498046875, 0.0074920654296875, 0.016798019409179688, 0.026103973388671875, 0.03540992736816406, 0.04471588134765625, 0.05402183532714844, 0.06332778930664062, 0.07263374328613281, 0.081939697265625, 0.09124565124511719, 0.10055160522460938, 0.10985755920410156, 0.11916351318359375, 0.12846946716308594, 0.13777542114257812, 0.1470813751220703, 0.1563873291015625, 0.1656932830810547, 0.17499923706054688, 0.18430519104003906, 0.19361114501953125, 0.20291709899902344, 0.21222305297851562, 0.2215290069580078, 0.2308349609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 8.0, 16.0, 15.0, 58.0, 105.0, 232.0, 288.0, 119.0, 49.0, 37.0, 20.0, 12.0, 12.0, 6.0, 2.0, 5.0, 1.0, 4.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7358531951904297e-05, -2.627260982990265e-05, -2.5186687707901e-05, -2.4100765585899353e-05, -2.3014843463897705e-05, -2.1928921341896057e-05, -2.084299921989441e-05, -1.975707709789276e-05, -1.8671154975891113e-05, -1.7585232853889465e-05, -1.6499310731887817e-05, -1.541338860988617e-05, -1.4327466487884521e-05, -1.3241544365882874e-05, -1.2155622243881226e-05, -1.1069700121879578e-05, -9.98377799987793e-06, -8.897855877876282e-06, -7.811933755874634e-06, -6.726011633872986e-06, -5.640089511871338e-06, -4.55416738986969e-06, -3.468245267868042e-06, -2.382323145866394e-06, -1.296401023864746e-06, -2.1047890186309814e-07, 8.754432201385498e-07, 1.9613653421401978e-06, 3.0472874641418457e-06, 4.133209586143494e-06, 5.219131708145142e-06, 6.3050538301467896e-06, 7.3909759521484375e-06, 8.476898074150085e-06, 9.562820196151733e-06, 1.0648742318153381e-05, 1.173466444015503e-05, 1.2820586562156677e-05, 1.3906508684158325e-05, 1.4992430806159973e-05, 1.607835292816162e-05, 1.716427505016327e-05, 1.8250197172164917e-05, 1.9336119294166565e-05, 2.0422041416168213e-05, 2.150796353816986e-05, 2.259388566017151e-05, 2.3679807782173157e-05, 2.4765729904174805e-05, 2.5851652026176453e-05, 2.69375741481781e-05, 2.802349627017975e-05, 2.9109418392181396e-05, 3.0195340514183044e-05, 3.128126263618469e-05, 3.236718475818634e-05, 3.345310688018799e-05, 3.4539029002189636e-05, 3.5624951124191284e-05, 3.671087324619293e-05, 3.779679536819458e-05, 3.888271749019623e-05, 3.9968639612197876e-05, 4.1054561734199524e-05, 4.214048385620117e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 8.0, 4.0, 14.0, 14.0, 32.0, 40.0, 67.0, 137.0, 301.0, 695.0, 1947.0, 7175.0, 59094.0, 922962.0, 46696.0, 6291.0, 1834.0, 650.0, 288.0, 151.0, 58.0, 31.0, 23.0, 12.0, 11.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.286865234375, -0.27602386474609375, -0.2651824951171875, -0.25434112548828125, -0.243499755859375, -0.23265838623046875, -0.2218170166015625, -0.21097564697265625, -0.20013427734375, -0.18929290771484375, -0.1784515380859375, -0.16761016845703125, -0.156768798828125, -0.14592742919921875, -0.1350860595703125, -0.12424468994140625, -0.1134033203125, -0.10256195068359375, -0.0917205810546875, -0.08087921142578125, -0.070037841796875, -0.05919647216796875, -0.0483551025390625, -0.03751373291015625, -0.02667236328125, -0.01583099365234375, -0.0049896240234375, 0.00585174560546875, 0.016693115234375, 0.02753448486328125, 0.0383758544921875, 0.04921722412109375, 0.06005859375, 0.07089996337890625, 0.0817413330078125, 0.09258270263671875, 0.103424072265625, 0.11426544189453125, 0.1251068115234375, 0.13594818115234375, 0.14678955078125, 0.15763092041015625, 0.1684722900390625, 0.17931365966796875, 0.190155029296875, 0.20099639892578125, 0.2118377685546875, 0.22267913818359375, 0.2335205078125, 0.24436187744140625, 0.2552032470703125, 0.26604461669921875, 0.276885986328125, 0.28772735595703125, 0.2985687255859375, 0.30941009521484375, 0.32025146484375, 0.33109283447265625, 0.3419342041015625, 0.35277557373046875, 0.363616943359375, 0.37445831298828125, 0.3852996826171875, 0.39614105224609375, 0.406982421875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 7.0, 5.0, 2.0, 9.0, 0.0, 12.0, 12.0, 13.0, 27.0, 40.0, 66.0, 139.0, 250.0, 187.0, 83.0, 52.0, 30.0, 25.0, 8.0, 5.0, 4.0, 11.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1339111328125, -0.13035297393798828, -0.12679481506347656, -0.12323665618896484, -0.11967849731445312, -0.1161203384399414, -0.11256217956542969, -0.10900402069091797, -0.10544586181640625, -0.10188770294189453, -0.09832954406738281, -0.0947713851928711, -0.09121322631835938, -0.08765506744384766, -0.08409690856933594, -0.08053874969482422, -0.0769805908203125, -0.07342243194580078, -0.06986427307128906, -0.06630611419677734, -0.06274795532226562, -0.059189796447753906, -0.05563163757324219, -0.05207347869873047, -0.04851531982421875, -0.04495716094970703, -0.04139900207519531, -0.037840843200683594, -0.034282684326171875, -0.030724525451660156, -0.027166366577148438, -0.02360820770263672, -0.020050048828125, -0.01649188995361328, -0.012933731079101562, -0.009375572204589844, -0.005817413330078125, -0.0022592544555664062, 0.0012989044189453125, 0.004857063293457031, 0.00841522216796875, 0.011973381042480469, 0.015531539916992188, 0.019089698791503906, 0.022647857666015625, 0.026206016540527344, 0.029764175415039062, 0.03332233428955078, 0.0368804931640625, 0.04043865203857422, 0.04399681091308594, 0.047554969787597656, 0.051113128662109375, 0.054671287536621094, 0.05822944641113281, 0.06178760528564453, 0.06534576416015625, 0.06890392303466797, 0.07246208190917969, 0.0760202407836914, 0.07957839965820312, 0.08313655853271484, 0.08669471740722656, 0.09025287628173828, 0.09381103515625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 10.0, 43.0, 237.0, 500.0, 183.0, 25.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1378190517425537, -2.9339663982391357, -2.7301137447357178, -2.5262610912323, -2.322408437728882, -2.118556022644043, -1.9147032499313354, -1.7108505964279175, -1.5069979429244995, -1.3031452894210815, -1.0992926359176636, -0.8954400420188904, -0.6915873885154724, -0.4877347946166992, -0.28388214111328125, -0.08002948760986328, 0.12382316589355469, 0.32767581939697266, 0.5315284729003906, 0.7353810667991638, 0.9392337203025818, 1.143086314201355, 1.346938967704773, 1.550791621208191, 1.7546442747116089, 1.9584969282150269, 2.1623494625091553, 2.3662021160125732, 2.570054769515991, 2.773907423019409, 2.977760076522827, 3.181612730026245, 3.385465145111084, 3.589317798614502, 3.79317045211792, 3.997023105621338, 4.200875759124756, 4.404728412628174, 4.608581066131592, 4.81243371963501, 5.016286373138428, 5.220139026641846, 5.423991680145264, 5.627844333648682, 5.8316969871521, 6.035549640655518, 6.2394022941589355, 6.4432549476623535, 6.647107124328613, 6.850959777832031, 7.054812431335449, 7.258665084838867, 7.462517738342285, 7.666370391845703, 7.870223045349121, 8.074075698852539, 8.277928352355957, 8.481781005859375, 8.685633659362793, 8.889486312866211, 9.093338966369629, 9.297191619873047, 9.501044273376465, 9.704896926879883, 9.9087495803833]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 4.0, 12.0, 13.0, 32.0, 23.0, 37.0, 66.0, 56.0, 70.0, 78.0, 93.0, 88.0, 76.0, 81.0, 76.0, 46.0, 44.0, 39.0, 29.0, 13.0, 8.0, 14.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.445219993591309, -5.270247459411621, -5.095274925231934, -4.920302391052246, -4.745329856872559, -4.570357322692871, -4.395384788513184, -4.220412254333496, -4.045439720153809, -3.870467185974121, -3.6954946517944336, -3.520522117614746, -3.3455495834350586, -3.170577049255371, -2.9956042766571045, -2.820631742477417, -2.6456589698791504, -2.470686435699463, -2.2957139015197754, -2.120741367340088, -1.9457687139511108, -1.7707961797714233, -1.5958235263824463, -1.4208509922027588, -1.2458784580230713, -1.0709059238433838, -0.8959333300590515, -0.7209607362747192, -0.5459882020950317, -0.37101566791534424, -0.1960430145263672, -0.021070480346679688, 0.15390253067016602, 0.3288750946521759, 0.5038476586341858, 0.6788202524185181, 0.8537927865982056, 1.028765320777893, 1.2037379741668701, 1.3787105083465576, 1.5536830425262451, 1.7286555767059326, 1.9036281108856201, 2.0786008834838867, 2.253573417663574, 2.4285459518432617, 2.603518486022949, 2.7784910202026367, 2.953463554382324, 3.1284360885620117, 3.303408622741699, 3.4783811569213867, 3.653353691101074, 3.8283262252807617, 4.003298759460449, 4.178271293640137, 4.353243827819824, 4.528216361999512, 4.703188896179199, 4.878161430358887, 5.053133964538574, 5.228106498718262, 5.403079032897949, 5.578051567077637, 5.753024578094482]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 12.0, 8.0, 23.0, 17.0, 31.0, 62.0, 129.0, 246.0, 569.0, 1307.0, 2722.0, 6664.0, 39456.0, 1394264.0, 2671382.0, 63660.0, 8987.0, 2752.0, 1013.0, 420.0, 233.0, 122.0, 81.0, 41.0, 28.0, 14.0, 10.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4580078125, -1.406097412109375, -1.35418701171875, -1.302276611328125, -1.2503662109375, -1.198455810546875, -1.14654541015625, -1.094635009765625, -1.042724609375, -0.990814208984375, -0.93890380859375, -0.886993408203125, -0.8350830078125, -0.783172607421875, -0.73126220703125, -0.679351806640625, -0.62744140625, -0.575531005859375, -0.52362060546875, -0.471710205078125, -0.4197998046875, -0.367889404296875, -0.31597900390625, -0.264068603515625, -0.212158203125, -0.160247802734375, -0.10833740234375, -0.056427001953125, -0.0045166015625, 0.047393798828125, 0.09930419921875, 0.151214599609375, 0.203125, 0.255035400390625, 0.30694580078125, 0.358856201171875, 0.4107666015625, 0.462677001953125, 0.51458740234375, 0.566497802734375, 0.618408203125, 0.670318603515625, 0.72222900390625, 0.774139404296875, 0.8260498046875, 0.877960205078125, 0.92987060546875, 0.981781005859375, 1.03369140625, 1.085601806640625, 1.13751220703125, 1.189422607421875, 1.2413330078125, 1.293243408203125, 1.34515380859375, 1.397064208984375, 1.448974609375, 1.500885009765625, 1.55279541015625, 1.604705810546875, 1.6566162109375, 1.708526611328125, 1.76043701171875, 1.812347412109375, 1.8642578125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 11.0, 16.0, 34.0, 76.0, 129.0, 159.0, 174.0, 165.0, 105.0, 58.0, 30.0, 24.0, 8.0, 2.0, 1.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5576171875, -1.5006561279296875, -1.443695068359375, -1.3867340087890625, -1.32977294921875, -1.2728118896484375, -1.215850830078125, -1.1588897705078125, -1.1019287109375, -1.0449676513671875, -0.988006591796875, -0.9310455322265625, -0.87408447265625, -0.8171234130859375, -0.760162353515625, -0.7032012939453125, -0.646240234375, -0.5892791748046875, -0.532318115234375, -0.4753570556640625, -0.41839599609375, -0.3614349365234375, -0.304473876953125, -0.2475128173828125, -0.1905517578125, -0.1335906982421875, -0.076629638671875, -0.0196685791015625, 0.03729248046875, 0.0942535400390625, 0.151214599609375, 0.2081756591796875, 0.26513671875, 0.3220977783203125, 0.379058837890625, 0.4360198974609375, 0.49298095703125, 0.5499420166015625, 0.606903076171875, 0.6638641357421875, 0.7208251953125, 0.7777862548828125, 0.834747314453125, 0.8917083740234375, 0.94866943359375, 1.0056304931640625, 1.062591552734375, 1.1195526123046875, 1.176513671875, 1.2334747314453125, 1.290435791015625, 1.3473968505859375, 1.40435791015625, 1.4613189697265625, 1.518280029296875, 1.5752410888671875, 1.6322021484375, 1.6891632080078125, 1.746124267578125, 1.8030853271484375, 1.86004638671875, 1.9170074462890625, 1.973968505859375, 2.0309295654296875, 2.087890625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 5.0, 2.0, 12.0, 17.0, 16.0, 22.0, 28.0, 48.0, 76.0, 96.0, 262.0, 541.0, 1470.0, 4520.0, 21307.0, 364293.0, 3730248.0, 59039.0, 8425.0, 2280.0, 839.0, 324.0, 167.0, 83.0, 50.0, 32.0, 19.0, 12.0, 8.0, 8.0, 6.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.7373046875, -1.689361572265625, -1.64141845703125, -1.593475341796875, -1.5455322265625, -1.497589111328125, -1.44964599609375, -1.401702880859375, -1.353759765625, -1.305816650390625, -1.25787353515625, -1.209930419921875, -1.1619873046875, -1.114044189453125, -1.06610107421875, -1.018157958984375, -0.97021484375, -0.922271728515625, -0.87432861328125, -0.826385498046875, -0.7784423828125, -0.730499267578125, -0.68255615234375, -0.634613037109375, -0.586669921875, -0.538726806640625, -0.49078369140625, -0.442840576171875, -0.3948974609375, -0.346954345703125, -0.29901123046875, -0.251068115234375, -0.203125, -0.155181884765625, -0.10723876953125, -0.059295654296875, -0.0113525390625, 0.036590576171875, 0.08453369140625, 0.132476806640625, 0.180419921875, 0.228363037109375, 0.27630615234375, 0.324249267578125, 0.3721923828125, 0.420135498046875, 0.46807861328125, 0.516021728515625, 0.56396484375, 0.611907958984375, 0.65985107421875, 0.707794189453125, 0.7557373046875, 0.803680419921875, 0.85162353515625, 0.899566650390625, 0.947509765625, 0.995452880859375, 1.04339599609375, 1.091339111328125, 1.1392822265625, 1.187225341796875, 1.23516845703125, 1.283111572265625, 1.3310546875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 1.0, 11.0, 8.0, 12.0, 18.0, 27.0, 31.0, 69.0, 122.0, 286.0, 845.0, 1378.0, 722.0, 244.0, 109.0, 67.0, 31.0, 22.0, 12.0, 13.0, 11.0, 7.0, 2.0, 8.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.385986328125, -0.3723945617675781, -0.35880279541015625, -0.3452110290527344, -0.3316192626953125, -0.3180274963378906, -0.30443572998046875, -0.2908439636230469, -0.277252197265625, -0.2636604309082031, -0.25006866455078125, -0.23647689819335938, -0.2228851318359375, -0.20929336547851562, -0.19570159912109375, -0.18210983276367188, -0.16851806640625, -0.15492630004882812, -0.14133453369140625, -0.12774276733398438, -0.1141510009765625, -0.10055923461914062, -0.08696746826171875, -0.07337570190429688, -0.059783935546875, -0.046192169189453125, -0.03260040283203125, -0.019008636474609375, -0.0054168701171875, 0.008174896240234375, 0.02176666259765625, 0.035358428955078125, 0.0489501953125, 0.06254196166992188, 0.07613372802734375, 0.08972549438476562, 0.1033172607421875, 0.11690902709960938, 0.13050079345703125, 0.14409255981445312, 0.157684326171875, 0.17127609252929688, 0.18486785888671875, 0.19845962524414062, 0.2120513916015625, 0.22564315795898438, 0.23923492431640625, 0.2528266906738281, 0.26641845703125, 0.2800102233886719, 0.29360198974609375, 0.3071937561035156, 0.3207855224609375, 0.3343772888183594, 0.34796905517578125, 0.3615608215332031, 0.375152587890625, 0.3887443542480469, 0.40233612060546875, 0.4159278869628906, 0.4295196533203125, 0.4431114196777344, 0.45670318603515625, 0.4702949523925781, 0.48388671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 15.0, 17.0, 48.0, 79.0, 153.0, 237.0, 194.0, 123.0, 62.0, 44.0, 15.0, 7.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1634411811828613, -2.1013851165771484, -2.0393290519714355, -1.9772731065750122, -1.9152171611785889, -1.853161096572876, -1.791105031967163, -1.7290490865707397, -1.6669931411743164, -1.6049370765686035, -1.5428811311721802, -1.4808250665664673, -1.418769121170044, -1.356713056564331, -1.2946569919586182, -1.2326010465621948, -1.170544981956482, -1.108488917350769, -1.0464329719543457, -0.9843769073486328, -0.9223209619522095, -0.8602648973464966, -0.7982088923454285, -0.7361528873443604, -0.6740968823432922, -0.6120408773422241, -0.549984872341156, -0.4879288375377655, -0.4258728325366974, -0.3638168275356293, -0.30176079273223877, -0.23970478773117065, -0.17764878273010254, -0.11559277027845383, -0.053536757826805115, 0.008519262075424194, 0.07057526707649231, 0.13263127207756042, 0.19468730688095093, 0.25674331188201904, 0.31879931688308716, 0.3808553218841553, 0.4429113268852234, 0.5049673318862915, 0.5670233964920044, 0.6290793418884277, 0.6911354064941406, 0.7531914114952087, 0.8152474164962769, 0.877303421497345, 0.9393594264984131, 1.001415491104126, 1.0634714365005493, 1.1255275011062622, 1.1875834465026855, 1.2496395111083984, 1.3116955757141113, 1.3737516403198242, 1.4358075857162476, 1.4978636503219604, 1.5599195957183838, 1.6219756603240967, 1.6840317249298096, 1.746087670326233, 1.8081436157226562]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 9.0, 21.0, 24.0, 47.0, 67.0, 93.0, 117.0, 144.0, 139.0, 105.0, 96.0, 63.0, 35.0, 24.0, 14.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7203772068023682, -1.662180781364441, -1.6039842367172241, -1.5457878112792969, -1.4875913858413696, -1.4293949604034424, -1.3711984157562256, -1.3130019903182983, -1.254805564880371, -1.1966091394424438, -1.138412594795227, -1.0802161693572998, -1.0220197439193726, -0.9638232588768005, -0.9056267738342285, -0.8474303483963013, -0.7892338633537292, -0.7310373783111572, -0.67284095287323, -0.614644467830658, -0.5564480423927307, -0.4982515573501587, -0.44005510210990906, -0.3818586468696594, -0.3236621916294098, -0.26546573638916016, -0.20726928114891052, -0.1490728110074997, -0.09087635576725006, -0.03267988562583923, 0.0255165696144104, 0.08371302485466003, 0.14190948009490967, 0.2001059353351593, 0.25830239057540894, 0.31649887561798096, 0.3746953010559082, 0.4328917860984802, 0.49108824133872986, 0.5492846965789795, 0.6074811220169067, 0.6656776070594788, 0.723874032497406, 0.782070517539978, 0.8402669429779053, 0.8984634280204773, 0.9566599130630493, 1.0148563385009766, 1.0730528831481934, 1.1312493085861206, 1.1894458532333374, 1.2476422786712646, 1.305838704109192, 1.3640351295471191, 1.422231674194336, 1.4804280996322632, 1.5386245250701904, 1.5968209505081177, 1.6550174951553345, 1.7132139205932617, 1.771410346031189, 1.8296067714691162, 1.887803316116333, 1.9459997415542603, 2.0041961669921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 8.0, 9.0, 18.0, 22.0, 31.0, 44.0, 82.0, 119.0, 238.0, 558.0, 1660.0, 10900.0, 207370.0, 782812.0, 39182.0, 3767.0, 923.0, 370.0, 203.0, 93.0, 38.0, 37.0, 29.0, 22.0, 12.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3349609375, -0.3238868713378906, -0.31281280517578125, -0.3017387390136719, -0.2906646728515625, -0.2795906066894531, -0.26851654052734375, -0.2574424743652344, -0.246368408203125, -0.23529434204101562, -0.22422027587890625, -0.21314620971679688, -0.2020721435546875, -0.19099807739257812, -0.17992401123046875, -0.16884994506835938, -0.15777587890625, -0.14670181274414062, -0.13562774658203125, -0.12455368041992188, -0.1134796142578125, -0.10240554809570312, -0.09133148193359375, -0.08025741577148438, -0.069183349609375, -0.058109283447265625, -0.04703521728515625, -0.035961151123046875, -0.0248870849609375, -0.013813018798828125, -0.00273895263671875, 0.008335113525390625, 0.0194091796875, 0.030483245849609375, 0.04155731201171875, 0.052631378173828125, 0.0637054443359375, 0.07477951049804688, 0.08585357666015625, 0.09692764282226562, 0.108001708984375, 0.11907577514648438, 0.13014984130859375, 0.14122390747070312, 0.1522979736328125, 0.16337203979492188, 0.17444610595703125, 0.18552017211914062, 0.19659423828125, 0.20766830444335938, 0.21874237060546875, 0.22981643676757812, 0.2408905029296875, 0.2519645690917969, 0.26303863525390625, 0.2741127014160156, 0.285186767578125, 0.2962608337402344, 0.30733489990234375, 0.3184089660644531, 0.3294830322265625, 0.3405570983886719, 0.35163116455078125, 0.3627052307128906, 0.373779296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 18.0, 21.0, 47.0, 78.0, 114.0, 165.0, 162.0, 133.0, 114.0, 74.0, 34.0, 25.0, 10.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.310546875, -1.265838623046875, -1.22113037109375, -1.176422119140625, -1.1317138671875, -1.087005615234375, -1.04229736328125, -0.997589111328125, -0.952880859375, -0.908172607421875, -0.86346435546875, -0.818756103515625, -0.7740478515625, -0.729339599609375, -0.68463134765625, -0.639923095703125, -0.59521484375, -0.550506591796875, -0.50579833984375, -0.461090087890625, -0.4163818359375, -0.371673583984375, -0.32696533203125, -0.282257080078125, -0.237548828125, -0.192840576171875, -0.14813232421875, -0.103424072265625, -0.0587158203125, -0.014007568359375, 0.03070068359375, 0.075408935546875, 0.1201171875, 0.164825439453125, 0.20953369140625, 0.254241943359375, 0.2989501953125, 0.343658447265625, 0.38836669921875, 0.433074951171875, 0.477783203125, 0.522491455078125, 0.56719970703125, 0.611907958984375, 0.6566162109375, 0.701324462890625, 0.74603271484375, 0.790740966796875, 0.83544921875, 0.880157470703125, 0.92486572265625, 0.969573974609375, 1.0142822265625, 1.058990478515625, 1.10369873046875, 1.148406982421875, 1.193115234375, 1.237823486328125, 1.28253173828125, 1.327239990234375, 1.3719482421875, 1.416656494140625, 1.46136474609375, 1.506072998046875, 1.55078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 6.0, 10.0, 13.0, 26.0, 37.0, 70.0, 77.0, 156.0, 253.0, 434.0, 708.0, 1284.0, 2321.0, 4459.0, 8655.0, 18191.0, 39856.0, 93541.0, 215917.0, 319313.0, 191849.0, 82023.0, 35745.0, 16358.0, 7943.0, 4125.0, 2184.0, 1258.0, 697.0, 396.0, 228.0, 159.0, 90.0, 62.0, 31.0, 29.0, 19.0, 8.0, 9.0, 5.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06646728515625, -0.06435203552246094, -0.062236785888671875, -0.06012153625488281, -0.05800628662109375, -0.05589103698730469, -0.053775787353515625, -0.05166053771972656, -0.0495452880859375, -0.04743003845214844, -0.045314788818359375, -0.04319953918457031, -0.04108428955078125, -0.03896903991699219, -0.036853790283203125, -0.03473854064941406, -0.032623291015625, -0.030508041381835938, -0.028392791748046875, -0.026277542114257812, -0.02416229248046875, -0.022047042846679688, -0.019931793212890625, -0.017816543579101562, -0.0157012939453125, -0.013586044311523438, -0.011470794677734375, -0.009355545043945312, -0.00724029541015625, -0.0051250457763671875, -0.003009796142578125, -0.0008945465087890625, 0.001220703125, 0.0033359527587890625, 0.005451202392578125, 0.0075664520263671875, 0.00968170166015625, 0.011796951293945312, 0.013912200927734375, 0.016027450561523438, 0.0181427001953125, 0.020257949829101562, 0.022373199462890625, 0.024488449096679688, 0.02660369873046875, 0.028718948364257812, 0.030834197998046875, 0.03294944763183594, 0.035064697265625, 0.03717994689941406, 0.039295196533203125, 0.04141044616699219, 0.04352569580078125, 0.04564094543457031, 0.047756195068359375, 0.04987144470214844, 0.0519866943359375, 0.05410194396972656, 0.056217193603515625, 0.05833244323730469, 0.06044769287109375, 0.06256294250488281, 0.06467819213867188, 0.06679344177246094, 0.06890869140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 12.0, 8.0, 5.0, 16.0, 13.0, 23.0, 26.0, 28.0, 22.0, 30.0, 44.0, 44.0, 53.0, 48.0, 48.0, 51.0, 56.0, 50.0, 58.0, 45.0, 39.0, 35.0, 36.0, 38.0, 38.0, 18.0, 19.0, 17.0, 16.0, 13.0, 10.0, 10.0, 7.0, 1.0, 7.0, 0.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.98876953125, -0.9577560424804688, -0.9267425537109375, -0.8957290649414062, -0.864715576171875, -0.8337020874023438, -0.8026885986328125, -0.7716751098632812, -0.74066162109375, -0.7096481323242188, -0.6786346435546875, -0.6476211547851562, -0.616607666015625, -0.5855941772460938, -0.5545806884765625, -0.5235671997070312, -0.4925537109375, -0.46154022216796875, -0.4305267333984375, -0.39951324462890625, -0.368499755859375, -0.33748626708984375, -0.3064727783203125, -0.27545928955078125, -0.24444580078125, -0.21343231201171875, -0.1824188232421875, -0.15140533447265625, -0.120391845703125, -0.08937835693359375, -0.0583648681640625, -0.02735137939453125, 0.003662109375, 0.03467559814453125, 0.0656890869140625, 0.09670257568359375, 0.127716064453125, 0.15872955322265625, 0.1897430419921875, 0.22075653076171875, 0.25177001953125, 0.28278350830078125, 0.3137969970703125, 0.34481048583984375, 0.375823974609375, 0.40683746337890625, 0.4378509521484375, 0.46886444091796875, 0.4998779296875, 0.5308914184570312, 0.5619049072265625, 0.5929183959960938, 0.623931884765625, 0.6549453735351562, 0.6859588623046875, 0.7169723510742188, 0.74798583984375, 0.7789993286132812, 0.8100128173828125, 0.8410263061523438, 0.872039794921875, 0.9030532836914062, 0.9340667724609375, 0.9650802612304688, 0.99609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 7.0, 8.0, 7.0, 16.0, 24.0, 22.0, 31.0, 57.0, 83.0, 121.0, 163.0, 292.0, 507.0, 824.0, 1526.0, 2874.0, 6087.0, 15554.0, 55783.0, 308078.0, 513346.0, 102357.0, 24354.0, 8216.0, 3707.0, 1929.0, 1044.0, 571.0, 315.0, 195.0, 133.0, 83.0, 60.0, 55.0, 25.0, 27.0, 19.0, 15.0, 11.0, 8.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.008270263671875, -0.007996320724487305, -0.007722377777099609, -0.007448434829711914, -0.007174491882324219, -0.0069005489349365234, -0.006626605987548828, -0.006352663040161133, -0.0060787200927734375, -0.005804777145385742, -0.005530834197998047, -0.0052568912506103516, -0.004982948303222656, -0.004709005355834961, -0.004435062408447266, -0.00416111946105957, -0.003887176513671875, -0.0036132335662841797, -0.0033392906188964844, -0.003065347671508789, -0.0027914047241210938, -0.0025174617767333984, -0.002243518829345703, -0.001969575881958008, -0.0016956329345703125, -0.0014216899871826172, -0.0011477470397949219, -0.0008738040924072266, -0.0005998611450195312, -0.00032591819763183594, -5.1975250244140625e-05, 0.0002219676971435547, 0.00049591064453125, 0.0007698535919189453, 0.0010437965393066406, 0.001317739486694336, 0.0015916824340820312, 0.0018656253814697266, 0.002139568328857422, 0.002413511276245117, 0.0026874542236328125, 0.002961397171020508, 0.003235340118408203, 0.0035092830657958984, 0.0037832260131835938, 0.004057168960571289, 0.004331111907958984, 0.00460505485534668, 0.004878997802734375, 0.00515294075012207, 0.005426883697509766, 0.005700826644897461, 0.005974769592285156, 0.0062487125396728516, 0.006522655487060547, 0.006796598434448242, 0.0070705413818359375, 0.007344484329223633, 0.007618427276611328, 0.007892370223999023, 0.008166313171386719, 0.008440256118774414, 0.00871419906616211, 0.008988142013549805, 0.0092620849609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 3.0, 9.0, 16.0, 12.0, 26.0, 37.0, 53.0, 61.0, 110.0, 119.0, 103.0, 107.0, 98.0, 68.0, 60.0, 39.0, 16.0, 19.0, 14.0, 8.0, 6.0, 7.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1205673217773438e-05, -1.0625459253787994e-05, -1.0045245289802551e-05, -9.465031325817108e-06, -8.884817361831665e-06, -8.304603397846222e-06, -7.724389433860779e-06, -7.144175469875336e-06, -6.563961505889893e-06, -5.9837475419044495e-06, -5.403533577919006e-06, -4.823319613933563e-06, -4.24310564994812e-06, -3.662891685962677e-06, -3.082677721977234e-06, -2.5024637579917908e-06, -1.9222497940063477e-06, -1.3420358300209045e-06, -7.618218660354614e-07, -1.816079020500183e-07, 3.986060619354248e-07, 9.78820025920868e-07, 1.559033989906311e-06, 2.139247953891754e-06, 2.7194619178771973e-06, 3.2996758818626404e-06, 3.8798898458480835e-06, 4.460103809833527e-06, 5.04031777381897e-06, 5.620531737804413e-06, 6.200745701789856e-06, 6.780959665775299e-06, 7.361173629760742e-06, 7.941387593746185e-06, 8.521601557731628e-06, 9.101815521717072e-06, 9.682029485702515e-06, 1.0262243449687958e-05, 1.0842457413673401e-05, 1.1422671377658844e-05, 1.2002885341644287e-05, 1.258309930562973e-05, 1.3163313269615173e-05, 1.3743527233600616e-05, 1.432374119758606e-05, 1.4903955161571503e-05, 1.5484169125556946e-05, 1.606438308954239e-05, 1.6644597053527832e-05, 1.7224811017513275e-05, 1.7805024981498718e-05, 1.838523894548416e-05, 1.8965452909469604e-05, 1.9545666873455048e-05, 2.012588083744049e-05, 2.0706094801425934e-05, 2.1286308765411377e-05, 2.186652272939682e-05, 2.2446736693382263e-05, 2.3026950657367706e-05, 2.360716462135315e-05, 2.4187378585338593e-05, 2.4767592549324036e-05, 2.534780651330948e-05, 2.5928020477294922e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 6.0, 7.0, 14.0, 8.0, 25.0, 20.0, 34.0, 40.0, 42.0, 82.0, 126.0, 238.0, 515.0, 1358.0, 4143.0, 17088.0, 119945.0, 776137.0, 106342.0, 15984.0, 3994.0, 1236.0, 507.0, 243.0, 128.0, 78.0, 61.0, 38.0, 32.0, 18.0, 20.0, 15.0, 10.0, 6.0, 7.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01409149169921875, -0.013596653938293457, -0.013101816177368164, -0.012606978416442871, -0.012112140655517578, -0.011617302894592285, -0.011122465133666992, -0.0106276273727417, -0.010132789611816406, -0.009637951850891113, -0.00914311408996582, -0.008648276329040527, -0.008153438568115234, -0.007658600807189941, -0.0071637630462646484, -0.0066689252853393555, -0.0061740875244140625, -0.0056792497634887695, -0.0051844120025634766, -0.004689574241638184, -0.004194736480712891, -0.0036998987197875977, -0.0032050609588623047, -0.0027102231979370117, -0.0022153854370117188, -0.0017205476760864258, -0.0012257099151611328, -0.0007308721542358398, -0.00023603439331054688, 0.0002588033676147461, 0.0007536411285400391, 0.001248478889465332, 0.001743316650390625, 0.002238154411315918, 0.002732992172241211, 0.003227829933166504, 0.003722667694091797, 0.00421750545501709, 0.004712343215942383, 0.005207180976867676, 0.005702018737792969, 0.006196856498718262, 0.006691694259643555, 0.007186532020568848, 0.007681369781494141, 0.008176207542419434, 0.008671045303344727, 0.00916588306427002, 0.009660720825195312, 0.010155558586120605, 0.010650396347045898, 0.011145234107971191, 0.011640071868896484, 0.012134909629821777, 0.01262974739074707, 0.013124585151672363, 0.013619422912597656, 0.01411426067352295, 0.014609098434448242, 0.015103936195373535, 0.015598773956298828, 0.01609361171722412, 0.016588449478149414, 0.017083287239074707, 0.017578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 7.0, 0.0, 7.0, 16.0, 17.0, 24.0, 34.0, 58.0, 110.0, 165.0, 198.0, 135.0, 76.0, 58.0, 25.0, 19.0, 15.0, 18.0, 11.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006343841552734375, -0.00618705153465271, -0.006030261516571045, -0.00587347149848938, -0.005716681480407715, -0.00555989146232605, -0.005403101444244385, -0.00524631142616272, -0.005089521408081055, -0.00493273138999939, -0.004775941371917725, -0.00461915135383606, -0.0044623613357543945, -0.0043055713176727295, -0.0041487812995910645, -0.003991991281509399, -0.0038352012634277344, -0.0036784112453460693, -0.0035216212272644043, -0.0033648312091827393, -0.0032080411911010742, -0.003051251173019409, -0.002894461154937744, -0.002737671136856079, -0.002580881118774414, -0.002424091100692749, -0.002267301082611084, -0.002110511064529419, -0.001953721046447754, -0.0017969310283660889, -0.0016401410102844238, -0.0014833509922027588, -0.0013265609741210938, -0.0011697709560394287, -0.0010129809379577637, -0.0008561909198760986, -0.0006994009017944336, -0.0005426108837127686, -0.0003858208656311035, -0.00022903084754943848, -7.224082946777344e-05, 8.45491886138916e-05, 0.00024133920669555664, 0.0003981292247772217, 0.0005549192428588867, 0.0007117092609405518, 0.0008684992790222168, 0.0010252892971038818, 0.0011820793151855469, 0.001338869333267212, 0.001495659351348877, 0.001652449369430542, 0.001809239387512207, 0.001966029405593872, 0.002122819423675537, 0.002279609441757202, 0.002436399459838867, 0.0025931894779205322, 0.0027499794960021973, 0.0029067695140838623, 0.0030635595321655273, 0.0032203495502471924, 0.0033771395683288574, 0.0035339295864105225, 0.0036907196044921875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 8.0, 9.0, 29.0, 80.0, 189.0, 284.0, 213.0, 117.0, 43.0, 17.0, 11.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.468843936920166, -1.4224694967269897, -1.3760950565338135, -1.3297206163406372, -1.283346176147461, -1.2369717359542847, -1.1905972957611084, -1.1442228555679321, -1.0978484153747559, -1.0514739751815796, -1.0050995349884033, -0.958725094795227, -0.9123506546020508, -0.8659762144088745, -0.8196017742156982, -0.773227334022522, -0.7268528938293457, -0.6804784536361694, -0.6341040134429932, -0.5877295732498169, -0.5413551330566406, -0.49498069286346436, -0.4486062526702881, -0.4022318124771118, -0.35585737228393555, -0.3094829320907593, -0.263108491897583, -0.21673405170440674, -0.17035961151123047, -0.1239851713180542, -0.07761073112487793, -0.03123629093170166, 0.01513826847076416, 0.06151270866394043, 0.1078871488571167, 0.15426158905029297, 0.20063602924346924, 0.2470104694366455, 0.2933849096298218, 0.33975934982299805, 0.3861337900161743, 0.4325082302093506, 0.47888267040252686, 0.5252571105957031, 0.5716315507888794, 0.6180059909820557, 0.6643804311752319, 0.7107548713684082, 0.7571293115615845, 0.8035037517547607, 0.849878191947937, 0.8962526321411133, 0.9426270723342896, 0.9890015125274658, 1.035375952720642, 1.0817503929138184, 1.1281248331069946, 1.174499273300171, 1.2208737134933472, 1.2672481536865234, 1.3136225938796997, 1.359997034072876, 1.4063714742660522, 1.4527459144592285, 1.4991203546524048]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 13.0, 26.0, 46.0, 84.0, 112.0, 154.0, 183.0, 135.0, 110.0, 61.0, 39.0, 24.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2135868072509766, -1.1691458225250244, -1.1247048377990723, -1.0802638530731201, -1.0358227491378784, -0.9913817644119263, -0.9469407796859741, -0.902499794960022, -0.858058750629425, -0.8136177659034729, -0.769176721572876, -0.7247357368469238, -0.6802947521209717, -0.6358537077903748, -0.5914127230644226, -0.5469716787338257, -0.5025306940078735, -0.458089679479599, -0.41364866495132446, -0.3692076802253723, -0.3247666656970978, -0.28032565116882324, -0.2358846664428711, -0.19144365191459656, -0.14700263738632202, -0.10256163030862808, -0.05812062323093414, -0.0136796236038208, 0.030761390924453735, 0.07520240545272827, 0.11964339017868042, 0.16408440470695496, 0.2085254192352295, 0.25296643376350403, 0.29740744829177856, 0.3418484330177307, 0.38628944754600525, 0.4307304620742798, 0.47517144680023193, 0.5196124315261841, 0.564053475856781, 0.6084944605827332, 0.6529355049133301, 0.6973764896392822, 0.7418174743652344, 0.7862585186958313, 0.8306995034217834, 0.8751405477523804, 0.9195815324783325, 0.9640225172042847, 1.0084635019302368, 1.0529046058654785, 1.0973455905914307, 1.1417865753173828, 1.186227560043335, 1.230668544769287, 1.2751095294952393, 1.3195505142211914, 1.3639914989471436, 1.4084324836730957, 1.4528735876083374, 1.4973145723342896, 1.5417555570602417, 1.5861965417861938, 1.6306376457214355]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 8.0, 7.0, 12.0, 20.0, 28.0, 33.0, 61.0, 101.0, 169.0, 253.0, 477.0, 821.0, 1597.0, 3580.0, 9471.0, 37775.0, 432652.0, 502737.0, 41213.0, 10086.0, 3737.0, 1710.0, 822.0, 458.0, 283.0, 145.0, 91.0, 67.0, 38.0, 26.0, 23.0, 13.0, 10.0, 7.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.52880859375, -0.514129638671875, -0.49945068359375, -0.484771728515625, -0.4700927734375, -0.455413818359375, -0.44073486328125, -0.426055908203125, -0.411376953125, -0.396697998046875, -0.38201904296875, -0.367340087890625, -0.3526611328125, -0.337982177734375, -0.32330322265625, -0.308624267578125, -0.2939453125, -0.279266357421875, -0.26458740234375, -0.249908447265625, -0.2352294921875, -0.220550537109375, -0.20587158203125, -0.191192626953125, -0.176513671875, -0.161834716796875, -0.14715576171875, -0.132476806640625, -0.1177978515625, -0.103118896484375, -0.08843994140625, -0.073760986328125, -0.05908203125, -0.044403076171875, -0.02972412109375, -0.015045166015625, -0.0003662109375, 0.014312744140625, 0.02899169921875, 0.043670654296875, 0.058349609375, 0.073028564453125, 0.08770751953125, 0.102386474609375, 0.1170654296875, 0.131744384765625, 0.14642333984375, 0.161102294921875, 0.17578125, 0.190460205078125, 0.20513916015625, 0.219818115234375, 0.2344970703125, 0.249176025390625, 0.26385498046875, 0.278533935546875, 0.293212890625, 0.307891845703125, 0.32257080078125, 0.337249755859375, 0.3519287109375, 0.366607666015625, 0.38128662109375, 0.395965576171875, 0.41064453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 9.0, 20.0, 31.0, 41.0, 54.0, 83.0, 92.0, 127.0, 112.0, 117.0, 81.0, 90.0, 51.0, 27.0, 25.0, 16.0, 10.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.2943115234375, -2.227294921875, -2.1602783203125, -2.09326171875, -2.0262451171875, -1.959228515625, -1.8922119140625, -1.8251953125, -1.7581787109375, -1.691162109375, -1.6241455078125, -1.55712890625, -1.4901123046875, -1.423095703125, -1.3560791015625, -1.2890625, -1.2220458984375, -1.155029296875, -1.0880126953125, -1.02099609375, -0.9539794921875, -0.886962890625, -0.8199462890625, -0.7529296875, -0.6859130859375, -0.618896484375, -0.5518798828125, -0.48486328125, -0.4178466796875, -0.350830078125, -0.2838134765625, -0.216796875, -0.1497802734375, -0.082763671875, -0.0157470703125, 0.05126953125, 0.1182861328125, 0.185302734375, 0.2523193359375, 0.3193359375, 0.3863525390625, 0.453369140625, 0.5203857421875, 0.58740234375, 0.6544189453125, 0.721435546875, 0.7884521484375, 0.85546875, 0.9224853515625, 0.989501953125, 1.0565185546875, 1.12353515625, 1.1905517578125, 1.257568359375, 1.3245849609375, 1.3916015625, 1.4586181640625, 1.525634765625, 1.5926513671875, 1.65966796875, 1.7266845703125, 1.793701171875, 1.8607177734375, 1.927734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 6.0, 9.0, 13.0, 22.0, 36.0, 55.0, 91.0, 169.0, 378.0, 1362.0, 20771.0, 1008314.0, 15314.0, 1252.0, 351.0, 160.0, 97.0, 46.0, 34.0, 28.0, 12.0, 7.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.7119140625, -1.6591796875, -1.6064453125, -1.5537109375, -1.5009765625, -1.4482421875, -1.3955078125, -1.3427734375, -1.2900390625, -1.2373046875, -1.1845703125, -1.1318359375, -1.0791015625, -1.0263671875, -0.9736328125, -0.9208984375, -0.8681640625, -0.8154296875, -0.7626953125, -0.7099609375, -0.6572265625, -0.6044921875, -0.5517578125, -0.4990234375, -0.4462890625, -0.3935546875, -0.3408203125, -0.2880859375, -0.2353515625, -0.1826171875, -0.1298828125, -0.0771484375, -0.0244140625, 0.0283203125, 0.0810546875, 0.1337890625, 0.1865234375, 0.2392578125, 0.2919921875, 0.3447265625, 0.3974609375, 0.4501953125, 0.5029296875, 0.5556640625, 0.6083984375, 0.6611328125, 0.7138671875, 0.7666015625, 0.8193359375, 0.8720703125, 0.9248046875, 0.9775390625, 1.0302734375, 1.0830078125, 1.1357421875, 1.1884765625, 1.2412109375, 1.2939453125, 1.3466796875, 1.3994140625, 1.4521484375, 1.5048828125, 1.5576171875, 1.6103515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 4.0, 16.0, 28.0, 55.0, 69.0, 103.0, 114.0, 141.0, 123.0, 114.0, 91.0, 47.0, 36.0, 28.0, 8.0, 6.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.1239013671875, -3.997802734375, -3.8717041015625, -3.74560546875, -3.6195068359375, -3.493408203125, -3.3673095703125, -3.2412109375, -3.1151123046875, -2.989013671875, -2.8629150390625, -2.73681640625, -2.6107177734375, -2.484619140625, -2.3585205078125, -2.232421875, -2.1063232421875, -1.980224609375, -1.8541259765625, -1.72802734375, -1.6019287109375, -1.475830078125, -1.3497314453125, -1.2236328125, -1.0975341796875, -0.971435546875, -0.8453369140625, -0.71923828125, -0.5931396484375, -0.467041015625, -0.3409423828125, -0.21484375, -0.0887451171875, 0.037353515625, 0.1634521484375, 0.28955078125, 0.4156494140625, 0.541748046875, 0.6678466796875, 0.7939453125, 0.9200439453125, 1.046142578125, 1.1722412109375, 1.29833984375, 1.4244384765625, 1.550537109375, 1.6766357421875, 1.802734375, 1.9288330078125, 2.054931640625, 2.1810302734375, 2.30712890625, 2.4332275390625, 2.559326171875, 2.6854248046875, 2.8115234375, 2.9376220703125, 3.063720703125, 3.1898193359375, 3.31591796875, 3.4420166015625, 3.568115234375, 3.6942138671875, 3.8203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 8.0, 7.0, 12.0, 13.0, 14.0, 18.0, 46.0, 65.0, 100.0, 174.0, 350.0, 860.0, 3211.0, 24794.0, 791436.0, 211636.0, 12554.0, 1937.0, 698.0, 275.0, 142.0, 82.0, 54.0, 26.0, 16.0, 11.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.355712890625, -0.3463153839111328, -0.3369178771972656, -0.32752037048339844, -0.31812286376953125, -0.30872535705566406, -0.2993278503417969, -0.2899303436279297, -0.2805328369140625, -0.2711353302001953, -0.2617378234863281, -0.25234031677246094, -0.24294281005859375, -0.23354530334472656, -0.22414779663085938, -0.2147502899169922, -0.205352783203125, -0.1959552764892578, -0.18655776977539062, -0.17716026306152344, -0.16776275634765625, -0.15836524963378906, -0.14896774291992188, -0.1395702362060547, -0.1301727294921875, -0.12077522277832031, -0.11137771606445312, -0.10198020935058594, -0.09258270263671875, -0.08318519592285156, -0.07378768920898438, -0.06439018249511719, -0.05499267578125, -0.04559516906738281, -0.036197662353515625, -0.026800155639648438, -0.01740264892578125, -0.008005142211914062, 0.001392364501953125, 0.010789871215820312, 0.0201873779296875, 0.029584884643554688, 0.038982391357421875, 0.04837989807128906, 0.05777740478515625, 0.06717491149902344, 0.07657241821289062, 0.08596992492675781, 0.095367431640625, 0.10476493835449219, 0.11416244506835938, 0.12355995178222656, 0.13295745849609375, 0.14235496520996094, 0.15175247192382812, 0.1611499786376953, 0.1705474853515625, 0.1799449920654297, 0.18934249877929688, 0.19874000549316406, 0.20813751220703125, 0.21753501892089844, 0.22693252563476562, 0.2363300323486328, 0.2457275390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 6.0, 6.0, 5.0, 12.0, 15.0, 16.0, 25.0, 36.0, 43.0, 105.0, 231.0, 240.0, 103.0, 42.0, 33.0, 17.0, 23.0, 11.0, 10.0, 14.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.913309097290039e-05, -1.8172897398471832e-05, -1.7212703824043274e-05, -1.6252510249614716e-05, -1.5292316675186157e-05, -1.4332123100757599e-05, -1.337192952632904e-05, -1.2411735951900482e-05, -1.1451542377471924e-05, -1.0491348803043365e-05, -9.531155228614807e-06, -8.570961654186249e-06, -7.6107680797576904e-06, -6.650574505329132e-06, -5.690380930900574e-06, -4.730187356472015e-06, -3.769993782043457e-06, -2.8098002076148987e-06, -1.8496066331863403e-06, -8.89413058757782e-07, 7.078051567077637e-08, 1.0309740900993347e-06, 1.991167664527893e-06, 2.9513612389564514e-06, 3.91155481338501e-06, 4.871748387813568e-06, 5.8319419622421265e-06, 6.792135536670685e-06, 7.752329111099243e-06, 8.712522685527802e-06, 9.67271625995636e-06, 1.0632909834384918e-05, 1.1593103408813477e-05, 1.2553296983242035e-05, 1.3513490557670593e-05, 1.4473684132099152e-05, 1.543387770652771e-05, 1.639407128095627e-05, 1.7354264855384827e-05, 1.8314458429813385e-05, 1.9274652004241943e-05, 2.0234845578670502e-05, 2.119503915309906e-05, 2.215523272752762e-05, 2.3115426301956177e-05, 2.4075619876384735e-05, 2.5035813450813293e-05, 2.5996007025241852e-05, 2.695620059967041e-05, 2.791639417409897e-05, 2.8876587748527527e-05, 2.9836781322956085e-05, 3.0796974897384644e-05, 3.17571684718132e-05, 3.271736204624176e-05, 3.367755562067032e-05, 3.463774919509888e-05, 3.5597942769527435e-05, 3.6558136343955994e-05, 3.751832991838455e-05, 3.847852349281311e-05, 3.943871706724167e-05, 4.039891064167023e-05, 4.1359104216098785e-05, 4.2319297790527344e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 6.0, 11.0, 33.0, 34.0, 63.0, 142.0, 241.0, 649.0, 2018.0, 10456.0, 132999.0, 861884.0, 33723.0, 4388.0, 1085.0, 419.0, 201.0, 78.0, 36.0, 26.0, 15.0, 8.0, 8.0, 5.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.277099609375, -0.26654815673828125, -0.2559967041015625, -0.24544525146484375, -0.234893798828125, -0.22434234619140625, -0.2137908935546875, -0.20323944091796875, -0.19268798828125, -0.18213653564453125, -0.1715850830078125, -0.16103363037109375, -0.150482177734375, -0.13993072509765625, -0.1293792724609375, -0.11882781982421875, -0.1082763671875, -0.09772491455078125, -0.0871734619140625, -0.07662200927734375, -0.066070556640625, -0.05551910400390625, -0.0449676513671875, -0.03441619873046875, -0.02386474609375, -0.01331329345703125, -0.0027618408203125, 0.00778961181640625, 0.018341064453125, 0.02889251708984375, 0.0394439697265625, 0.04999542236328125, 0.060546875, 0.07109832763671875, 0.0816497802734375, 0.09220123291015625, 0.102752685546875, 0.11330413818359375, 0.1238555908203125, 0.13440704345703125, 0.14495849609375, 0.15550994873046875, 0.1660614013671875, 0.17661285400390625, 0.187164306640625, 0.19771575927734375, 0.2082672119140625, 0.21881866455078125, 0.2293701171875, 0.23992156982421875, 0.2504730224609375, 0.26102447509765625, 0.271575927734375, 0.28212738037109375, 0.2926788330078125, 0.30323028564453125, 0.31378173828125, 0.32433319091796875, 0.3348846435546875, 0.34543609619140625, 0.355987548828125, 0.36653900146484375, 0.3770904541015625, 0.38764190673828125, 0.398193359375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 15.0, 20.0, 30.0, 39.0, 65.0, 174.0, 362.0, 105.0, 69.0, 42.0, 25.0, 21.0, 11.0, 7.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.188232421875, -0.1830463409423828, -0.17786026000976562, -0.17267417907714844, -0.16748809814453125, -0.16230201721191406, -0.15711593627929688, -0.1519298553466797, -0.1467437744140625, -0.1415576934814453, -0.13637161254882812, -0.13118553161621094, -0.12599945068359375, -0.12081336975097656, -0.11562728881835938, -0.11044120788574219, -0.105255126953125, -0.10006904602050781, -0.09488296508789062, -0.08969688415527344, -0.08451080322265625, -0.07932472229003906, -0.07413864135742188, -0.06895256042480469, -0.0637664794921875, -0.05858039855957031, -0.053394317626953125, -0.04820823669433594, -0.04302215576171875, -0.03783607482910156, -0.032649993896484375, -0.027463912963867188, -0.02227783203125, -0.017091751098632812, -0.011905670166015625, -0.0067195892333984375, -0.00153350830078125, 0.0036525726318359375, 0.008838653564453125, 0.014024734497070312, 0.0192108154296875, 0.024396896362304688, 0.029582977294921875, 0.03476905822753906, 0.03995513916015625, 0.04514122009277344, 0.050327301025390625, 0.05551338195800781, 0.060699462890625, 0.06588554382324219, 0.07107162475585938, 0.07625770568847656, 0.08144378662109375, 0.08662986755371094, 0.09181594848632812, 0.09700202941894531, 0.1021881103515625, 0.10737419128417969, 0.11256027221679688, 0.11774635314941406, 0.12293243408203125, 0.12811851501464844, 0.13330459594726562, 0.1384906768798828, 0.1436767578125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 10.0, 14.0, 42.0, 126.0, 268.0, 289.0, 166.0, 54.0, 24.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.624056577682495, -2.519740581512451, -2.4154248237609863, -2.3111088275909424, -2.2067928314208984, -2.1024770736694336, -1.9981610774993896, -1.8938452005386353, -1.7895293235778809, -1.6852134466171265, -1.580897569656372, -1.4765815734863281, -1.3722656965255737, -1.2679498195648193, -1.1636338233947754, -1.059317946434021, -0.9550020694732666, -0.8506861925125122, -0.746370255947113, -0.6420543193817139, -0.5377384424209595, -0.4334225654602051, -0.3291066288948059, -0.22479069232940674, -0.12047481536865234, -0.01615890860557556, 0.08815699815750122, 0.192472904920578, 0.2967888116836548, 0.4011046886444092, 0.5054206252098083, 0.6097365617752075, 0.7140522003173828, 0.8183680772781372, 0.9226840138435364, 1.0269999504089355, 1.13131582736969, 1.2356317043304443, 1.3399477005004883, 1.4442635774612427, 1.548579454421997, 1.6528953313827515, 1.7572112083435059, 1.8615272045135498, 1.9658430814743042, 2.0701589584350586, 2.1744749546051025, 2.2787909507751465, 2.3831067085266113, 2.4874227046966553, 2.59173846244812, 2.696054458618164, 2.800370216369629, 2.904686212539673, 3.009002208709717, 3.1133179664611816, 3.2176339626312256, 3.3219499588012695, 3.4262657165527344, 3.5305817127227783, 3.6348977088928223, 3.739213466644287, 3.843529462814331, 3.947845458984375, 4.05216121673584]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 13.0, 12.0, 22.0, 27.0, 60.0, 89.0, 94.0, 113.0, 109.0, 96.0, 98.0, 92.0, 58.0, 50.0, 19.0, 19.0, 13.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.932028293609619, -5.681494235992432, -5.430960178375244, -5.180425643920898, -4.929891586303711, -4.679357528686523, -4.428823471069336, -4.178289413452148, -3.927755117416382, -3.6772210597991943, -3.4266867637634277, -3.1761527061462402, -2.9256186485290527, -2.675084352493286, -2.4245502948760986, -2.174015998840332, -1.9234819412231445, -1.6729477643966675, -1.4224135875701904, -1.171879529953003, -0.9213453531265259, -0.6708111763000488, -0.42027711868286133, -0.16974294185638428, 0.08079123497009277, 0.33132538199424744, 0.5818595290184021, 0.8323936462402344, 1.0829278230667114, 1.3334619998931885, 1.583996057510376, 1.834530234336853, 2.085063934326172, 2.3355979919433594, 2.586132287979126, 2.8366663455963135, 3.08720064163208, 3.3377346992492676, 3.588268756866455, 3.8388028144836426, 4.089337348937988, 4.339871406555176, 4.590405464172363, 4.840939521789551, 5.0914740562438965, 5.342008113861084, 5.5925421714782715, 5.843076229095459, 6.0936102867126465, 6.344144344329834, 6.5946784019470215, 6.845212936401367, 7.095746994018555, 7.346281051635742, 7.59681510925293, 7.847349166870117, 8.097883224487305, 8.348417282104492, 8.59895133972168, 8.849485397338867, 9.100019454956055, 9.350553512573242, 9.60108757019043, 9.851622581481934, 10.102156639099121]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 13.0, 8.0, 22.0, 32.0, 47.0, 112.0, 264.0, 981.0, 4227.0, 47872.0, 4085683.0, 50127.0, 3623.0, 723.0, 248.0, 108.0, 67.0, 51.0, 29.0, 12.0, 9.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3984375, -2.300567626953125, -2.20269775390625, -2.104827880859375, -2.0069580078125, -1.909088134765625, -1.81121826171875, -1.713348388671875, -1.615478515625, -1.517608642578125, -1.41973876953125, -1.321868896484375, -1.2239990234375, -1.126129150390625, -1.02825927734375, -0.930389404296875, -0.83251953125, -0.734649658203125, -0.63677978515625, -0.538909912109375, -0.4410400390625, -0.343170166015625, -0.24530029296875, -0.147430419921875, -0.049560546875, 0.048309326171875, 0.14617919921875, 0.244049072265625, 0.3419189453125, 0.439788818359375, 0.53765869140625, 0.635528564453125, 0.7333984375, 0.831268310546875, 0.92913818359375, 1.027008056640625, 1.1248779296875, 1.222747802734375, 1.32061767578125, 1.418487548828125, 1.516357421875, 1.614227294921875, 1.71209716796875, 1.809967041015625, 1.9078369140625, 2.005706787109375, 2.10357666015625, 2.201446533203125, 2.29931640625, 2.397186279296875, 2.49505615234375, 2.592926025390625, 2.6907958984375, 2.788665771484375, 2.88653564453125, 2.984405517578125, 3.082275390625, 3.180145263671875, 3.27801513671875, 3.375885009765625, 3.4737548828125, 3.571624755859375, 3.66949462890625, 3.767364501953125, 3.865234375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 6.0, 24.0, 33.0, 79.0, 155.0, 206.0, 197.0, 139.0, 94.0, 41.0, 18.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5576171875, -1.4976348876953125, -1.437652587890625, -1.3776702880859375, -1.31768798828125, -1.2577056884765625, -1.197723388671875, -1.1377410888671875, -1.0777587890625, -1.0177764892578125, -0.957794189453125, -0.8978118896484375, -0.83782958984375, -0.7778472900390625, -0.717864990234375, -0.6578826904296875, -0.597900390625, -0.5379180908203125, -0.477935791015625, -0.4179534912109375, -0.35797119140625, -0.2979888916015625, -0.238006591796875, -0.1780242919921875, -0.1180419921875, -0.0580596923828125, 0.001922607421875, 0.0619049072265625, 0.12188720703125, 0.1818695068359375, 0.241851806640625, 0.3018341064453125, 0.36181640625, 0.4217987060546875, 0.481781005859375, 0.5417633056640625, 0.60174560546875, 0.6617279052734375, 0.721710205078125, 0.7816925048828125, 0.8416748046875, 0.9016571044921875, 0.961639404296875, 1.0216217041015625, 1.08160400390625, 1.1415863037109375, 1.201568603515625, 1.2615509033203125, 1.321533203125, 1.3815155029296875, 1.441497802734375, 1.5014801025390625, 1.56146240234375, 1.6214447021484375, 1.681427001953125, 1.7414093017578125, 1.8013916015625, 1.8613739013671875, 1.921356201171875, 1.9813385009765625, 2.04132080078125, 2.1013031005859375, 2.161285400390625, 2.2212677001953125, 2.28125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 3.0, 2.0, 7.0, 14.0, 13.0, 44.0, 79.0, 272.0, 763.0, 4124.0, 203521.0, 3974794.0, 9027.0, 1142.0, 276.0, 84.0, 42.0, 31.0, 10.0, 7.0, 9.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.9141845703125, -3.808837890625, -3.7034912109375, -3.59814453125, -3.4927978515625, -3.387451171875, -3.2821044921875, -3.1767578125, -3.0714111328125, -2.966064453125, -2.8607177734375, -2.75537109375, -2.6500244140625, -2.544677734375, -2.4393310546875, -2.333984375, -2.2286376953125, -2.123291015625, -2.0179443359375, -1.91259765625, -1.8072509765625, -1.701904296875, -1.5965576171875, -1.4912109375, -1.3858642578125, -1.280517578125, -1.1751708984375, -1.06982421875, -0.9644775390625, -0.859130859375, -0.7537841796875, -0.6484375, -0.5430908203125, -0.437744140625, -0.3323974609375, -0.22705078125, -0.1217041015625, -0.016357421875, 0.0889892578125, 0.1943359375, 0.2996826171875, 0.405029296875, 0.5103759765625, 0.61572265625, 0.7210693359375, 0.826416015625, 0.9317626953125, 1.037109375, 1.1424560546875, 1.247802734375, 1.3531494140625, 1.45849609375, 1.5638427734375, 1.669189453125, 1.7745361328125, 1.8798828125, 1.9852294921875, 2.090576171875, 2.1959228515625, 2.30126953125, 2.4066162109375, 2.511962890625, 2.6173095703125, 2.72265625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 12.0, 9.0, 31.0, 58.0, 139.0, 501.0, 2155.0, 837.0, 171.0, 60.0, 38.0, 22.0, 11.0, 11.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5888671875, -0.5675582885742188, -0.5462493896484375, -0.5249404907226562, -0.503631591796875, -0.48232269287109375, -0.4610137939453125, -0.43970489501953125, -0.41839599609375, -0.39708709716796875, -0.3757781982421875, -0.35446929931640625, -0.333160400390625, -0.31185150146484375, -0.2905426025390625, -0.26923370361328125, -0.2479248046875, -0.22661590576171875, -0.2053070068359375, -0.18399810791015625, -0.162689208984375, -0.14138031005859375, -0.1200714111328125, -0.09876251220703125, -0.07745361328125, -0.05614471435546875, -0.0348358154296875, -0.01352691650390625, 0.007781982421875, 0.02909088134765625, 0.0503997802734375, 0.07170867919921875, 0.093017578125, 0.11432647705078125, 0.1356353759765625, 0.15694427490234375, 0.178253173828125, 0.19956207275390625, 0.2208709716796875, 0.24217987060546875, 0.26348876953125, 0.28479766845703125, 0.3061065673828125, 0.32741546630859375, 0.348724365234375, 0.37003326416015625, 0.3913421630859375, 0.41265106201171875, 0.4339599609375, 0.45526885986328125, 0.4765777587890625, 0.49788665771484375, 0.519195556640625, 0.5405044555664062, 0.5618133544921875, 0.5831222534179688, 0.60443115234375, 0.6257400512695312, 0.6470489501953125, 0.6683578491210938, 0.689666748046875, 0.7109756469726562, 0.7322845458984375, 0.7535934448242188, 0.77490234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 9.0, 11.0, 30.0, 73.0, 114.0, 185.0, 223.0, 175.0, 98.0, 52.0, 22.0, 7.0, 7.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3814737796783447, -2.3180668354034424, -2.25465989112854, -2.1912529468536377, -2.1278460025787354, -2.064439058303833, -2.0010321140289307, -1.9376250505447388, -1.8742181062698364, -1.810811161994934, -1.7474042177200317, -1.6839972734451294, -1.6205902099609375, -1.5571832656860352, -1.4937763214111328, -1.4303693771362305, -1.3669624328613281, -1.3035554885864258, -1.2401485443115234, -1.176741600036621, -1.1133346557617188, -1.0499277114868164, -0.9865206480026245, -0.9231137037277222, -0.8597067594528198, -0.7962998151779175, -0.7328928709030151, -0.669485867023468, -0.6060789227485657, -0.5426719784736633, -0.4792650043964386, -0.41585803031921387, -0.3524508476257324, -0.2890439033508301, -0.22563692927360535, -0.1622299700975418, -0.09882301092147827, -0.03541606664657593, 0.027990907430648804, 0.09139788150787354, 0.15480482578277588, 0.21821178495883942, 0.28161874413490295, 0.3450257182121277, 0.40843266248703003, 0.4718396067619324, 0.5352466106414795, 0.5986535549163818, 0.6620604991912842, 0.7254674434661865, 0.7888743877410889, 0.852281391620636, 0.9156883358955383, 0.9790952801704407, 1.0425022840499878, 1.1059092283248901, 1.1693161725997925, 1.2327231168746948, 1.2961300611495972, 1.3595370054244995, 1.4229440689086914, 1.4863510131835938, 1.549757957458496, 1.6131649017333984, 1.6765718460083008]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 11.0, 13.0, 17.0, 45.0, 60.0, 89.0, 118.0, 139.0, 127.0, 125.0, 89.0, 62.0, 47.0, 34.0, 17.0, 9.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5944753885269165, -1.5397987365722656, -1.4851220846176147, -1.4304454326629639, -1.3757686614990234, -1.3210920095443726, -1.2664153575897217, -1.2117387056350708, -1.15706205368042, -1.102385401725769, -1.0477087497711182, -0.9930320382118225, -0.9383553266525269, -0.883678674697876, -0.8290020227432251, -0.7743253707885742, -0.7196485996246338, -0.6649719476699829, -0.6102952361106873, -0.5556185841560364, -0.5009418725967407, -0.44626522064208984, -0.39158856868743896, -0.3369118869304657, -0.28223520517349243, -0.22755852341651917, -0.1728818565607071, -0.11820518970489502, -0.06352850794792175, -0.008851826190948486, 0.04582482576370239, 0.10050150752067566, 0.15517807006835938, 0.20985475182533264, 0.2645314335823059, 0.3192080855369568, 0.37388476729393005, 0.4285614490509033, 0.4832381010055542, 0.5379147529602051, 0.5925914645195007, 0.6472681164741516, 0.7019448280334473, 0.7566214799880981, 0.811298131942749, 0.8659748435020447, 0.9206514954566956, 0.9753282070159912, 1.030004858970642, 1.084681510925293, 1.1393581628799438, 1.1940348148345947, 1.2487115859985352, 1.303388237953186, 1.358064889907837, 1.4127415418624878, 1.4674181938171387, 1.5220948457717896, 1.5767714977264404, 1.6314482688903809, 1.6861249208450317, 1.7408015727996826, 1.7954782247543335, 1.8501548767089844, 1.9048316478729248]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 8.0, 9.0, 13.0, 27.0, 27.0, 41.0, 59.0, 123.0, 279.0, 742.0, 3244.0, 32160.0, 819139.0, 181643.0, 8752.0, 1407.0, 459.0, 160.0, 107.0, 56.0, 33.0, 21.0, 13.0, 7.0, 5.0, 11.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2729301452636719, -0.26143646240234375, -0.24994277954101562, -0.2384490966796875, -0.22695541381835938, -0.21546173095703125, -0.20396804809570312, -0.192474365234375, -0.18098068237304688, -0.16948699951171875, -0.15799331665039062, -0.1464996337890625, -0.13500595092773438, -0.12351226806640625, -0.11201858520507812, -0.10052490234375, -0.08903121948242188, -0.07753753662109375, -0.06604385375976562, -0.0545501708984375, -0.043056488037109375, -0.03156280517578125, -0.020069122314453125, -0.008575439453125, 0.002918243408203125, 0.01441192626953125, 0.025905609130859375, 0.0373992919921875, 0.048892974853515625, 0.06038665771484375, 0.07188034057617188, 0.0833740234375, 0.09486770629882812, 0.10636138916015625, 0.11785507202148438, 0.1293487548828125, 0.14084243774414062, 0.15233612060546875, 0.16382980346679688, 0.175323486328125, 0.18681716918945312, 0.19831085205078125, 0.20980453491210938, 0.2212982177734375, 0.23279190063476562, 0.24428558349609375, 0.2557792663574219, 0.26727294921875, 0.2787666320800781, 0.29026031494140625, 0.3017539978027344, 0.3132476806640625, 0.3247413635253906, 0.33623504638671875, 0.3477287292480469, 0.359222412109375, 0.3707160949707031, 0.38220977783203125, 0.3937034606933594, 0.4051971435546875, 0.4166908264160156, 0.42818450927734375, 0.4396781921386719, 0.451171875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 8.0, 16.0, 35.0, 59.0, 99.0, 148.0, 160.0, 158.0, 117.0, 93.0, 57.0, 24.0, 19.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.025390625, -0.984130859375, -0.94287109375, -0.901611328125, -0.8603515625, -0.819091796875, -0.77783203125, -0.736572265625, -0.6953125, -0.654052734375, -0.61279296875, -0.571533203125, -0.5302734375, -0.489013671875, -0.44775390625, -0.406494140625, -0.365234375, -0.323974609375, -0.28271484375, -0.241455078125, -0.2001953125, -0.158935546875, -0.11767578125, -0.076416015625, -0.03515625, 0.006103515625, 0.04736328125, 0.088623046875, 0.1298828125, 0.171142578125, 0.21240234375, 0.253662109375, 0.294921875, 0.336181640625, 0.37744140625, 0.418701171875, 0.4599609375, 0.501220703125, 0.54248046875, 0.583740234375, 0.625, 0.666259765625, 0.70751953125, 0.748779296875, 0.7900390625, 0.831298828125, 0.87255859375, 0.913818359375, 0.955078125, 0.996337890625, 1.03759765625, 1.078857421875, 1.1201171875, 1.161376953125, 1.20263671875, 1.243896484375, 1.28515625, 1.326416015625, 1.36767578125, 1.408935546875, 1.4501953125, 1.491455078125, 1.53271484375, 1.573974609375, 1.615234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 10.0, 21.0, 26.0, 24.0, 52.0, 87.0, 130.0, 216.0, 388.0, 786.0, 1578.0, 3916.0, 10554.0, 37184.0, 183860.0, 555316.0, 196432.0, 39745.0, 10988.0, 3831.0, 1644.0, 792.0, 399.0, 197.0, 138.0, 64.0, 68.0, 28.0, 21.0, 18.0, 11.0, 10.0, 1.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12457275390625, -0.12085628509521484, -0.11713981628417969, -0.11342334747314453, -0.10970687866210938, -0.10599040985107422, -0.10227394104003906, -0.0985574722290039, -0.09484100341796875, -0.0911245346069336, -0.08740806579589844, -0.08369159698486328, -0.07997512817382812, -0.07625865936279297, -0.07254219055175781, -0.06882572174072266, -0.0651092529296875, -0.061392784118652344, -0.05767631530761719, -0.05395984649658203, -0.050243377685546875, -0.04652690887451172, -0.04281044006347656, -0.039093971252441406, -0.03537750244140625, -0.031661033630371094, -0.027944564819335938, -0.02422809600830078, -0.020511627197265625, -0.01679515838623047, -0.013078689575195312, -0.009362220764160156, -0.005645751953125, -0.0019292831420898438, 0.0017871856689453125, 0.005503654479980469, 0.009220123291015625, 0.012936592102050781, 0.016653060913085938, 0.020369529724121094, 0.02408599853515625, 0.027802467346191406, 0.03151893615722656, 0.03523540496826172, 0.038951873779296875, 0.04266834259033203, 0.04638481140136719, 0.050101280212402344, 0.0538177490234375, 0.057534217834472656, 0.06125068664550781, 0.06496715545654297, 0.06868362426757812, 0.07240009307861328, 0.07611656188964844, 0.0798330307006836, 0.08354949951171875, 0.0872659683227539, 0.09098243713378906, 0.09469890594482422, 0.09841537475585938, 0.10213184356689453, 0.10584831237792969, 0.10956478118896484, 0.11328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 8.0, 16.0, 18.0, 24.0, 31.0, 54.0, 67.0, 93.0, 92.0, 102.0, 106.0, 97.0, 82.0, 75.0, 41.0, 30.0, 20.0, 16.0, 12.0, 2.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9130859375, -1.854888916015625, -1.79669189453125, -1.738494873046875, -1.6802978515625, -1.622100830078125, -1.56390380859375, -1.505706787109375, -1.447509765625, -1.389312744140625, -1.33111572265625, -1.272918701171875, -1.2147216796875, -1.156524658203125, -1.09832763671875, -1.040130615234375, -0.98193359375, -0.923736572265625, -0.86553955078125, -0.807342529296875, -0.7491455078125, -0.690948486328125, -0.63275146484375, -0.574554443359375, -0.516357421875, -0.458160400390625, -0.39996337890625, -0.341766357421875, -0.2835693359375, -0.225372314453125, -0.16717529296875, -0.108978271484375, -0.05078125, 0.007415771484375, 0.06561279296875, 0.123809814453125, 0.1820068359375, 0.240203857421875, 0.29840087890625, 0.356597900390625, 0.414794921875, 0.472991943359375, 0.53118896484375, 0.589385986328125, 0.6475830078125, 0.705780029296875, 0.76397705078125, 0.822174072265625, 0.88037109375, 0.938568115234375, 0.99676513671875, 1.054962158203125, 1.1131591796875, 1.171356201171875, 1.22955322265625, 1.287750244140625, 1.345947265625, 1.404144287109375, 1.46234130859375, 1.520538330078125, 1.5787353515625, 1.636932373046875, 1.69512939453125, 1.753326416015625, 1.8115234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 6.0, 10.0, 17.0, 17.0, 16.0, 22.0, 31.0, 39.0, 43.0, 79.0, 121.0, 193.0, 352.0, 630.0, 1166.0, 2299.0, 4544.0, 10241.0, 37635.0, 647278.0, 302857.0, 24370.0, 8195.0, 3752.0, 2039.0, 1050.0, 610.0, 361.0, 208.0, 104.0, 85.0, 41.0, 33.0, 21.0, 18.0, 9.0, 11.0, 13.0, 8.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.015899658203125, -0.015384674072265625, -0.01486968994140625, -0.014354705810546875, -0.0138397216796875, -0.013324737548828125, -0.01280975341796875, -0.012294769287109375, -0.01177978515625, -0.011264801025390625, -0.01074981689453125, -0.010234832763671875, -0.0097198486328125, -0.009204864501953125, -0.00868988037109375, -0.008174896240234375, -0.007659912109375, -0.007144927978515625, -0.00662994384765625, -0.006114959716796875, -0.0055999755859375, -0.005084991455078125, -0.00457000732421875, -0.004055023193359375, -0.0035400390625, -0.003025054931640625, -0.00251007080078125, -0.001995086669921875, -0.0014801025390625, -0.000965118408203125, -0.00045013427734375, 6.4849853515625e-05, 0.000579833984375, 0.001094818115234375, 0.00160980224609375, 0.002124786376953125, 0.0026397705078125, 0.003154754638671875, 0.00366973876953125, 0.004184722900390625, 0.00469970703125, 0.005214691162109375, 0.00572967529296875, 0.006244659423828125, 0.0067596435546875, 0.007274627685546875, 0.00778961181640625, 0.008304595947265625, 0.008819580078125, 0.009334564208984375, 0.00984954833984375, 0.010364532470703125, 0.0108795166015625, 0.011394500732421875, 0.01190948486328125, 0.012424468994140625, 0.012939453125, 0.013454437255859375, 0.01396942138671875, 0.014484405517578125, 0.0149993896484375, 0.015514373779296875, 0.01602935791015625, 0.016544342041015625, 0.017059326171875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 9.0, 9.0, 13.0, 13.0, 22.0, 34.0, 42.0, 68.0, 104.0, 118.0, 155.0, 117.0, 89.0, 62.0, 32.0, 37.0, 17.0, 10.0, 8.0, 7.0, 9.0, 3.0, 0.0, 4.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-2.6345252990722656e-05, -2.5724060833454132e-05, -2.5102868676185608e-05, -2.4481676518917084e-05, -2.386048436164856e-05, -2.3239292204380035e-05, -2.261810004711151e-05, -2.1996907889842987e-05, -2.1375715732574463e-05, -2.075452357530594e-05, -2.0133331418037415e-05, -1.951213926076889e-05, -1.8890947103500366e-05, -1.8269754946231842e-05, -1.7648562788963318e-05, -1.7027370631694794e-05, -1.640617847442627e-05, -1.5784986317157745e-05, -1.5163794159889221e-05, -1.4542602002620697e-05, -1.3921409845352173e-05, -1.3300217688083649e-05, -1.2679025530815125e-05, -1.20578333735466e-05, -1.1436641216278076e-05, -1.0815449059009552e-05, -1.0194256901741028e-05, -9.573064744472504e-06, -8.95187258720398e-06, -8.330680429935455e-06, -7.709488272666931e-06, -7.088296115398407e-06, -6.467103958129883e-06, -5.845911800861359e-06, -5.2247196435928345e-06, -4.60352748632431e-06, -3.982335329055786e-06, -3.361143171787262e-06, -2.739951014518738e-06, -2.1187588572502136e-06, -1.4975666999816895e-06, -8.763745427131653e-07, -2.551823854446411e-07, 3.6600977182388306e-07, 9.872019290924072e-07, 1.6083940863609314e-06, 2.2295862436294556e-06, 2.8507784008979797e-06, 3.471970558166504e-06, 4.093162715435028e-06, 4.714354872703552e-06, 5.335547029972076e-06, 5.956739187240601e-06, 6.577931344509125e-06, 7.199123501777649e-06, 7.820315659046173e-06, 8.441507816314697e-06, 9.062699973583221e-06, 9.683892130851746e-06, 1.030508428812027e-05, 1.0926276445388794e-05, 1.1547468602657318e-05, 1.2168660759925842e-05, 1.2789852917194366e-05, 1.341104507446289e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 18.0, 20.0, 19.0, 30.0, 42.0, 59.0, 98.0, 131.0, 209.0, 338.0, 578.0, 948.0, 1787.0, 3368.0, 7251.0, 20892.0, 191722.0, 760106.0, 40360.0, 10545.0, 4473.0, 2281.0, 1236.0, 709.0, 457.0, 254.0, 159.0, 127.0, 78.0, 58.0, 39.0, 37.0, 17.0, 14.0, 12.0, 18.0, 6.0, 7.0, 8.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.017822265625, -0.01719045639038086, -0.01655864715576172, -0.015926837921142578, -0.015295028686523438, -0.014663219451904297, -0.014031410217285156, -0.013399600982666016, -0.012767791748046875, -0.012135982513427734, -0.011504173278808594, -0.010872364044189453, -0.010240554809570312, -0.009608745574951172, -0.008976936340332031, -0.00834512710571289, -0.00771331787109375, -0.007081508636474609, -0.006449699401855469, -0.005817890167236328, -0.0051860809326171875, -0.004554271697998047, -0.003922462463378906, -0.0032906532287597656, -0.002658843994140625, -0.0020270347595214844, -0.0013952255249023438, -0.0007634162902832031, -0.0001316070556640625, 0.0005002021789550781, 0.0011320114135742188, 0.0017638206481933594, 0.0023956298828125, 0.0030274391174316406, 0.0036592483520507812, 0.004291057586669922, 0.0049228668212890625, 0.005554676055908203, 0.006186485290527344, 0.006818294525146484, 0.007450103759765625, 0.008081912994384766, 0.008713722229003906, 0.009345531463623047, 0.009977340698242188, 0.010609149932861328, 0.011240959167480469, 0.01187276840209961, 0.01250457763671875, 0.01313638687133789, 0.013768196105957031, 0.014400005340576172, 0.015031814575195312, 0.015663623809814453, 0.016295433044433594, 0.016927242279052734, 0.017559051513671875, 0.018190860748291016, 0.018822669982910156, 0.019454479217529297, 0.020086288452148438, 0.020718097686767578, 0.02134990692138672, 0.02198171615600586, 0.022613525390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 1.0, 6.0, 7.0, 6.0, 16.0, 14.0, 47.0, 97.0, 258.0, 289.0, 129.0, 36.0, 25.0, 10.0, 10.0, 7.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0097198486328125, -0.009450256824493408, -0.009180665016174316, -0.008911073207855225, -0.008641481399536133, -0.008371889591217041, -0.00810229778289795, -0.007832705974578857, -0.007563114166259766, -0.007293522357940674, -0.007023930549621582, -0.00675433874130249, -0.0064847469329833984, -0.006215155124664307, -0.005945563316345215, -0.005675971508026123, -0.005406379699707031, -0.0051367878913879395, -0.004867196083068848, -0.004597604274749756, -0.004328012466430664, -0.004058420658111572, -0.0037888288497924805, -0.0035192370414733887, -0.003249645233154297, -0.002980053424835205, -0.0027104616165161133, -0.0024408698081970215, -0.0021712779998779297, -0.0019016861915588379, -0.001632094383239746, -0.0013625025749206543, -0.0010929107666015625, -0.0008233189582824707, -0.0005537271499633789, -0.0002841353416442871, -1.4543533325195312e-05, 0.0002550482749938965, 0.0005246400833129883, 0.0007942318916320801, 0.0010638236999511719, 0.0013334155082702637, 0.0016030073165893555, 0.0018725991249084473, 0.002142190933227539, 0.002411782741546631, 0.0026813745498657227, 0.0029509663581848145, 0.0032205581665039062, 0.003490149974822998, 0.00375974178314209, 0.004029333591461182, 0.0042989253997802734, 0.004568517208099365, 0.004838109016418457, 0.005107700824737549, 0.005377292633056641, 0.005646884441375732, 0.005916476249694824, 0.006186068058013916, 0.006455659866333008, 0.0067252516746521, 0.006994843482971191, 0.007264435291290283, 0.007534027099609375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 11.0, 24.0, 67.0, 173.0, 261.0, 247.0, 136.0, 56.0, 16.0, 11.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.59414541721344, -1.5484282970428467, -1.5027111768722534, -1.4569940567016602, -1.411276936531067, -1.3655598163604736, -1.3198425769805908, -1.2741254568099976, -1.2284083366394043, -1.182691216468811, -1.1369740962982178, -1.0912569761276245, -1.0455398559570312, -0.9998226761817932, -0.9541055560112, -0.9083883762359619, -0.8626713156700134, -0.8169541954994202, -0.7712370753288269, -0.7255198955535889, -0.6798027753829956, -0.6340856552124023, -0.5883685350418091, -0.5426514148712158, -0.49693426489830017, -0.4512171447277069, -0.40549999475479126, -0.359782874584198, -0.31406575441360474, -0.2683486044406891, -0.22263148427009583, -0.17691433429718018, -0.13119721412658691, -0.08548007905483246, -0.0397629514336586, 0.005954176187515259, 0.051671311259269714, 0.09738844633102417, 0.14310556650161743, 0.18882271647453308, 0.23453983664512634, 0.2802569568157196, 0.32597410678863525, 0.3716912269592285, 0.4174083471298218, 0.4631254971027374, 0.5088425874710083, 0.5545597672462463, 0.6002768874168396, 0.6459940075874329, 0.6917111277580261, 0.7374283075332642, 0.7831454277038574, 0.8288625478744507, 0.874579668045044, 0.9202967882156372, 0.9660139083862305, 1.0117310285568237, 1.057448148727417, 1.1031652688980103, 1.1488823890686035, 1.1945996284484863, 1.24031662940979, 1.2860338687896729, 1.3317509889602661]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 8.0, 10.0, 27.0, 40.0, 75.0, 115.0, 148.0, 165.0, 143.0, 107.0, 71.0, 47.0, 26.0, 14.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0395655632019043, -1.0002890825271606, -0.961012601852417, -0.9217360615730286, -0.8824595808982849, -0.8431831002235413, -0.8039065599441528, -0.7646300792694092, -0.7253535985946655, -0.6860771179199219, -0.6468006372451782, -0.6075240969657898, -0.5682476162910461, -0.5289711356163025, -0.48969462513923645, -0.4504181146621704, -0.41114163398742676, -0.3718651533126831, -0.33258864283561707, -0.293312132358551, -0.2540356516838074, -0.21475915610790253, -0.17548266053199768, -0.13620615005493164, -0.09692966938018799, -0.05765317380428314, -0.018376678228378296, 0.02089981734752655, 0.060176312923431396, 0.09945280849933624, 0.1387293040752411, 0.17800581455230713, 0.21728229522705078, 0.25655877590179443, 0.2958352863788605, 0.3351117968559265, 0.37438827753067017, 0.4136647582054138, 0.45294126868247986, 0.4922177791595459, 0.5314942598342896, 0.5707707405090332, 0.6100472211837769, 0.6493237614631653, 0.6886002421379089, 0.7278767228126526, 0.767153263092041, 0.8064297437667847, 0.8457062244415283, 0.884982705116272, 0.9242591857910156, 0.963535726070404, 1.002812147140503, 1.0420887470245361, 1.0813652276992798, 1.1206417083740234, 1.159918189048767, 1.1991946697235107, 1.2384711503982544, 1.277747631072998, 1.3170242309570312, 1.356300711631775, 1.3955771923065186, 1.4348536729812622, 1.4741301536560059]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 6.0, 10.0, 11.0, 12.0, 22.0, 32.0, 55.0, 114.0, 242.0, 499.0, 1151.0, 2621.0, 7029.0, 24735.0, 784883.0, 200302.0, 17462.0, 5476.0, 2222.0, 864.0, 392.0, 185.0, 91.0, 58.0, 37.0, 13.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.9619140625, -0.9351043701171875, -0.908294677734375, -0.8814849853515625, -0.85467529296875, -0.8278656005859375, -0.801055908203125, -0.7742462158203125, -0.7474365234375, -0.7206268310546875, -0.693817138671875, -0.6670074462890625, -0.64019775390625, -0.6133880615234375, -0.586578369140625, -0.5597686767578125, -0.532958984375, -0.5061492919921875, -0.479339599609375, -0.4525299072265625, -0.42572021484375, -0.3989105224609375, -0.372100830078125, -0.3452911376953125, -0.3184814453125, -0.2916717529296875, -0.264862060546875, -0.2380523681640625, -0.21124267578125, -0.1844329833984375, -0.157623291015625, -0.1308135986328125, -0.10400390625, -0.0771942138671875, -0.050384521484375, -0.0235748291015625, 0.00323486328125, 0.0300445556640625, 0.056854248046875, 0.0836639404296875, 0.1104736328125, 0.1372833251953125, 0.164093017578125, 0.1909027099609375, 0.21771240234375, 0.2445220947265625, 0.271331787109375, 0.2981414794921875, 0.324951171875, 0.3517608642578125, 0.378570556640625, 0.4053802490234375, 0.43218994140625, 0.4589996337890625, 0.485809326171875, 0.5126190185546875, 0.5394287109375, 0.5662384033203125, 0.593048095703125, 0.6198577880859375, 0.64666748046875, 0.6734771728515625, 0.700286865234375, 0.7270965576171875, 0.75390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 3.0, 10.0, 8.0, 14.0, 38.0, 59.0, 109.0, 127.0, 140.0, 145.0, 117.0, 80.0, 61.0, 54.0, 20.0, 13.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9013671875, -1.8281707763671875, -1.754974365234375, -1.6817779541015625, -1.60858154296875, -1.5353851318359375, -1.462188720703125, -1.3889923095703125, -1.3157958984375, -1.2425994873046875, -1.169403076171875, -1.0962066650390625, -1.02301025390625, -0.9498138427734375, -0.876617431640625, -0.8034210205078125, -0.730224609375, -0.6570281982421875, -0.583831787109375, -0.5106353759765625, -0.43743896484375, -0.3642425537109375, -0.291046142578125, -0.2178497314453125, -0.1446533203125, -0.0714569091796875, 0.001739501953125, 0.0749359130859375, 0.14813232421875, 0.2213287353515625, 0.294525146484375, 0.3677215576171875, 0.44091796875, 0.5141143798828125, 0.587310791015625, 0.6605072021484375, 0.73370361328125, 0.8069000244140625, 0.880096435546875, 0.9532928466796875, 1.0264892578125, 1.0996856689453125, 1.172882080078125, 1.2460784912109375, 1.31927490234375, 1.3924713134765625, 1.465667724609375, 1.5388641357421875, 1.612060546875, 1.6852569580078125, 1.758453369140625, 1.8316497802734375, 1.90484619140625, 1.9780426025390625, 2.051239013671875, 2.1244354248046875, 2.1976318359375, 2.2708282470703125, 2.344024658203125, 2.4172210693359375, 2.49041748046875, 2.5636138916015625, 2.636810302734375, 2.7100067138671875, 2.783203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 4.0, 13.0, 12.0, 25.0, 62.0, 109.0, 435.0, 1045926.0, 1682.0, 154.0, 61.0, 33.0, 16.0, 12.0, 4.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.301025390625, -9.01611328125, -8.731201171875, -8.4462890625, -8.161376953125, -7.87646484375, -7.591552734375, -7.306640625, -7.021728515625, -6.73681640625, -6.451904296875, -6.1669921875, -5.882080078125, -5.59716796875, -5.312255859375, -5.02734375, -4.742431640625, -4.45751953125, -4.172607421875, -3.8876953125, -3.602783203125, -3.31787109375, -3.032958984375, -2.748046875, -2.463134765625, -2.17822265625, -1.893310546875, -1.6083984375, -1.323486328125, -1.03857421875, -0.753662109375, -0.46875, -0.183837890625, 0.10107421875, 0.385986328125, 0.6708984375, 0.955810546875, 1.24072265625, 1.525634765625, 1.810546875, 2.095458984375, 2.38037109375, 2.665283203125, 2.9501953125, 3.235107421875, 3.52001953125, 3.804931640625, 4.08984375, 4.374755859375, 4.65966796875, 4.944580078125, 5.2294921875, 5.514404296875, 5.79931640625, 6.084228515625, 6.369140625, 6.654052734375, 6.93896484375, 7.223876953125, 7.5087890625, 7.793701171875, 8.07861328125, 8.363525390625, 8.6484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 8.0, 14.0, 14.0, 31.0, 58.0, 107.0, 172.0, 166.0, 178.0, 123.0, 58.0, 32.0, 14.0, 13.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9609375, -4.81317138671875, -4.6654052734375, -4.51763916015625, -4.369873046875, -4.22210693359375, -4.0743408203125, -3.92657470703125, -3.77880859375, -3.63104248046875, -3.4832763671875, -3.33551025390625, -3.187744140625, -3.03997802734375, -2.8922119140625, -2.74444580078125, -2.5966796875, -2.44891357421875, -2.3011474609375, -2.15338134765625, -2.005615234375, -1.85784912109375, -1.7100830078125, -1.56231689453125, -1.41455078125, -1.26678466796875, -1.1190185546875, -0.97125244140625, -0.823486328125, -0.67572021484375, -0.5279541015625, -0.38018798828125, -0.232421875, -0.08465576171875, 0.0631103515625, 0.21087646484375, 0.358642578125, 0.50640869140625, 0.6541748046875, 0.80194091796875, 0.94970703125, 1.09747314453125, 1.2452392578125, 1.39300537109375, 1.540771484375, 1.68853759765625, 1.8363037109375, 1.98406982421875, 2.1318359375, 2.27960205078125, 2.4273681640625, 2.57513427734375, 2.722900390625, 2.87066650390625, 3.0184326171875, 3.16619873046875, 3.31396484375, 3.46173095703125, 3.6094970703125, 3.75726318359375, 3.905029296875, 4.05279541015625, 4.2005615234375, 4.34832763671875, 4.49609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 12.0, 8.0, 28.0, 36.0, 51.0, 117.0, 256.0, 658.0, 2092.0, 13585.0, 875173.0, 146086.0, 7894.0, 1561.0, 520.0, 244.0, 91.0, 55.0, 24.0, 22.0, 7.0, 7.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.401611328125, -0.3893928527832031, -0.37717437744140625, -0.3649559020996094, -0.3527374267578125, -0.3405189514160156, -0.32830047607421875, -0.3160820007324219, -0.303863525390625, -0.2916450500488281, -0.27942657470703125, -0.2672080993652344, -0.2549896240234375, -0.24277114868164062, -0.23055267333984375, -0.21833419799804688, -0.20611572265625, -0.19389724731445312, -0.18167877197265625, -0.16946029663085938, -0.1572418212890625, -0.14502334594726562, -0.13280487060546875, -0.12058639526367188, -0.108367919921875, -0.09614944458007812, -0.08393096923828125, -0.07171249389648438, -0.0594940185546875, -0.047275543212890625, -0.03505706787109375, -0.022838592529296875, -0.0106201171875, 0.001598358154296875, 0.01381683349609375, 0.026035308837890625, 0.0382537841796875, 0.050472259521484375, 0.06269073486328125, 0.07490921020507812, 0.087127685546875, 0.09934616088867188, 0.11156463623046875, 0.12378311157226562, 0.1360015869140625, 0.14822006225585938, 0.16043853759765625, 0.17265701293945312, 0.18487548828125, 0.19709396362304688, 0.20931243896484375, 0.22153091430664062, 0.2337493896484375, 0.24596786499023438, 0.25818634033203125, 0.2704048156738281, 0.282623291015625, 0.2948417663574219, 0.30706024169921875, 0.3192787170410156, 0.3314971923828125, 0.3437156677246094, 0.35593414306640625, 0.3681526184082031, 0.38037109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 9.0, 5.0, 6.0, 5.0, 10.0, 12.0, 24.0, 46.0, 89.0, 310.0, 249.0, 87.0, 45.0, 29.0, 16.0, 11.0, 5.0, 4.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.6047229766845703e-05, -2.5003217160701752e-05, -2.39592045545578e-05, -2.291519194841385e-05, -2.1871179342269897e-05, -2.0827166736125946e-05, -1.9783154129981995e-05, -1.8739141523838043e-05, -1.7695128917694092e-05, -1.665111631155014e-05, -1.560710370540619e-05, -1.4563091099262238e-05, -1.3519078493118286e-05, -1.2475065886974335e-05, -1.1431053280830383e-05, -1.0387040674686432e-05, -9.34302806854248e-06, -8.299015462398529e-06, -7.255002856254578e-06, -6.210990250110626e-06, -5.166977643966675e-06, -4.122965037822723e-06, -3.078952431678772e-06, -2.0349398255348206e-06, -9.909272193908691e-07, 5.3085386753082275e-08, 1.0970979928970337e-06, 2.141110599040985e-06, 3.1851232051849365e-06, 4.229135811328888e-06, 5.273148417472839e-06, 6.317161023616791e-06, 7.361173629760742e-06, 8.405186235904694e-06, 9.449198842048645e-06, 1.0493211448192596e-05, 1.1537224054336548e-05, 1.25812366604805e-05, 1.362524926662445e-05, 1.4669261872768402e-05, 1.5713274478912354e-05, 1.6757287085056305e-05, 1.7801299691200256e-05, 1.8845312297344208e-05, 1.988932490348816e-05, 2.093333750963211e-05, 2.1977350115776062e-05, 2.3021362721920013e-05, 2.4065375328063965e-05, 2.5109387934207916e-05, 2.6153400540351868e-05, 2.719741314649582e-05, 2.824142575263977e-05, 2.9285438358783722e-05, 3.0329450964927673e-05, 3.1373463571071625e-05, 3.2417476177215576e-05, 3.346148878335953e-05, 3.450550138950348e-05, 3.554951399564743e-05, 3.659352660179138e-05, 3.763753920793533e-05, 3.8681551814079285e-05, 3.9725564420223236e-05, 4.076957702636719e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 10.0, 7.0, 16.0, 21.0, 25.0, 48.0, 77.0, 124.0, 227.0, 426.0, 828.0, 1979.0, 5455.0, 20734.0, 348270.0, 638240.0, 22368.0, 5839.0, 2013.0, 838.0, 435.0, 212.0, 116.0, 68.0, 56.0, 35.0, 24.0, 14.0, 12.0, 7.0, 9.0, 8.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.260009765625, -0.2510528564453125, -0.242095947265625, -0.2331390380859375, -0.22418212890625, -0.2152252197265625, -0.206268310546875, -0.1973114013671875, -0.1883544921875, -0.1793975830078125, -0.170440673828125, -0.1614837646484375, -0.15252685546875, -0.1435699462890625, -0.134613037109375, -0.1256561279296875, -0.11669921875, -0.1077423095703125, -0.098785400390625, -0.0898284912109375, -0.08087158203125, -0.0719146728515625, -0.062957763671875, -0.0540008544921875, -0.0450439453125, -0.0360870361328125, -0.027130126953125, -0.0181732177734375, -0.00921630859375, -0.0002593994140625, 0.008697509765625, 0.0176544189453125, 0.026611328125, 0.0355682373046875, 0.044525146484375, 0.0534820556640625, 0.06243896484375, 0.0713958740234375, 0.080352783203125, 0.0893096923828125, 0.0982666015625, 0.1072235107421875, 0.116180419921875, 0.1251373291015625, 0.13409423828125, 0.1430511474609375, 0.152008056640625, 0.1609649658203125, 0.169921875, 0.1788787841796875, 0.187835693359375, 0.1967926025390625, 0.20574951171875, 0.2147064208984375, 0.223663330078125, 0.2326202392578125, 0.2415771484375, 0.2505340576171875, 0.259490966796875, 0.2684478759765625, 0.27740478515625, 0.2863616943359375, 0.295318603515625, 0.3042755126953125, 0.313232421875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 5.0, 2.0, 11.0, 11.0, 28.0, 39.0, 83.0, 176.0, 390.0, 89.0, 58.0, 33.0, 16.0, 12.0, 12.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1922607421875, -0.18771076202392578, -0.18316078186035156, -0.17861080169677734, -0.17406082153320312, -0.1695108413696289, -0.1649608612060547, -0.16041088104248047, -0.15586090087890625, -0.15131092071533203, -0.1467609405517578, -0.1422109603881836, -0.13766098022460938, -0.13311100006103516, -0.12856101989746094, -0.12401103973388672, -0.1194610595703125, -0.11491107940673828, -0.11036109924316406, -0.10581111907958984, -0.10126113891601562, -0.0967111587524414, -0.09216117858886719, -0.08761119842529297, -0.08306121826171875, -0.07851123809814453, -0.07396125793457031, -0.0694112777709961, -0.06486129760742188, -0.060311317443847656, -0.05576133728027344, -0.05121135711669922, -0.046661376953125, -0.04211139678955078, -0.03756141662597656, -0.033011436462402344, -0.028461456298828125, -0.023911476135253906, -0.019361495971679688, -0.014811515808105469, -0.01026153564453125, -0.005711555480957031, -0.0011615753173828125, 0.0033884048461914062, 0.007938385009765625, 0.012488365173339844, 0.017038345336914062, 0.02158832550048828, 0.0261383056640625, 0.03068828582763672, 0.03523826599121094, 0.039788246154785156, 0.044338226318359375, 0.048888206481933594, 0.05343818664550781, 0.05798816680908203, 0.06253814697265625, 0.06708812713623047, 0.07163810729980469, 0.0761880874633789, 0.08073806762695312, 0.08528804779052734, 0.08983802795410156, 0.09438800811767578, 0.09893798828125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 13.0, 43.0, 97.0, 157.0, 230.0, 212.0, 146.0, 53.0, 26.0, 11.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.920499324798584, -2.8390042781829834, -2.757509469985962, -2.6760144233703613, -2.59451961517334, -2.5130245685577393, -2.4315295219421387, -2.350034713745117, -2.2685396671295166, -2.187044620513916, -2.1055498123168945, -2.024054765701294, -1.942559838294983, -1.8610649108886719, -1.7795698642730713, -1.6980749368667603, -1.6165800094604492, -1.5350850820541382, -1.4535901546478271, -1.3720951080322266, -1.2906001806259155, -1.2091052532196045, -1.127610206604004, -1.0461152791976929, -0.9646203517913818, -0.8831254243850708, -0.801630437374115, -0.7201354503631592, -0.6386405229568481, -0.5571455955505371, -0.4756506085395813, -0.3941556215286255, -0.31266093254089355, -0.23116597533226013, -0.1496710181236267, -0.06817606091499329, 0.013318896293640137, 0.09481385350227356, 0.17630881071090698, 0.2578037977218628, 0.33929872512817383, 0.42079368233680725, 0.5022886395454407, 0.5837836265563965, 0.6652785539627075, 0.7467734813690186, 0.8282684683799744, 0.9097634553909302, 0.9912583827972412, 1.0727533102035522, 1.1542482376098633, 1.2357432842254639, 1.317238211631775, 1.398733139038086, 1.4802281856536865, 1.5617231130599976, 1.6432180404663086, 1.7247129678726196, 1.8062078952789307, 1.8877029418945312, 1.9691978693008423, 2.0506927967071533, 2.132187843322754, 2.2136826515197754, 2.295177698135376]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 17.0, 17.0, 25.0, 52.0, 57.0, 70.0, 81.0, 75.0, 82.0, 79.0, 80.0, 77.0, 74.0, 47.0, 49.0, 27.0, 23.0, 22.0, 9.0, 8.0, 5.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.432645320892334, -4.28529691696167, -4.137948513031006, -3.990600109100342, -3.8432517051696777, -3.6959033012390137, -3.5485551357269287, -3.4012067317962646, -3.2538583278656006, -3.1065099239349365, -2.9591615200042725, -2.8118131160736084, -2.6644649505615234, -2.5171165466308594, -2.3697681427001953, -2.2224197387695312, -2.075071334838867, -1.9277229309082031, -1.780374526977539, -1.6330262422561646, -1.4856778383255005, -1.3383294343948364, -1.190981149673462, -1.0436327457427979, -0.8962843418121338, -0.7489359378814697, -0.6015875935554504, -0.45423921942710876, -0.3068908452987671, -0.15954244136810303, -0.01219409704208374, 0.13515424728393555, 0.2825026512145996, 0.4298510253429413, 0.577199399471283, 0.7245477437973022, 0.8718961477279663, 1.0192445516586304, 1.1665928363800049, 1.313941240310669, 1.461289644241333, 1.608638048171997, 1.7559864521026611, 1.9033347368240356, 2.05068302154541, 2.198031425476074, 2.3453798294067383, 2.4927282333374023, 2.6400766372680664, 2.7874250411987305, 2.9347734451293945, 3.0821218490600586, 3.2294702529907227, 3.3768186569213867, 3.5241668224334717, 3.6715152263641357, 3.8188636302948, 3.966212034225464, 4.113560199737549, 4.260908603668213, 4.408257007598877, 4.555605411529541, 4.702953815460205, 4.850302219390869, 4.997650623321533]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 14.0, 11.0, 17.0, 26.0, 21.0, 43.0, 59.0, 93.0, 175.0, 423.0, 1334.0, 5970.0, 66938.0, 4045458.0, 66011.0, 5685.0, 1181.0, 380.0, 170.0, 75.0, 58.0, 45.0, 17.0, 21.0, 12.0, 14.0, 12.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.189453125, -2.117645263671875, -2.04583740234375, -1.974029541015625, -1.9022216796875, -1.830413818359375, -1.75860595703125, -1.686798095703125, -1.614990234375, -1.543182373046875, -1.47137451171875, -1.399566650390625, -1.3277587890625, -1.255950927734375, -1.18414306640625, -1.112335205078125, -1.04052734375, -0.968719482421875, -0.89691162109375, -0.825103759765625, -0.7532958984375, -0.681488037109375, -0.60968017578125, -0.537872314453125, -0.466064453125, -0.394256591796875, -0.32244873046875, -0.250640869140625, -0.1788330078125, -0.107025146484375, -0.03521728515625, 0.036590576171875, 0.1083984375, 0.180206298828125, 0.25201416015625, 0.323822021484375, 0.3956298828125, 0.467437744140625, 0.53924560546875, 0.611053466796875, 0.682861328125, 0.754669189453125, 0.82647705078125, 0.898284912109375, 0.9700927734375, 1.041900634765625, 1.11370849609375, 1.185516357421875, 1.25732421875, 1.329132080078125, 1.40093994140625, 1.472747802734375, 1.5445556640625, 1.616363525390625, 1.68817138671875, 1.759979248046875, 1.831787109375, 1.903594970703125, 1.97540283203125, 2.047210693359375, 2.1190185546875, 2.190826416015625, 2.26263427734375, 2.334442138671875, 2.40625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 10.0, 21.0, 13.0, 42.0, 58.0, 103.0, 140.0, 165.0, 153.0, 113.0, 84.0, 42.0, 29.0, 15.0, 11.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.29296875, -1.2521209716796875, -1.211273193359375, -1.1704254150390625, -1.12957763671875, -1.0887298583984375, -1.047882080078125, -1.0070343017578125, -0.9661865234375, -0.9253387451171875, -0.884490966796875, -0.8436431884765625, -0.80279541015625, -0.7619476318359375, -0.721099853515625, -0.6802520751953125, -0.639404296875, -0.5985565185546875, -0.557708740234375, -0.5168609619140625, -0.47601318359375, -0.4351654052734375, -0.394317626953125, -0.3534698486328125, -0.3126220703125, -0.2717742919921875, -0.230926513671875, -0.1900787353515625, -0.14923095703125, -0.1083831787109375, -0.067535400390625, -0.0266876220703125, 0.01416015625, 0.0550079345703125, 0.095855712890625, 0.1367034912109375, 0.17755126953125, 0.2183990478515625, 0.259246826171875, 0.3000946044921875, 0.3409423828125, 0.3817901611328125, 0.422637939453125, 0.4634857177734375, 0.50433349609375, 0.5451812744140625, 0.586029052734375, 0.6268768310546875, 0.667724609375, 0.7085723876953125, 0.749420166015625, 0.7902679443359375, 0.83111572265625, 0.8719635009765625, 0.912811279296875, 0.9536590576171875, 0.9945068359375, 1.0353546142578125, 1.076202392578125, 1.1170501708984375, 1.15789794921875, 1.1987457275390625, 1.239593505859375, 1.2804412841796875, 1.3212890625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 9.0, 10.0, 25.0, 24.0, 60.0, 118.0, 328.0, 1562.0, 21261.0, 4065931.0, 100435.0, 3682.0, 523.0, 137.0, 75.0, 30.0, 19.0, 15.0, 10.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.408203125, -2.33221435546875, -2.2562255859375, -2.18023681640625, -2.104248046875, -2.02825927734375, -1.9522705078125, -1.87628173828125, -1.80029296875, -1.72430419921875, -1.6483154296875, -1.57232666015625, -1.496337890625, -1.42034912109375, -1.3443603515625, -1.26837158203125, -1.1923828125, -1.11639404296875, -1.0404052734375, -0.96441650390625, -0.888427734375, -0.81243896484375, -0.7364501953125, -0.66046142578125, -0.58447265625, -0.50848388671875, -0.4324951171875, -0.35650634765625, -0.280517578125, -0.20452880859375, -0.1285400390625, -0.05255126953125, 0.0234375, 0.09942626953125, 0.1754150390625, 0.25140380859375, 0.327392578125, 0.40338134765625, 0.4793701171875, 0.55535888671875, 0.63134765625, 0.70733642578125, 0.7833251953125, 0.85931396484375, 0.935302734375, 1.01129150390625, 1.0872802734375, 1.16326904296875, 1.2392578125, 1.31524658203125, 1.3912353515625, 1.46722412109375, 1.543212890625, 1.61920166015625, 1.6951904296875, 1.77117919921875, 1.84716796875, 1.92315673828125, 1.9991455078125, 2.07513427734375, 2.151123046875, 2.22711181640625, 2.3031005859375, 2.37908935546875, 2.455078125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 8.0, 7.0, 11.0, 13.0, 34.0, 41.0, 71.0, 138.0, 301.0, 902.0, 1409.0, 641.0, 210.0, 84.0, 50.0, 42.0, 24.0, 18.0, 18.0, 10.0, 12.0, 11.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294921875, -0.284149169921875, -0.27337646484375, -0.262603759765625, -0.2518310546875, -0.241058349609375, -0.23028564453125, -0.219512939453125, -0.208740234375, -0.197967529296875, -0.18719482421875, -0.176422119140625, -0.1656494140625, -0.154876708984375, -0.14410400390625, -0.133331298828125, -0.12255859375, -0.111785888671875, -0.10101318359375, -0.090240478515625, -0.0794677734375, -0.068695068359375, -0.05792236328125, -0.047149658203125, -0.036376953125, -0.025604248046875, -0.01483154296875, -0.004058837890625, 0.0067138671875, 0.017486572265625, 0.02825927734375, 0.039031982421875, 0.0498046875, 0.060577392578125, 0.07135009765625, 0.082122802734375, 0.0928955078125, 0.103668212890625, 0.11444091796875, 0.125213623046875, 0.135986328125, 0.146759033203125, 0.15753173828125, 0.168304443359375, 0.1790771484375, 0.189849853515625, 0.20062255859375, 0.211395263671875, 0.22216796875, 0.232940673828125, 0.24371337890625, 0.254486083984375, 0.2652587890625, 0.276031494140625, 0.28680419921875, 0.297576904296875, 0.308349609375, 0.319122314453125, 0.32989501953125, 0.340667724609375, 0.3514404296875, 0.362213134765625, 0.37298583984375, 0.383758544921875, 0.39453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 12.0, 34.0, 85.0, 214.0, 302.0, 212.0, 92.0, 42.0, 12.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5103890895843506, -3.4348366260528564, -3.3592841625213623, -3.2837319374084473, -3.208179473876953, -3.132627010345459, -3.057074546813965, -2.9815220832824707, -2.9059696197509766, -2.8304171562194824, -2.7548646926879883, -2.6793124675750732, -2.603760004043579, -2.528207540512085, -2.452655076980591, -2.3771026134490967, -2.3015503883361816, -2.2259979248046875, -2.1504454612731934, -2.0748932361602783, -1.9993407726287842, -1.92378830909729, -1.848235845565796, -1.7726833820343018, -1.6971310377120972, -1.621578574180603, -1.5460262298583984, -1.4704737663269043, -1.3949213027954102, -1.3193689584732056, -1.2438164949417114, -1.1682641506195068, -1.0927119255065918, -1.0171594619750977, -0.9416071176528931, -0.8660546541213989, -0.7905022501945496, -0.7149498462677002, -0.639397382736206, -0.5638449788093567, -0.4882925748825073, -0.41274017095565796, -0.3371877372264862, -0.26163530349731445, -0.1860828995704651, -0.11053049564361572, -0.03497806191444397, 0.04057437181472778, 0.11612677574157715, 0.1916791945695877, 0.26723161339759827, 0.34278404712677, 0.4183364510536194, 0.49388885498046875, 0.5694413185119629, 0.6449937224388123, 0.7205461263656616, 0.796098530292511, 0.8716509342193604, 0.9472033977508545, 1.0227558612823486, 1.0983082056045532, 1.1738606691360474, 1.249413013458252, 1.324965476989746]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 11.0, 16.0, 27.0, 54.0, 73.0, 92.0, 105.0, 127.0, 122.0, 114.0, 76.0, 67.0, 58.0, 30.0, 19.0, 12.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.397276759147644, -1.3529143333435059, -1.3085520267486572, -1.264189600944519, -1.2198271751403809, -1.1754648685455322, -1.131102442741394, -1.0867400169372559, -1.0423777103424072, -0.9980153441429138, -0.9536529183387756, -0.9092905521392822, -0.8649281859397888, -0.8205658197402954, -0.7762033939361572, -0.7318410277366638, -0.6874786019325256, -0.6431162357330322, -0.598753809928894, -0.5543914437294006, -0.5100290775299072, -0.46566668152809143, -0.42130428552627563, -0.3769419193267822, -0.33257952332496643, -0.28821712732315063, -0.24385476112365723, -0.19949236512184143, -0.15512998402118683, -0.11076760292053223, -0.06640520691871643, -0.022042840719223022, 0.022319555282592773, 0.06668193638324738, 0.11104432493448257, 0.15540671348571777, 0.19976909458637238, 0.24413147568702698, 0.2884938716888428, 0.3328562378883362, 0.377218633890152, 0.4215810298919678, 0.4659433960914612, 0.5103057622909546, 0.5546681880950928, 0.5990305542945862, 0.6433929204940796, 0.6877553462982178, 0.7321177124977112, 0.7764800786972046, 0.8208425045013428, 0.8652048707008362, 0.9095672369003296, 0.9539296627044678, 0.9982920289039612, 1.0426543951034546, 1.0870168209075928, 1.131379246711731, 1.1757415533065796, 1.2201039791107178, 1.264466404914856, 1.3088287115097046, 1.3531911373138428, 1.3975534439086914, 1.4419158697128296]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 9.0, 3.0, 15.0, 23.0, 34.0, 84.0, 150.0, 353.0, 914.0, 3023.0, 27222.0, 808517.0, 197019.0, 8493.0, 1634.0, 566.0, 237.0, 112.0, 55.0, 38.0, 16.0, 12.0, 4.0, 4.0, 5.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4365234375, -0.4239692687988281, -0.41141510009765625, -0.3988609313964844, -0.3863067626953125, -0.3737525939941406, -0.36119842529296875, -0.3486442565917969, -0.336090087890625, -0.3235359191894531, -0.31098175048828125, -0.2984275817871094, -0.2858734130859375, -0.2733192443847656, -0.26076507568359375, -0.24821090698242188, -0.23565673828125, -0.22310256958007812, -0.21054840087890625, -0.19799423217773438, -0.1854400634765625, -0.17288589477539062, -0.16033172607421875, -0.14777755737304688, -0.135223388671875, -0.12266921997070312, -0.11011505126953125, -0.09756088256835938, -0.0850067138671875, -0.07245254516601562, -0.05989837646484375, -0.047344207763671875, -0.0347900390625, -0.022235870361328125, -0.00968170166015625, 0.002872467041015625, 0.0154266357421875, 0.027980804443359375, 0.04053497314453125, 0.053089141845703125, 0.065643310546875, 0.07819747924804688, 0.09075164794921875, 0.10330581665039062, 0.1158599853515625, 0.12841415405273438, 0.14096832275390625, 0.15352249145507812, 0.16607666015625, 0.17863082885742188, 0.19118499755859375, 0.20373916625976562, 0.2162933349609375, 0.22884750366210938, 0.24140167236328125, 0.2539558410644531, 0.266510009765625, 0.2790641784667969, 0.29161834716796875, 0.3041725158691406, 0.3167266845703125, 0.3292808532714844, 0.34183502197265625, 0.3543891906738281, 0.366943359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 10.0, 11.0, 26.0, 49.0, 82.0, 96.0, 104.0, 118.0, 142.0, 119.0, 87.0, 70.0, 39.0, 23.0, 12.0, 5.0, 10.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87841796875, -0.8457412719726562, -0.8130645751953125, -0.7803878784179688, -0.747711181640625, -0.7150344848632812, -0.6823577880859375, -0.6496810913085938, -0.61700439453125, -0.5843276977539062, -0.5516510009765625, -0.5189743041992188, -0.486297607421875, -0.45362091064453125, -0.4209442138671875, -0.38826751708984375, -0.3555908203125, -0.32291412353515625, -0.2902374267578125, -0.25756072998046875, -0.224884033203125, -0.19220733642578125, -0.1595306396484375, -0.12685394287109375, -0.09417724609375, -0.06150054931640625, -0.0288238525390625, 0.00385284423828125, 0.036529541015625, 0.06920623779296875, 0.1018829345703125, 0.13455963134765625, 0.167236328125, 0.19991302490234375, 0.2325897216796875, 0.26526641845703125, 0.297943115234375, 0.33061981201171875, 0.3632965087890625, 0.39597320556640625, 0.42864990234375, 0.46132659912109375, 0.4940032958984375, 0.5266799926757812, 0.559356689453125, 0.5920333862304688, 0.6247100830078125, 0.6573867797851562, 0.6900634765625, 0.7227401733398438, 0.7554168701171875, 0.7880935668945312, 0.820770263671875, 0.8534469604492188, 0.8861236572265625, 0.9188003540039062, 0.95147705078125, 0.9841537475585938, 1.0168304443359375, 1.0495071411132812, 1.082183837890625, 1.1148605346679688, 1.1475372314453125, 1.1802139282226562, 1.212890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 7.0, 11.0, 13.0, 19.0, 22.0, 42.0, 57.0, 95.0, 151.0, 215.0, 362.0, 574.0, 927.0, 1657.0, 2689.0, 4437.0, 8346.0, 15092.0, 28913.0, 59016.0, 122817.0, 240342.0, 267612.0, 149278.0, 70736.0, 35037.0, 17638.0, 9476.0, 5219.0, 3079.0, 1827.0, 1051.0, 620.0, 434.0, 279.0, 180.0, 92.0, 70.0, 52.0, 26.0, 14.0, 21.0, 9.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.054962158203125, -0.05330324172973633, -0.051644325256347656, -0.049985408782958984, -0.04832649230957031, -0.04666757583618164, -0.04500865936279297, -0.0433497428894043, -0.041690826416015625, -0.04003190994262695, -0.03837299346923828, -0.03671407699584961, -0.03505516052246094, -0.033396244049072266, -0.031737327575683594, -0.030078411102294922, -0.02841949462890625, -0.026760578155517578, -0.025101661682128906, -0.023442745208740234, -0.021783828735351562, -0.02012491226196289, -0.01846599578857422, -0.016807079315185547, -0.015148162841796875, -0.013489246368408203, -0.011830329895019531, -0.01017141342163086, -0.008512496948242188, -0.006853580474853516, -0.005194664001464844, -0.003535747528076172, -0.0018768310546875, -0.00021791458129882812, 0.0014410018920898438, 0.0030999183654785156, 0.0047588348388671875, 0.006417751312255859, 0.008076667785644531, 0.009735584259033203, 0.011394500732421875, 0.013053417205810547, 0.014712333679199219, 0.01637125015258789, 0.018030166625976562, 0.019689083099365234, 0.021347999572753906, 0.023006916046142578, 0.02466583251953125, 0.026324748992919922, 0.027983665466308594, 0.029642581939697266, 0.03130149841308594, 0.03296041488647461, 0.03461933135986328, 0.03627824783325195, 0.037937164306640625, 0.0395960807800293, 0.04125499725341797, 0.04291391372680664, 0.04457283020019531, 0.046231746673583984, 0.047890663146972656, 0.04954957962036133, 0.05120849609375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 6.0, 12.0, 6.0, 10.0, 21.0, 16.0, 20.0, 27.0, 27.0, 28.0, 33.0, 31.0, 34.0, 52.0, 45.0, 46.0, 57.0, 43.0, 45.0, 42.0, 52.0, 44.0, 39.0, 36.0, 27.0, 35.0, 27.0, 20.0, 20.0, 17.0, 19.0, 7.0, 9.0, 6.0, 7.0, 4.0, 5.0, 3.0, 11.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.83642578125, -0.80999755859375, -0.7835693359375, -0.75714111328125, -0.730712890625, -0.70428466796875, -0.6778564453125, -0.65142822265625, -0.625, -0.59857177734375, -0.5721435546875, -0.54571533203125, -0.519287109375, -0.49285888671875, -0.4664306640625, -0.44000244140625, -0.41357421875, -0.38714599609375, -0.3607177734375, -0.33428955078125, -0.307861328125, -0.28143310546875, -0.2550048828125, -0.22857666015625, -0.2021484375, -0.17572021484375, -0.1492919921875, -0.12286376953125, -0.096435546875, -0.07000732421875, -0.0435791015625, -0.01715087890625, 0.00927734375, 0.03570556640625, 0.0621337890625, 0.08856201171875, 0.114990234375, 0.14141845703125, 0.1678466796875, 0.19427490234375, 0.220703125, 0.24713134765625, 0.2735595703125, 0.29998779296875, 0.326416015625, 0.35284423828125, 0.3792724609375, 0.40570068359375, 0.43212890625, 0.45855712890625, 0.4849853515625, 0.51141357421875, 0.537841796875, 0.56427001953125, 0.5906982421875, 0.61712646484375, 0.6435546875, 0.66998291015625, 0.6964111328125, 0.72283935546875, 0.749267578125, 0.77569580078125, 0.8021240234375, 0.82855224609375, 0.85498046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 9.0, 9.0, 18.0, 19.0, 26.0, 65.0, 79.0, 120.0, 202.0, 461.0, 788.0, 1576.0, 3469.0, 8836.0, 29790.0, 153865.0, 614097.0, 184437.0, 33837.0, 9749.0, 3587.0, 1638.0, 826.0, 438.0, 229.0, 124.0, 73.0, 48.0, 31.0, 24.0, 17.0, 19.0, 16.0, 9.0, 7.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00820159912109375, -0.007949590682983398, -0.007697582244873047, -0.007445573806762695, -0.007193565368652344, -0.006941556930541992, -0.006689548492431641, -0.006437540054321289, -0.0061855316162109375, -0.005933523178100586, -0.005681514739990234, -0.005429506301879883, -0.005177497863769531, -0.00492548942565918, -0.004673480987548828, -0.0044214725494384766, -0.004169464111328125, -0.0039174556732177734, -0.003665447235107422, -0.0034134387969970703, -0.0031614303588867188, -0.002909421920776367, -0.0026574134826660156, -0.002405405044555664, -0.0021533966064453125, -0.001901388168334961, -0.0016493797302246094, -0.0013973712921142578, -0.0011453628540039062, -0.0008933544158935547, -0.0006413459777832031, -0.00038933753967285156, -0.0001373291015625, 0.00011467933654785156, 0.0003666877746582031, 0.0006186962127685547, 0.0008707046508789062, 0.0011227130889892578, 0.0013747215270996094, 0.001626729965209961, 0.0018787384033203125, 0.002130746841430664, 0.0023827552795410156, 0.002634763717651367, 0.0028867721557617188, 0.0031387805938720703, 0.003390789031982422, 0.0036427974700927734, 0.003894805908203125, 0.0041468143463134766, 0.004398822784423828, 0.00465083122253418, 0.004902839660644531, 0.005154848098754883, 0.005406856536865234, 0.005658864974975586, 0.0059108734130859375, 0.006162881851196289, 0.006414890289306641, 0.006666898727416992, 0.006918907165527344, 0.007170915603637695, 0.007422924041748047, 0.0076749324798583984, 0.00792694091796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 4.0, 5.0, 14.0, 5.0, 12.0, 23.0, 41.0, 53.0, 73.0, 76.0, 112.0, 117.0, 95.0, 109.0, 88.0, 51.0, 41.0, 29.0, 19.0, 10.0, 7.0, 3.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7404556274414062e-05, -1.6888603568077087e-05, -1.6372650861740112e-05, -1.5856698155403137e-05, -1.5340745449066162e-05, -1.4824792742729187e-05, -1.4308840036392212e-05, -1.3792887330055237e-05, -1.3276934623718262e-05, -1.2760981917381287e-05, -1.2245029211044312e-05, -1.1729076504707336e-05, -1.1213123798370361e-05, -1.0697171092033386e-05, -1.0181218385696411e-05, -9.665265679359436e-06, -9.149312973022461e-06, -8.633360266685486e-06, -8.11740756034851e-06, -7.601454854011536e-06, -7.0855021476745605e-06, -6.5695494413375854e-06, -6.05359673500061e-06, -5.537644028663635e-06, -5.02169132232666e-06, -4.505738615989685e-06, -3.98978590965271e-06, -3.473833203315735e-06, -2.9578804969787598e-06, -2.4419277906417847e-06, -1.9259750843048096e-06, -1.4100223779678345e-06, -8.940696716308594e-07, -3.781169652938843e-07, 1.3783574104309082e-07, 6.537884473800659e-07, 1.169741153717041e-06, 1.6856938600540161e-06, 2.201646566390991e-06, 2.7175992727279663e-06, 3.2335519790649414e-06, 3.7495046854019165e-06, 4.265457391738892e-06, 4.781410098075867e-06, 5.297362804412842e-06, 5.813315510749817e-06, 6.329268217086792e-06, 6.845220923423767e-06, 7.361173629760742e-06, 7.877126336097717e-06, 8.393079042434692e-06, 8.909031748771667e-06, 9.424984455108643e-06, 9.940937161445618e-06, 1.0456889867782593e-05, 1.0972842574119568e-05, 1.1488795280456543e-05, 1.2004747986793518e-05, 1.2520700693130493e-05, 1.3036653399467468e-05, 1.3552606105804443e-05, 1.4068558812141418e-05, 1.4584511518478394e-05, 1.5100464224815369e-05, 1.5616416931152344e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 2.0, 7.0, 4.0, 19.0, 23.0, 30.0, 36.0, 75.0, 112.0, 187.0, 343.0, 606.0, 1175.0, 2320.0, 5210.0, 12941.0, 39520.0, 206627.0, 606160.0, 126010.0, 28824.0, 9894.0, 4138.0, 2009.0, 976.0, 493.0, 272.0, 188.0, 107.0, 67.0, 50.0, 38.0, 20.0, 21.0, 18.0, 7.0, 1.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.008819580078125, -0.008555293083190918, -0.008291006088256836, -0.008026719093322754, -0.007762432098388672, -0.00749814510345459, -0.007233858108520508, -0.006969571113586426, -0.006705284118652344, -0.006440997123718262, -0.00617671012878418, -0.005912423133850098, -0.005648136138916016, -0.005383849143981934, -0.0051195621490478516, -0.0048552751541137695, -0.0045909881591796875, -0.0043267011642456055, -0.0040624141693115234, -0.0037981271743774414, -0.0035338401794433594, -0.0032695531845092773, -0.0030052661895751953, -0.0027409791946411133, -0.0024766921997070312, -0.0022124052047729492, -0.0019481182098388672, -0.0016838312149047852, -0.0014195442199707031, -0.001155257225036621, -0.0008909702301025391, -0.000626683235168457, -0.000362396240234375, -9.810924530029297e-05, 0.00016617774963378906, 0.0004304647445678711, 0.0006947517395019531, 0.0009590387344360352, 0.0012233257293701172, 0.0014876127243041992, 0.0017518997192382812, 0.0020161867141723633, 0.0022804737091064453, 0.0025447607040405273, 0.0028090476989746094, 0.0030733346939086914, 0.0033376216888427734, 0.0036019086837768555, 0.0038661956787109375, 0.0041304826736450195, 0.0043947696685791016, 0.004659056663513184, 0.004923343658447266, 0.005187630653381348, 0.00545191764831543, 0.005716204643249512, 0.005980491638183594, 0.006244778633117676, 0.006509065628051758, 0.00677335262298584, 0.007037639617919922, 0.007301926612854004, 0.007566213607788086, 0.007830500602722168, 0.00809478759765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 10.0, 8.0, 11.0, 13.0, 9.0, 12.0, 22.0, 29.0, 42.0, 44.0, 90.0, 100.0, 135.0, 119.0, 100.0, 58.0, 42.0, 33.0, 21.0, 16.0, 14.0, 6.0, 12.0, 7.0, 5.0, 3.0, 2.0, 4.0, 5.0, 0.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00312042236328125, -0.0030185580253601074, -0.002916693687438965, -0.0028148293495178223, -0.0027129650115966797, -0.002611100673675537, -0.0025092363357543945, -0.002407371997833252, -0.0023055076599121094, -0.002203643321990967, -0.0021017789840698242, -0.0019999146461486816, -0.001898050308227539, -0.0017961859703063965, -0.001694321632385254, -0.0015924572944641113, -0.0014905929565429688, -0.0013887286186218262, -0.0012868642807006836, -0.001184999942779541, -0.0010831356048583984, -0.0009812712669372559, -0.0008794069290161133, -0.0007775425910949707, -0.0006756782531738281, -0.0005738139152526855, -0.00047194957733154297, -0.0003700852394104004, -0.0002682209014892578, -0.00016635656356811523, -6.449222564697266e-05, 3.737211227416992e-05, 0.0001392364501953125, 0.00024110078811645508, 0.00034296512603759766, 0.00044482946395874023, 0.0005466938018798828, 0.0006485581398010254, 0.000750422477722168, 0.0008522868156433105, 0.0009541511535644531, 0.0010560154914855957, 0.0011578798294067383, 0.0012597441673278809, 0.0013616085052490234, 0.001463472843170166, 0.0015653371810913086, 0.0016672015190124512, 0.0017690658569335938, 0.0018709301948547363, 0.001972794532775879, 0.0020746588706970215, 0.002176523208618164, 0.0022783875465393066, 0.0023802518844604492, 0.002482116222381592, 0.0025839805603027344, 0.002685844898223877, 0.0027877092361450195, 0.002889573574066162, 0.0029914379119873047, 0.0030933022499084473, 0.00319516658782959, 0.0032970309257507324, 0.003398895263671875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 12.0, 12.0, 37.0, 80.0, 171.0, 246.0, 218.0, 136.0, 54.0, 22.0, 10.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5487481355667114, -1.5097471475601196, -1.4707462787628174, -1.4317452907562256, -1.3927443027496338, -1.3537434339523315, -1.3147424459457397, -1.2757415771484375, -1.2367405891418457, -1.197739601135254, -1.1587387323379517, -1.1197377443313599, -1.0807368755340576, -1.0417358875274658, -1.002734899520874, -0.963733971118927, -0.92473304271698, -0.885732114315033, -0.8467311859130859, -0.8077301979064941, -0.7687292695045471, -0.7297283411026001, -0.6907273530960083, -0.6517264246940613, -0.6127254962921143, -0.5737245678901672, -0.5347236394882202, -0.4957226514816284, -0.4567217230796814, -0.4177207946777344, -0.37871983647346497, -0.33971887826919556, -0.30071794986724854, -0.2617170214653015, -0.2227160632610321, -0.1837151199579239, -0.14471417665481567, -0.10571323335170746, -0.06671229004859924, -0.027711331844329834, 0.011289596557617188, 0.0502905398607254, 0.08929148316383362, 0.12829242646694183, 0.16729336977005005, 0.20629431307315826, 0.24529525637626648, 0.2842962145805359, 0.3232971429824829, 0.36229807138442993, 0.40129902958869934, 0.44029998779296875, 0.47930091619491577, 0.5183018445968628, 0.5573028326034546, 0.5963037610054016, 0.6353046894073486, 0.6743056178092957, 0.7133065462112427, 0.7523075342178345, 0.7913084626197815, 0.8303093910217285, 0.8693103790283203, 0.9083113074302673, 0.9473122358322144]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 16.0, 13.0, 32.0, 58.0, 76.0, 91.0, 119.0, 123.0, 134.0, 102.0, 85.0, 63.0, 40.0, 26.0, 16.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.863971471786499, -0.8327522873878479, -0.8015331625938416, -0.7703139781951904, -0.7390948534011841, -0.707875669002533, -0.6766564846038818, -0.6454373598098755, -0.6142182350158691, -0.582999050617218, -0.5517799258232117, -0.5205607414245605, -0.4893416166305542, -0.4581224322319031, -0.42690327763557434, -0.3956841230392456, -0.3644649386405945, -0.33324578404426575, -0.302026629447937, -0.2708074450492859, -0.23958830535411835, -0.2083691507577896, -0.17714998126029968, -0.14593082666397095, -0.11471167206764221, -0.08349251747131348, -0.052273355424404144, -0.021054193377494812, 0.010164961218833923, 0.04138411581516266, 0.07260328531265259, 0.10382243990898132, 0.13504159450531006, 0.1662607491016388, 0.19747990369796753, 0.22869907319545746, 0.259918212890625, 0.2911373972892761, 0.32235655188560486, 0.3535757064819336, 0.38479486107826233, 0.41601401567459106, 0.4472331702709198, 0.47845232486724854, 0.5096715092658997, 0.540890634059906, 0.5721098184585571, 0.6033289432525635, 0.6345481276512146, 0.6657673120498657, 0.6969864368438721, 0.7282056212425232, 0.7594247460365295, 0.7906439304351807, 0.821863055229187, 0.8530822396278381, 0.8843014240264893, 0.9155206084251404, 0.9467397332191467, 0.9779589176177979, 1.0091780424118042, 1.0403971672058105, 1.0716164112091064, 1.1028355360031128, 1.1340546607971191]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 11.0, 11.0, 24.0, 37.0, 46.0, 101.0, 201.0, 443.0, 910.0, 2450.0, 7427.0, 34372.0, 786653.0, 190511.0, 17684.0, 4713.0, 1623.0, 672.0, 327.0, 146.0, 78.0, 39.0, 24.0, 17.0, 8.0, 6.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.84765625, -0.82330322265625, -0.7989501953125, -0.77459716796875, -0.750244140625, -0.72589111328125, -0.7015380859375, -0.67718505859375, -0.65283203125, -0.62847900390625, -0.6041259765625, -0.57977294921875, -0.555419921875, -0.53106689453125, -0.5067138671875, -0.48236083984375, -0.4580078125, -0.43365478515625, -0.4093017578125, -0.38494873046875, -0.360595703125, -0.33624267578125, -0.3118896484375, -0.28753662109375, -0.26318359375, -0.23883056640625, -0.2144775390625, -0.19012451171875, -0.165771484375, -0.14141845703125, -0.1170654296875, -0.09271240234375, -0.068359375, -0.04400634765625, -0.0196533203125, 0.00469970703125, 0.029052734375, 0.05340576171875, 0.0777587890625, 0.10211181640625, 0.12646484375, 0.15081787109375, 0.1751708984375, 0.19952392578125, 0.223876953125, 0.24822998046875, 0.2725830078125, 0.29693603515625, 0.3212890625, 0.34564208984375, 0.3699951171875, 0.39434814453125, 0.418701171875, 0.44305419921875, 0.4674072265625, 0.49176025390625, 0.51611328125, 0.54046630859375, 0.5648193359375, 0.58917236328125, 0.613525390625, 0.63787841796875, 0.6622314453125, 0.68658447265625, 0.7109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 11.0, 12.0, 19.0, 49.0, 57.0, 92.0, 102.0, 125.0, 146.0, 110.0, 92.0, 72.0, 58.0, 33.0, 17.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.96484375, -1.905609130859375, -1.84637451171875, -1.787139892578125, -1.7279052734375, -1.668670654296875, -1.60943603515625, -1.550201416015625, -1.490966796875, -1.431732177734375, -1.37249755859375, -1.313262939453125, -1.2540283203125, -1.194793701171875, -1.13555908203125, -1.076324462890625, -1.01708984375, -0.957855224609375, -0.89862060546875, -0.839385986328125, -0.7801513671875, -0.720916748046875, -0.66168212890625, -0.602447509765625, -0.543212890625, -0.483978271484375, -0.42474365234375, -0.365509033203125, -0.3062744140625, -0.247039794921875, -0.18780517578125, -0.128570556640625, -0.0693359375, -0.010101318359375, 0.04913330078125, 0.108367919921875, 0.1676025390625, 0.226837158203125, 0.28607177734375, 0.345306396484375, 0.404541015625, 0.463775634765625, 0.52301025390625, 0.582244873046875, 0.6414794921875, 0.700714111328125, 0.75994873046875, 0.819183349609375, 0.87841796875, 0.937652587890625, 0.99688720703125, 1.056121826171875, 1.1153564453125, 1.174591064453125, 1.23382568359375, 1.293060302734375, 1.352294921875, 1.411529541015625, 1.47076416015625, 1.529998779296875, 1.5892333984375, 1.648468017578125, 1.70770263671875, 1.766937255859375, 1.826171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 8.0, 14.0, 11.0, 13.0, 19.0, 16.0, 22.0, 26.0, 39.0, 68.0, 92.0, 141.0, 192.0, 300.0, 695.0, 3442.0, 62887.0, 961935.0, 15585.0, 1596.0, 474.0, 292.0, 167.0, 108.0, 92.0, 74.0, 50.0, 32.0, 33.0, 23.0, 21.0, 19.0, 12.0, 7.0, 7.0, 8.0, 6.0, 4.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.55078125, -1.5012359619140625, -1.451690673828125, -1.4021453857421875, -1.35260009765625, -1.3030548095703125, -1.253509521484375, -1.2039642333984375, -1.1544189453125, -1.1048736572265625, -1.055328369140625, -1.0057830810546875, -0.95623779296875, -0.9066925048828125, -0.857147216796875, -0.8076019287109375, -0.758056640625, -0.7085113525390625, -0.658966064453125, -0.6094207763671875, -0.55987548828125, -0.5103302001953125, -0.460784912109375, -0.4112396240234375, -0.3616943359375, -0.3121490478515625, -0.262603759765625, -0.2130584716796875, -0.16351318359375, -0.1139678955078125, -0.064422607421875, -0.0148773193359375, 0.03466796875, 0.0842132568359375, 0.133758544921875, 0.1833038330078125, 0.23284912109375, 0.2823944091796875, 0.331939697265625, 0.3814849853515625, 0.4310302734375, 0.4805755615234375, 0.530120849609375, 0.5796661376953125, 0.62921142578125, 0.6787567138671875, 0.728302001953125, 0.7778472900390625, 0.827392578125, 0.8769378662109375, 0.926483154296875, 0.9760284423828125, 1.02557373046875, 1.0751190185546875, 1.124664306640625, 1.1742095947265625, 1.2237548828125, 1.2733001708984375, 1.322845458984375, 1.3723907470703125, 1.42193603515625, 1.4714813232421875, 1.521026611328125, 1.5705718994140625, 1.6201171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 3.0, 6.0, 2.0, 10.0, 13.0, 12.0, 16.0, 22.0, 28.0, 20.0, 43.0, 24.0, 43.0, 39.0, 42.0, 47.0, 61.0, 41.0, 60.0, 47.0, 54.0, 58.0, 49.0, 29.0, 36.0, 30.0, 23.0, 20.0, 18.0, 13.0, 12.0, 12.0, 10.0, 6.0, 8.0, 8.0, 8.0, 5.0, 3.0, 1.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.076171875, -1.04010009765625, -1.0040283203125, -0.96795654296875, -0.931884765625, -0.89581298828125, -0.8597412109375, -0.82366943359375, -0.78759765625, -0.75152587890625, -0.7154541015625, -0.67938232421875, -0.643310546875, -0.60723876953125, -0.5711669921875, -0.53509521484375, -0.4990234375, -0.46295166015625, -0.4268798828125, -0.39080810546875, -0.354736328125, -0.31866455078125, -0.2825927734375, -0.24652099609375, -0.21044921875, -0.17437744140625, -0.1383056640625, -0.10223388671875, -0.066162109375, -0.03009033203125, 0.0059814453125, 0.04205322265625, 0.078125, 0.11419677734375, 0.1502685546875, 0.18634033203125, 0.222412109375, 0.25848388671875, 0.2945556640625, 0.33062744140625, 0.36669921875, 0.40277099609375, 0.4388427734375, 0.47491455078125, 0.510986328125, 0.54705810546875, 0.5831298828125, 0.61920166015625, 0.6552734375, 0.69134521484375, 0.7274169921875, 0.76348876953125, 0.799560546875, 0.83563232421875, 0.8717041015625, 0.90777587890625, 0.94384765625, 0.97991943359375, 1.0159912109375, 1.05206298828125, 1.088134765625, 1.12420654296875, 1.1602783203125, 1.19635009765625, 1.232421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 18.0, 15.0, 35.0, 51.0, 87.0, 202.0, 413.0, 950.0, 3228.0, 22439.0, 944922.0, 68243.0, 5581.0, 1319.0, 495.0, 238.0, 130.0, 65.0, 34.0, 26.0, 11.0, 9.0, 12.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.26837921142578125, -0.2586822509765625, -0.24898529052734375, -0.239288330078125, -0.22959136962890625, -0.2198944091796875, -0.21019744873046875, -0.20050048828125, -0.19080352783203125, -0.1811065673828125, -0.17140960693359375, -0.161712646484375, -0.15201568603515625, -0.1423187255859375, -0.13262176513671875, -0.1229248046875, -0.11322784423828125, -0.1035308837890625, -0.09383392333984375, -0.084136962890625, -0.07444000244140625, -0.0647430419921875, -0.05504608154296875, -0.04534912109375, -0.03565216064453125, -0.0259552001953125, -0.01625823974609375, -0.006561279296875, 0.00313568115234375, 0.0128326416015625, 0.02252960205078125, 0.0322265625, 0.04192352294921875, 0.0516204833984375, 0.06131744384765625, 0.071014404296875, 0.08071136474609375, 0.0904083251953125, 0.10010528564453125, 0.10980224609375, 0.11949920654296875, 0.1291961669921875, 0.13889312744140625, 0.148590087890625, 0.15828704833984375, 0.1679840087890625, 0.17768096923828125, 0.1873779296875, 0.19707489013671875, 0.2067718505859375, 0.21646881103515625, 0.226165771484375, 0.23586273193359375, 0.2455596923828125, 0.25525665283203125, 0.26495361328125, 0.27465057373046875, 0.2843475341796875, 0.29404449462890625, 0.303741455078125, 0.31343841552734375, 0.3231353759765625, 0.33283233642578125, 0.342529296875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 10.0, 6.0, 10.0, 16.0, 28.0, 55.0, 89.0, 236.0, 274.0, 104.0, 52.0, 30.0, 18.0, 13.0, 11.0, 8.0, 5.0, 3.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.968311309814453e-05, -2.8858892619609833e-05, -2.8034672141075134e-05, -2.7210451662540436e-05, -2.6386231184005737e-05, -2.556201070547104e-05, -2.473779022693634e-05, -2.3913569748401642e-05, -2.3089349269866943e-05, -2.2265128791332245e-05, -2.1440908312797546e-05, -2.0616687834262848e-05, -1.979246735572815e-05, -1.896824687719345e-05, -1.8144026398658752e-05, -1.7319805920124054e-05, -1.6495585441589355e-05, -1.5671364963054657e-05, -1.4847144484519958e-05, -1.402292400598526e-05, -1.3198703527450562e-05, -1.2374483048915863e-05, -1.1550262570381165e-05, -1.0726042091846466e-05, -9.901821613311768e-06, -9.077601134777069e-06, -8.25338065624237e-06, -7.429160177707672e-06, -6.604939699172974e-06, -5.780719220638275e-06, -4.956498742103577e-06, -4.132278263568878e-06, -3.3080577850341797e-06, -2.483837306499481e-06, -1.6596168279647827e-06, -8.353963494300842e-07, -1.1175870895385742e-08, 8.130446076393127e-07, 1.6372650861740112e-06, 2.4614855647087097e-06, 3.285706043243408e-06, 4.109926521778107e-06, 4.934147000312805e-06, 5.758367478847504e-06, 6.582587957382202e-06, 7.406808435916901e-06, 8.231028914451599e-06, 9.055249392986298e-06, 9.879469871520996e-06, 1.0703690350055695e-05, 1.1527910828590393e-05, 1.2352131307125092e-05, 1.317635178565979e-05, 1.4000572264194489e-05, 1.4824792742729187e-05, 1.5649013221263885e-05, 1.6473233699798584e-05, 1.7297454178333282e-05, 1.812167465686798e-05, 1.894589513540268e-05, 1.9770115613937378e-05, 2.0594336092472076e-05, 2.1418556571006775e-05, 2.2242777049541473e-05, 2.3066997528076172e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 4.0, 8.0, 11.0, 20.0, 25.0, 39.0, 75.0, 187.0, 387.0, 1326.0, 6016.0, 74046.0, 943386.0, 18902.0, 2867.0, 764.0, 253.0, 96.0, 60.0, 33.0, 14.0, 13.0, 6.0, 8.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.307861328125, -0.2956809997558594, -0.28350067138671875, -0.2713203430175781, -0.2591400146484375, -0.24695968627929688, -0.23477935791015625, -0.22259902954101562, -0.210418701171875, -0.19823837280273438, -0.18605804443359375, -0.17387771606445312, -0.1616973876953125, -0.14951705932617188, -0.13733673095703125, -0.12515640258789062, -0.11297607421875, -0.10079574584960938, -0.08861541748046875, -0.07643508911132812, -0.0642547607421875, -0.052074432373046875, -0.03989410400390625, -0.027713775634765625, -0.015533447265625, -0.003353118896484375, 0.00882720947265625, 0.021007537841796875, 0.0331878662109375, 0.045368194580078125, 0.05754852294921875, 0.06972885131835938, 0.0819091796875, 0.09408950805664062, 0.10626983642578125, 0.11845016479492188, 0.1306304931640625, 0.14281082153320312, 0.15499114990234375, 0.16717147827148438, 0.179351806640625, 0.19153213500976562, 0.20371246337890625, 0.21589279174804688, 0.2280731201171875, 0.24025344848632812, 0.25243377685546875, 0.2646141052246094, 0.27679443359375, 0.2889747619628906, 0.30115509033203125, 0.3133354187011719, 0.3255157470703125, 0.3376960754394531, 0.34987640380859375, 0.3620567321777344, 0.374237060546875, 0.3864173889160156, 0.39859771728515625, 0.4107780456542969, 0.4229583740234375, 0.4351387023925781, 0.44731903076171875, 0.4594993591308594, 0.4716796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 13.0, 8.0, 11.0, 16.0, 32.0, 54.0, 210.0, 444.0, 66.0, 43.0, 32.0, 26.0, 18.0, 3.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1649169921875, -0.1605968475341797, -0.15627670288085938, -0.15195655822753906, -0.14763641357421875, -0.14331626892089844, -0.13899612426757812, -0.1346759796142578, -0.1303558349609375, -0.1260356903076172, -0.12171554565429688, -0.11739540100097656, -0.11307525634765625, -0.10875511169433594, -0.10443496704101562, -0.10011482238769531, -0.095794677734375, -0.09147453308105469, -0.08715438842773438, -0.08283424377441406, -0.07851409912109375, -0.07419395446777344, -0.06987380981445312, -0.06555366516113281, -0.0612335205078125, -0.05691337585449219, -0.052593231201171875, -0.04827308654785156, -0.04395294189453125, -0.03963279724121094, -0.035312652587890625, -0.030992507934570312, -0.02667236328125, -0.022352218627929688, -0.018032073974609375, -0.013711929321289062, -0.00939178466796875, -0.0050716400146484375, -0.000751495361328125, 0.0035686492919921875, 0.0078887939453125, 0.012208938598632812, 0.016529083251953125, 0.020849227905273438, 0.02516937255859375, 0.029489517211914062, 0.033809661865234375, 0.03812980651855469, 0.042449951171875, 0.04677009582519531, 0.051090240478515625, 0.05541038513183594, 0.05973052978515625, 0.06405067443847656, 0.06837081909179688, 0.07269096374511719, 0.0770111083984375, 0.08133125305175781, 0.08565139770507812, 0.08997154235839844, 0.09429168701171875, 0.09861183166503906, 0.10293197631835938, 0.10725212097167969, 0.111572265625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 9.0, 24.0, 117.0, 355.0, 364.0, 117.0, 17.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-7.676401615142822, -7.536910057067871, -7.397418975830078, -7.257927417755127, -7.118435859680176, -6.978944778442383, -6.839453220367432, -6.699962139129639, -6.5604705810546875, -6.420979022979736, -6.281487941741943, -6.141996383666992, -6.002505302429199, -5.863013744354248, -5.723522186279297, -5.584031105041504, -5.444539546966553, -5.305047988891602, -5.165556907653809, -5.026065349578857, -4.886573791503906, -4.747082710266113, -4.607591152191162, -4.468100070953369, -4.328608512878418, -4.189116954803467, -4.049625873565674, -3.9101343154907227, -3.7706429958343506, -3.6311516761779785, -3.4916601181030273, -3.3521687984466553, -3.212677478790283, -3.073186159133911, -2.933694839477539, -2.794203281402588, -2.654711961746216, -2.5152206420898438, -2.3757290840148926, -2.2362377643585205, -2.0967464447021484, -1.9572551250457764, -1.8177636861801147, -1.6782722473144531, -1.538780927658081, -1.399289608001709, -1.2597981691360474, -1.1203067302703857, -0.9808155298233032, -0.8413241505622864, -0.7018327713012695, -0.5623413920402527, -0.42285001277923584, -0.283358633518219, -0.14386725425720215, -0.004375874996185303, 0.13511550426483154, 0.2746068835258484, 0.41409826278686523, 0.5535896420478821, 0.6930810213088989, 0.8325724005699158, 0.9720637798309326, 1.1115550994873047, 1.2510465383529663]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 7.0, 7.0, 12.0, 9.0, 12.0, 27.0, 26.0, 45.0, 41.0, 60.0, 67.0, 59.0, 89.0, 66.0, 77.0, 81.0, 65.0, 59.0, 54.0, 30.0, 41.0, 29.0, 15.0, 9.0, 7.0, 12.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4342539310455322, -3.3390231132507324, -3.2437920570373535, -3.1485612392425537, -3.053330421447754, -2.958099603652954, -2.862868547439575, -2.7676377296447754, -2.6724069118499756, -2.577176094055176, -2.481945037841797, -2.386714220046997, -2.2914834022521973, -2.1962525844573975, -2.1010215282440186, -2.0057907104492188, -1.9105597734451294, -1.81532883644104, -1.7200980186462402, -1.6248670816421509, -1.529636263847351, -1.4344053268432617, -1.339174509048462, -1.2439435720443726, -1.1487126350402832, -1.0534816980361938, -0.958250880241394, -0.8630199432373047, -0.7677891254425049, -0.6725581884384155, -0.577327311038971, -0.48209643363952637, -0.38686561584472656, -0.291634738445282, -0.1964038461446762, -0.10117295384407043, -0.0059420764446258545, 0.08928880095481873, 0.1845197081565857, 0.2797505855560303, 0.37498146295547485, 0.47021234035491943, 0.565443217754364, 0.6606740951538086, 0.755905032157898, 0.8511358499526978, 0.9463667869567871, 1.041597604751587, 1.1368285417556763, 1.2320594787597656, 1.3272902965545654, 1.4225212335586548, 1.5177520513534546, 1.612982988357544, 1.7082138061523438, 1.803444743156433, 1.8986756801605225, 1.9939066171646118, 2.089137554168701, 2.184368371963501, 2.279599189758301, 2.3748300075531006, 2.4700610637664795, 2.5652918815612793, 2.660522699356079]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 3.0, 9.0, 7.0, 11.0, 10.0, 10.0, 20.0, 19.0, 23.0, 27.0, 50.0, 62.0, 80.0, 90.0, 148.0, 241.0, 377.0, 1123.0, 4842.0, 46067.0, 4061792.0, 70445.0, 5899.0, 1605.0, 521.0, 224.0, 157.0, 90.0, 75.0, 69.0, 44.0, 28.0, 24.0, 23.0, 12.0, 14.0, 10.0, 12.0, 6.0, 5.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.875, -1.8115234375, -1.748046875, -1.6845703125, -1.62109375, -1.5576171875, -1.494140625, -1.4306640625, -1.3671875, -1.3037109375, -1.240234375, -1.1767578125, -1.11328125, -1.0498046875, -0.986328125, -0.9228515625, -0.859375, -0.7958984375, -0.732421875, -0.6689453125, -0.60546875, -0.5419921875, -0.478515625, -0.4150390625, -0.3515625, -0.2880859375, -0.224609375, -0.1611328125, -0.09765625, -0.0341796875, 0.029296875, 0.0927734375, 0.15625, 0.2197265625, 0.283203125, 0.3466796875, 0.41015625, 0.4736328125, 0.537109375, 0.6005859375, 0.6640625, 0.7275390625, 0.791015625, 0.8544921875, 0.91796875, 0.9814453125, 1.044921875, 1.1083984375, 1.171875, 1.2353515625, 1.298828125, 1.3623046875, 1.42578125, 1.4892578125, 1.552734375, 1.6162109375, 1.6796875, 1.7431640625, 1.806640625, 1.8701171875, 1.93359375, 1.9970703125, 2.060546875, 2.1240234375, 2.1875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 16.0, 41.0, 72.0, 147.0, 179.0, 177.0, 141.0, 113.0, 70.0, 25.0, 9.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6435546875, -1.598114013671875, -1.55267333984375, -1.507232666015625, -1.4617919921875, -1.416351318359375, -1.37091064453125, -1.325469970703125, -1.280029296875, -1.234588623046875, -1.18914794921875, -1.143707275390625, -1.0982666015625, -1.052825927734375, -1.00738525390625, -0.961944580078125, -0.91650390625, -0.871063232421875, -0.82562255859375, -0.780181884765625, -0.7347412109375, -0.689300537109375, -0.64385986328125, -0.598419189453125, -0.552978515625, -0.507537841796875, -0.46209716796875, -0.416656494140625, -0.3712158203125, -0.325775146484375, -0.28033447265625, -0.234893798828125, -0.189453125, -0.144012451171875, -0.09857177734375, -0.053131103515625, -0.0076904296875, 0.037750244140625, 0.08319091796875, 0.128631591796875, 0.174072265625, 0.219512939453125, 0.26495361328125, 0.310394287109375, 0.3558349609375, 0.401275634765625, 0.44671630859375, 0.492156982421875, 0.53759765625, 0.583038330078125, 0.62847900390625, 0.673919677734375, 0.7193603515625, 0.764801025390625, 0.81024169921875, 0.855682373046875, 0.901123046875, 0.946563720703125, 0.99200439453125, 1.037445068359375, 1.0828857421875, 1.128326416015625, 1.17376708984375, 1.219207763671875, 1.2646484375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 11.0, 12.0, 30.0, 60.0, 151.0, 565.0, 5779.0, 4123282.0, 62533.0, 1426.0, 252.0, 88.0, 36.0, 19.0, 15.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.0703125, -4.95172119140625, -4.8331298828125, -4.71453857421875, -4.595947265625, -4.47735595703125, -4.3587646484375, -4.24017333984375, -4.12158203125, -4.00299072265625, -3.8843994140625, -3.76580810546875, -3.647216796875, -3.52862548828125, -3.4100341796875, -3.29144287109375, -3.1728515625, -3.05426025390625, -2.9356689453125, -2.81707763671875, -2.698486328125, -2.57989501953125, -2.4613037109375, -2.34271240234375, -2.22412109375, -2.10552978515625, -1.9869384765625, -1.86834716796875, -1.749755859375, -1.63116455078125, -1.5125732421875, -1.39398193359375, -1.275390625, -1.15679931640625, -1.0382080078125, -0.91961669921875, -0.801025390625, -0.68243408203125, -0.5638427734375, -0.44525146484375, -0.32666015625, -0.20806884765625, -0.0894775390625, 0.02911376953125, 0.147705078125, 0.26629638671875, 0.3848876953125, 0.50347900390625, 0.6220703125, 0.74066162109375, 0.8592529296875, 0.97784423828125, 1.096435546875, 1.21502685546875, 1.3336181640625, 1.45220947265625, 1.57080078125, 1.68939208984375, 1.8079833984375, 1.92657470703125, 2.045166015625, 2.16375732421875, 2.2823486328125, 2.40093994140625, 2.51953125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 4.0, 6.0, 5.0, 13.0, 19.0, 32.0, 53.0, 142.0, 472.0, 1617.0, 1162.0, 311.0, 98.0, 43.0, 25.0, 18.0, 17.0, 8.0, 7.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28955078125, -0.27567291259765625, -0.2617950439453125, -0.24791717529296875, -0.234039306640625, -0.22016143798828125, -0.2062835693359375, -0.19240570068359375, -0.17852783203125, -0.16464996337890625, -0.1507720947265625, -0.13689422607421875, -0.123016357421875, -0.10913848876953125, -0.0952606201171875, -0.08138275146484375, -0.0675048828125, -0.05362701416015625, -0.0397491455078125, -0.02587127685546875, -0.011993408203125, 0.00188446044921875, 0.0157623291015625, 0.02964019775390625, 0.04351806640625, 0.05739593505859375, 0.0712738037109375, 0.08515167236328125, 0.099029541015625, 0.11290740966796875, 0.1267852783203125, 0.14066314697265625, 0.154541015625, 0.16841888427734375, 0.1822967529296875, 0.19617462158203125, 0.210052490234375, 0.22393035888671875, 0.2378082275390625, 0.25168609619140625, 0.26556396484375, 0.27944183349609375, 0.2933197021484375, 0.30719757080078125, 0.321075439453125, 0.33495330810546875, 0.3488311767578125, 0.36270904541015625, 0.3765869140625, 0.39046478271484375, 0.4043426513671875, 0.41822052001953125, 0.432098388671875, 0.44597625732421875, 0.4598541259765625, 0.47373199462890625, 0.48760986328125, 0.5014877319335938, 0.5153656005859375, 0.5292434692382812, 0.543121337890625, 0.5569992065429688, 0.5708770751953125, 0.5847549438476562, 0.5986328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 17.0, 14.0, 50.0, 112.0, 189.0, 233.0, 184.0, 109.0, 51.0, 28.0, 11.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-2.646538734436035, -2.594982385635376, -2.543426275253296, -2.4918699264526367, -2.4403138160705566, -2.3887574672698975, -2.3372013568878174, -2.285645008087158, -2.234088897705078, -2.182532548904419, -2.130976438522339, -2.0794200897216797, -2.0278639793395996, -1.97630774974823, -1.9247515201568604, -1.8731951713562012, -1.8216389417648315, -1.770082712173462, -1.7185264825820923, -1.6669702529907227, -1.615414023399353, -1.5638577938079834, -1.5123014450073242, -1.4607453346252441, -1.409188985824585, -1.3576327562332153, -1.3060765266418457, -1.254520297050476, -1.2029640674591064, -1.1514078378677368, -1.0998516082763672, -1.048295259475708, -0.9967392086982727, -0.9451829791069031, -0.8936267495155334, -0.842070460319519, -0.7905142307281494, -0.7389580011367798, -0.6874017715454102, -0.6358455419540405, -0.5842893123626709, -0.5327330827713013, -0.48117685317993164, -0.4296205937862396, -0.37806436419487, -0.32650813460350037, -0.27495187520980835, -0.22339564561843872, -0.1718394160270691, -0.12028317898511887, -0.06872694194316864, -0.017170697450637817, 0.03438553214073181, 0.08594176173210144, 0.13749802112579346, 0.18905425071716309, 0.24061048030853271, 0.29216670989990234, 0.343722939491272, 0.395279198884964, 0.4468354284763336, 0.49839165806770325, 0.5499479174613953, 0.6015041470527649, 0.6530603766441345]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 19.0, 43.0, 50.0, 60.0, 90.0, 111.0, 113.0, 102.0, 105.0, 84.0, 83.0, 51.0, 32.0, 24.0, 21.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1858028173446655, -1.149379849433899, -1.1129570007324219, -1.0765340328216553, -1.0401111841201782, -1.0036882162094116, -0.9672653675079346, -0.930842399597168, -0.8944195508956909, -0.8579966425895691, -0.8215737342834473, -0.7851508259773254, -0.7487279176712036, -0.7123050093650818, -0.67588210105896, -0.6394591331481934, -0.6030362248420715, -0.5666133165359497, -0.5301904082298279, -0.49376749992370605, -0.45734459161758423, -0.4209216833114624, -0.3844987452030182, -0.34807583689689636, -0.31165292859077454, -0.2752300202846527, -0.23880711197853088, -0.20238418877124786, -0.16596128046512604, -0.1295383721590042, -0.09311544895172119, -0.056692540645599365, -0.02026963233947754, 0.016153279691934586, 0.05257619172334671, 0.08899910748004913, 0.12542201578617096, 0.16184492409229279, 0.1982678472995758, 0.23469075560569763, 0.27111366391181946, 0.3075365722179413, 0.3439594805240631, 0.3803824186325073, 0.41680532693862915, 0.453228235244751, 0.4896511435508728, 0.5260740518569946, 0.5624969601631165, 0.5989198684692383, 0.6353427767753601, 0.6717656850814819, 0.7081885933876038, 0.7446115016937256, 0.7810344696044922, 0.8174573183059692, 0.8538802862167358, 0.8903031945228577, 0.9267261028289795, 0.9631490111351013, 0.9995719194412231, 1.0359948873519897, 1.0724177360534668, 1.1088407039642334, 1.1452635526657104]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 9.0, 20.0, 19.0, 38.0, 39.0, 88.0, 188.0, 356.0, 1134.0, 6766.0, 113309.0, 872390.0, 48606.0, 4133.0, 822.0, 301.0, 133.0, 69.0, 46.0, 35.0, 17.0, 15.0, 3.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.334228515625, -0.3242149353027344, -0.31420135498046875, -0.3041877746582031, -0.2941741943359375, -0.2841606140136719, -0.27414703369140625, -0.2641334533691406, -0.254119873046875, -0.24410629272460938, -0.23409271240234375, -0.22407913208007812, -0.2140655517578125, -0.20405197143554688, -0.19403839111328125, -0.18402481079101562, -0.17401123046875, -0.16399765014648438, -0.15398406982421875, -0.14397048950195312, -0.1339569091796875, -0.12394332885742188, -0.11392974853515625, -0.10391616821289062, -0.093902587890625, -0.08388900756835938, -0.07387542724609375, -0.06386184692382812, -0.0538482666015625, -0.043834686279296875, -0.03382110595703125, -0.023807525634765625, -0.0137939453125, -0.003780364990234375, 0.00623321533203125, 0.016246795654296875, 0.0262603759765625, 0.036273956298828125, 0.04628753662109375, 0.056301116943359375, 0.066314697265625, 0.07632827758789062, 0.08634185791015625, 0.09635543823242188, 0.1063690185546875, 0.11638259887695312, 0.12639617919921875, 0.13640975952148438, 0.14642333984375, 0.15643692016601562, 0.16645050048828125, 0.17646408081054688, 0.1864776611328125, 0.19649124145507812, 0.20650482177734375, 0.21651840209960938, 0.226531982421875, 0.23654556274414062, 0.24655914306640625, 0.2565727233886719, 0.2665863037109375, 0.2765998840332031, 0.28661346435546875, 0.2966270446777344, 0.306640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 7.0, 12.0, 48.0, 51.0, 81.0, 140.0, 128.0, 144.0, 122.0, 111.0, 73.0, 39.0, 27.0, 15.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89990234375, -0.8728103637695312, -0.8457183837890625, -0.8186264038085938, -0.791534423828125, -0.7644424438476562, -0.7373504638671875, -0.7102584838867188, -0.68316650390625, -0.6560745239257812, -0.6289825439453125, -0.6018905639648438, -0.574798583984375, -0.5477066040039062, -0.5206146240234375, -0.49352264404296875, -0.4664306640625, -0.43933868408203125, -0.4122467041015625, -0.38515472412109375, -0.358062744140625, -0.33097076416015625, -0.3038787841796875, -0.27678680419921875, -0.24969482421875, -0.22260284423828125, -0.1955108642578125, -0.16841888427734375, -0.141326904296875, -0.11423492431640625, -0.0871429443359375, -0.06005096435546875, -0.032958984375, -0.00586700439453125, 0.0212249755859375, 0.04831695556640625, 0.075408935546875, 0.10250091552734375, 0.1295928955078125, 0.15668487548828125, 0.18377685546875, 0.21086883544921875, 0.2379608154296875, 0.26505279541015625, 0.292144775390625, 0.31923675537109375, 0.3463287353515625, 0.37342071533203125, 0.4005126953125, 0.42760467529296875, 0.4546966552734375, 0.48178863525390625, 0.508880615234375, 0.5359725952148438, 0.5630645751953125, 0.5901565551757812, 0.61724853515625, 0.6443405151367188, 0.6714324951171875, 0.6985244750976562, 0.725616455078125, 0.7527084350585938, 0.7798004150390625, 0.8068923950195312, 0.833984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 8.0, 9.0, 13.0, 21.0, 25.0, 34.0, 66.0, 112.0, 159.0, 257.0, 383.0, 600.0, 899.0, 1590.0, 2636.0, 4408.0, 7292.0, 13320.0, 24558.0, 47999.0, 101451.0, 209448.0, 286080.0, 174835.0, 83318.0, 40370.0, 21074.0, 11170.0, 6499.0, 3688.0, 2343.0, 1447.0, 902.0, 523.0, 368.0, 228.0, 155.0, 90.0, 68.0, 38.0, 24.0, 13.0, 13.0, 11.0, 8.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.048248291015625, -0.046844482421875, -0.045440673828125, -0.044036865234375, -0.042633056640625, -0.041229248046875, -0.039825439453125, -0.038421630859375, -0.037017822265625, -0.035614013671875, -0.034210205078125, -0.032806396484375, -0.031402587890625, -0.029998779296875, -0.028594970703125, -0.027191162109375, -0.025787353515625, -0.024383544921875, -0.022979736328125, -0.021575927734375, -0.020172119140625, -0.018768310546875, -0.017364501953125, -0.015960693359375, -0.014556884765625, -0.013153076171875, -0.011749267578125, -0.010345458984375, -0.008941650390625, -0.007537841796875, -0.006134033203125, -0.004730224609375, -0.003326416015625, -0.001922607421875, -0.000518798828125, 0.000885009765625, 0.002288818359375, 0.003692626953125, 0.005096435546875, 0.006500244140625, 0.007904052734375, 0.009307861328125, 0.010711669921875, 0.012115478515625, 0.013519287109375, 0.014923095703125, 0.016326904296875, 0.017730712890625, 0.019134521484375, 0.020538330078125, 0.021942138671875, 0.023345947265625, 0.024749755859375, 0.026153564453125, 0.027557373046875, 0.028961181640625, 0.030364990234375, 0.031768798828125, 0.033172607421875, 0.034576416015625, 0.035980224609375, 0.037384033203125, 0.038787841796875, 0.040191650390625, 0.041595458984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 1.0, 6.0, 6.0, 3.0, 4.0, 5.0, 11.0, 10.0, 8.0, 18.0, 16.0, 22.0, 28.0, 27.0, 31.0, 35.0, 45.0, 49.0, 33.0, 49.0, 47.0, 62.0, 44.0, 44.0, 42.0, 44.0, 43.0, 36.0, 35.0, 24.0, 27.0, 19.0, 23.0, 16.0, 16.0, 13.0, 8.0, 8.0, 9.0, 8.0, 6.0, 2.0, 2.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0], "bins": [-0.740234375, -0.718719482421875, -0.69720458984375, -0.675689697265625, -0.6541748046875, -0.632659912109375, -0.61114501953125, -0.589630126953125, -0.568115234375, -0.546600341796875, -0.52508544921875, -0.503570556640625, -0.4820556640625, -0.460540771484375, -0.43902587890625, -0.417510986328125, -0.39599609375, -0.374481201171875, -0.35296630859375, -0.331451416015625, -0.3099365234375, -0.288421630859375, -0.26690673828125, -0.245391845703125, -0.223876953125, -0.202362060546875, -0.18084716796875, -0.159332275390625, -0.1378173828125, -0.116302490234375, -0.09478759765625, -0.073272705078125, -0.0517578125, -0.030242919921875, -0.00872802734375, 0.012786865234375, 0.0343017578125, 0.055816650390625, 0.07733154296875, 0.098846435546875, 0.120361328125, 0.141876220703125, 0.16339111328125, 0.184906005859375, 0.2064208984375, 0.227935791015625, 0.24945068359375, 0.270965576171875, 0.29248046875, 0.313995361328125, 0.33551025390625, 0.357025146484375, 0.3785400390625, 0.400054931640625, 0.42156982421875, 0.443084716796875, 0.464599609375, 0.486114501953125, 0.50762939453125, 0.529144287109375, 0.5506591796875, 0.572174072265625, 0.59368896484375, 0.615203857421875, 0.63671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 10.0, 13.0, 24.0, 30.0, 47.0, 78.0, 157.0, 350.0, 843.0, 3232.0, 21434.0, 517058.0, 479256.0, 20912.0, 3357.0, 940.0, 359.0, 166.0, 108.0, 49.0, 43.0, 29.0, 15.0, 16.0, 11.0, 6.0, 2.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0188446044921875, -0.018273353576660156, -0.017702102661132812, -0.01713085174560547, -0.016559600830078125, -0.01598834991455078, -0.015417098999023438, -0.014845848083496094, -0.01427459716796875, -0.013703346252441406, -0.013132095336914062, -0.012560844421386719, -0.011989593505859375, -0.011418342590332031, -0.010847091674804688, -0.010275840759277344, -0.00970458984375, -0.009133338928222656, -0.008562088012695312, -0.007990837097167969, -0.007419586181640625, -0.006848335266113281, -0.0062770843505859375, -0.005705833435058594, -0.00513458251953125, -0.004563331604003906, -0.0039920806884765625, -0.0034208297729492188, -0.002849578857421875, -0.0022783279418945312, -0.0017070770263671875, -0.0011358261108398438, -0.0005645751953125, 6.67572021484375e-06, 0.0005779266357421875, 0.0011491775512695312, 0.001720428466796875, 0.0022916793823242188, 0.0028629302978515625, 0.0034341812133789062, 0.00400543212890625, 0.004576683044433594, 0.0051479339599609375, 0.005719184875488281, 0.006290435791015625, 0.006861686706542969, 0.0074329376220703125, 0.008004188537597656, 0.008575439453125, 0.009146690368652344, 0.009717941284179688, 0.010289192199707031, 0.010860443115234375, 0.011431694030761719, 0.012002944946289062, 0.012574195861816406, 0.01314544677734375, 0.013716697692871094, 0.014287948608398438, 0.014859199523925781, 0.015430450439453125, 0.01600170135498047, 0.016572952270507812, 0.017144203186035156, 0.0177154541015625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 13.0, 27.0, 36.0, 83.0, 144.0, 193.0, 189.0, 126.0, 80.0, 56.0, 21.0, 12.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.552436828613281e-05, -3.4656375646591187e-05, -3.378838300704956e-05, -3.2920390367507935e-05, -3.205239772796631e-05, -3.118440508842468e-05, -3.0316412448883057e-05, -2.944841980934143e-05, -2.8580427169799805e-05, -2.771243453025818e-05, -2.6844441890716553e-05, -2.5976449251174927e-05, -2.51084566116333e-05, -2.4240463972091675e-05, -2.337247133255005e-05, -2.2504478693008423e-05, -2.1636486053466797e-05, -2.076849341392517e-05, -1.9900500774383545e-05, -1.903250813484192e-05, -1.8164515495300293e-05, -1.7296522855758667e-05, -1.642853021621704e-05, -1.5560537576675415e-05, -1.4692544937133789e-05, -1.3824552297592163e-05, -1.2956559658050537e-05, -1.2088567018508911e-05, -1.1220574378967285e-05, -1.035258173942566e-05, -9.484589099884033e-06, -8.616596460342407e-06, -7.748603820800781e-06, -6.880611181259155e-06, -6.012618541717529e-06, -5.144625902175903e-06, -4.276633262634277e-06, -3.4086406230926514e-06, -2.5406479835510254e-06, -1.6726553440093994e-06, -8.046627044677734e-07, 6.332993507385254e-08, 9.313225746154785e-07, 1.7993152141571045e-06, 2.6673078536987305e-06, 3.5353004932403564e-06, 4.403293132781982e-06, 5.271285772323608e-06, 6.139278411865234e-06, 7.00727105140686e-06, 7.875263690948486e-06, 8.743256330490112e-06, 9.611248970031738e-06, 1.0479241609573364e-05, 1.134723424911499e-05, 1.2215226888656616e-05, 1.3083219528198242e-05, 1.3951212167739868e-05, 1.4819204807281494e-05, 1.568719744682312e-05, 1.6555190086364746e-05, 1.7423182725906372e-05, 1.8291175365447998e-05, 1.9159168004989624e-05, 2.002716064453125e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 8.0, 11.0, 26.0, 39.0, 50.0, 83.0, 123.0, 236.0, 368.0, 678.0, 1319.0, 2810.0, 7126.0, 24868.0, 200347.0, 725659.0, 62663.0, 13597.0, 4481.0, 1841.0, 933.0, 537.0, 275.0, 180.0, 110.0, 63.0, 37.0, 20.0, 13.0, 13.0, 6.0, 3.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0178070068359375, -0.017287373542785645, -0.01676774024963379, -0.016248106956481934, -0.015728473663330078, -0.015208840370178223, -0.014689207077026367, -0.014169573783874512, -0.013649940490722656, -0.0131303071975708, -0.012610673904418945, -0.01209104061126709, -0.011571407318115234, -0.011051774024963379, -0.010532140731811523, -0.010012507438659668, -0.009492874145507812, -0.008973240852355957, -0.008453607559204102, -0.007933974266052246, -0.007414340972900391, -0.006894707679748535, -0.00637507438659668, -0.005855441093444824, -0.005335807800292969, -0.004816174507141113, -0.004296541213989258, -0.0037769079208374023, -0.003257274627685547, -0.0027376413345336914, -0.002218008041381836, -0.0016983747482299805, -0.001178741455078125, -0.0006591081619262695, -0.00013947486877441406, 0.0003801584243774414, 0.0008997917175292969, 0.0014194250106811523, 0.0019390583038330078, 0.0024586915969848633, 0.0029783248901367188, 0.0034979581832885742, 0.00401759147644043, 0.004537224769592285, 0.005056858062744141, 0.005576491355895996, 0.0060961246490478516, 0.006615757942199707, 0.0071353912353515625, 0.007655024528503418, 0.008174657821655273, 0.008694291114807129, 0.009213924407958984, 0.00973355770111084, 0.010253190994262695, 0.01077282428741455, 0.011292457580566406, 0.011812090873718262, 0.012331724166870117, 0.012851357460021973, 0.013370990753173828, 0.013890624046325684, 0.014410257339477539, 0.014929890632629395, 0.01544952392578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 11.0, 8.0, 10.0, 13.0, 29.0, 57.0, 86.0, 151.0, 214.0, 154.0, 107.0, 55.0, 45.0, 13.0, 18.0, 6.0, 3.0, 8.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00441741943359375, -0.004268050193786621, -0.004118680953979492, -0.003969311714172363, -0.0038199424743652344, -0.0036705732345581055, -0.0035212039947509766, -0.0033718347549438477, -0.0032224655151367188, -0.00307309627532959, -0.002923727035522461, -0.002774357795715332, -0.002624988555908203, -0.0024756193161010742, -0.0023262500762939453, -0.0021768808364868164, -0.0020275115966796875, -0.0018781423568725586, -0.0017287731170654297, -0.0015794038772583008, -0.0014300346374511719, -0.001280665397644043, -0.001131296157836914, -0.0009819269180297852, -0.0008325576782226562, -0.0006831884384155273, -0.0005338191986083984, -0.00038444995880126953, -0.00023508071899414062, -8.571147918701172e-05, 6.365776062011719e-05, 0.0002130270004272461, 0.000362396240234375, 0.0005117654800415039, 0.0006611347198486328, 0.0008105039596557617, 0.0009598731994628906, 0.0011092424392700195, 0.0012586116790771484, 0.0014079809188842773, 0.0015573501586914062, 0.0017067193984985352, 0.001856088638305664, 0.002005457878112793, 0.002154827117919922, 0.0023041963577270508, 0.0024535655975341797, 0.0026029348373413086, 0.0027523040771484375, 0.0029016733169555664, 0.0030510425567626953, 0.0032004117965698242, 0.003349781036376953, 0.003499150276184082, 0.003648519515991211, 0.00379788875579834, 0.003947257995605469, 0.004096627235412598, 0.0042459964752197266, 0.0043953657150268555, 0.004544734954833984, 0.004694104194641113, 0.004843473434448242, 0.004992842674255371, 0.0051422119140625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 6.0, 18.0, 33.0, 79.0, 161.0, 209.0, 233.0, 122.0, 81.0, 38.0, 10.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.123475432395935, -1.095318078994751, -1.067160725593567, -1.0390033721923828, -1.0108460187911987, -0.9826886653900146, -0.9545313119888306, -0.9263739585876465, -0.8982166051864624, -0.8700592517852783, -0.8419018983840942, -0.8137445449829102, -0.7855871915817261, -0.757429838180542, -0.7292724847793579, -0.7011151313781738, -0.6729577779769897, -0.6448004245758057, -0.6166430711746216, -0.5884857177734375, -0.5603283643722534, -0.5321710109710693, -0.5040136575698853, -0.47585630416870117, -0.4476989507675171, -0.419541597366333, -0.3913842439651489, -0.36322689056396484, -0.33506953716278076, -0.3069121837615967, -0.2787548303604126, -0.2505974769592285, -0.2224401831626892, -0.19428282976150513, -0.16612547636032104, -0.13796812295913696, -0.10981076955795288, -0.0816534161567688, -0.05349606275558472, -0.025338709354400635, 0.0028186440467834473, 0.03097599744796753, 0.05913335084915161, 0.0872907042503357, 0.11544805765151978, 0.14360541105270386, 0.17176276445388794, 0.19992011785507202, 0.2280774712562561, 0.2562348246574402, 0.28439217805862427, 0.31254953145980835, 0.34070688486099243, 0.3688642382621765, 0.3970215916633606, 0.4251789450645447, 0.45333629846572876, 0.48149365186691284, 0.5096510052680969, 0.537808358669281, 0.5659657120704651, 0.5941230654716492, 0.6222804188728333, 0.6504377722740173, 0.6785951256752014]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 13.0, 17.0, 49.0, 62.0, 73.0, 131.0, 131.0, 121.0, 115.0, 102.0, 85.0, 46.0, 27.0, 18.0, 12.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8134170770645142, -0.788963794708252, -0.7645105719566345, -0.7400572896003723, -0.7156040072441101, -0.6911507248878479, -0.6666975021362305, -0.6422442197799683, -0.617790937423706, -0.5933376550674438, -0.5688844323158264, -0.5444311499595642, -0.519977867603302, -0.4955246150493622, -0.47107136249542236, -0.44661808013916016, -0.42216482758522034, -0.3977115750312805, -0.3732582926750183, -0.3488050401210785, -0.3243517577648163, -0.29989850521087646, -0.27544522285461426, -0.25099197030067444, -0.22653870284557343, -0.2020854353904724, -0.1776321679353714, -0.15317890048027039, -0.12872564792633057, -0.10427237302064896, -0.07981911301612854, -0.05536584556102753, -0.030912578105926514, -0.00645931251347065, 0.017993953078985214, 0.04244721680879593, 0.06690048426389694, 0.09135375171899796, 0.11580701172351837, 0.14026027917861938, 0.1647135466337204, 0.1891668140888214, 0.21362008154392242, 0.23807334899902344, 0.26252660155296326, 0.28697988390922546, 0.3114331364631653, 0.3358864188194275, 0.3603396713733673, 0.38479292392730713, 0.40924620628356934, 0.43369945883750916, 0.45815274119377136, 0.4826059937477112, 0.5070592761039734, 0.5315124988555908, 0.555965781211853, 0.5804190635681152, 0.6048722863197327, 0.6293255686759949, 0.6537788510322571, 0.6782321333885193, 0.7026853561401367, 0.7271386384963989, 0.7515919208526611]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 5.0, 18.0, 9.0, 11.0, 18.0, 29.0, 42.0, 52.0, 112.0, 205.0, 419.0, 1023.0, 2409.0, 6593.0, 21735.0, 93508.0, 662757.0, 207485.0, 35673.0, 10282.0, 3525.0, 1365.0, 623.0, 260.0, 125.0, 88.0, 43.0, 31.0, 21.0, 23.0, 12.0, 9.0, 9.0, 7.0, 6.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.6171875, -0.5988693237304688, -0.5805511474609375, -0.5622329711914062, -0.543914794921875, -0.5255966186523438, -0.5072784423828125, -0.48896026611328125, -0.47064208984375, -0.45232391357421875, -0.4340057373046875, -0.41568756103515625, -0.397369384765625, -0.37905120849609375, -0.3607330322265625, -0.34241485595703125, -0.3240966796875, -0.30577850341796875, -0.2874603271484375, -0.26914215087890625, -0.250823974609375, -0.23250579833984375, -0.2141876220703125, -0.19586944580078125, -0.17755126953125, -0.15923309326171875, -0.1409149169921875, -0.12259674072265625, -0.104278564453125, -0.08596038818359375, -0.0676422119140625, -0.04932403564453125, -0.031005859375, -0.01268768310546875, 0.0056304931640625, 0.02394866943359375, 0.042266845703125, 0.06058502197265625, 0.0789031982421875, 0.09722137451171875, 0.11553955078125, 0.13385772705078125, 0.1521759033203125, 0.17049407958984375, 0.188812255859375, 0.20713043212890625, 0.2254486083984375, 0.24376678466796875, 0.2620849609375, 0.28040313720703125, 0.2987213134765625, 0.31703948974609375, 0.335357666015625, 0.35367584228515625, 0.3719940185546875, 0.39031219482421875, 0.40863037109375, 0.42694854736328125, 0.4452667236328125, 0.46358489990234375, 0.481903076171875, 0.5002212524414062, 0.5185394287109375, 0.5368576049804688, 0.55517578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 15.0, 30.0, 50.0, 79.0, 100.0, 125.0, 135.0, 134.0, 97.0, 102.0, 42.0, 39.0, 25.0, 15.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9580078125, -1.907440185546875, -1.85687255859375, -1.806304931640625, -1.7557373046875, -1.705169677734375, -1.65460205078125, -1.604034423828125, -1.553466796875, -1.502899169921875, -1.45233154296875, -1.401763916015625, -1.3511962890625, -1.300628662109375, -1.25006103515625, -1.199493408203125, -1.14892578125, -1.098358154296875, -1.04779052734375, -0.997222900390625, -0.9466552734375, -0.896087646484375, -0.84552001953125, -0.794952392578125, -0.744384765625, -0.693817138671875, -0.64324951171875, -0.592681884765625, -0.5421142578125, -0.491546630859375, -0.44097900390625, -0.390411376953125, -0.33984375, -0.289276123046875, -0.23870849609375, -0.188140869140625, -0.1375732421875, -0.087005615234375, -0.03643798828125, 0.014129638671875, 0.064697265625, 0.115264892578125, 0.16583251953125, 0.216400146484375, 0.2669677734375, 0.317535400390625, 0.36810302734375, 0.418670654296875, 0.46923828125, 0.519805908203125, 0.57037353515625, 0.620941162109375, 0.6715087890625, 0.722076416015625, 0.77264404296875, 0.823211669921875, 0.873779296875, 0.924346923828125, 0.97491455078125, 1.025482177734375, 1.0760498046875, 1.126617431640625, 1.17718505859375, 1.227752685546875, 1.2783203125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 13.0, 7.0, 9.0, 19.0, 30.0, 30.0, 43.0, 57.0, 124.0, 199.0, 409.0, 1198.0, 5428.0, 35526.0, 681487.0, 297023.0, 21523.0, 3715.0, 917.0, 290.0, 184.0, 89.0, 64.0, 51.0, 28.0, 17.0, 12.0, 13.0, 10.0, 5.0, 8.0, 6.0, 3.0, 0.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.220703125, -1.1884765625, -1.15625, -1.1240234375, -1.091796875, -1.0595703125, -1.02734375, -0.9951171875, -0.962890625, -0.9306640625, -0.8984375, -0.8662109375, -0.833984375, -0.8017578125, -0.76953125, -0.7373046875, -0.705078125, -0.6728515625, -0.640625, -0.6083984375, -0.576171875, -0.5439453125, -0.51171875, -0.4794921875, -0.447265625, -0.4150390625, -0.3828125, -0.3505859375, -0.318359375, -0.2861328125, -0.25390625, -0.2216796875, -0.189453125, -0.1572265625, -0.125, -0.0927734375, -0.060546875, -0.0283203125, 0.00390625, 0.0361328125, 0.068359375, 0.1005859375, 0.1328125, 0.1650390625, 0.197265625, 0.2294921875, 0.26171875, 0.2939453125, 0.326171875, 0.3583984375, 0.390625, 0.4228515625, 0.455078125, 0.4873046875, 0.51953125, 0.5517578125, 0.583984375, 0.6162109375, 0.6484375, 0.6806640625, 0.712890625, 0.7451171875, 0.77734375, 0.8095703125, 0.841796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 9.0, 7.0, 10.0, 15.0, 15.0, 16.0, 23.0, 32.0, 34.0, 37.0, 59.0, 52.0, 55.0, 67.0, 48.0, 76.0, 65.0, 52.0, 61.0, 50.0, 42.0, 33.0, 29.0, 21.0, 13.0, 12.0, 9.0, 14.0, 10.0, 5.0, 6.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.96044921875, -0.9263381958007812, -0.8922271728515625, -0.8581161499023438, -0.824005126953125, -0.7898941040039062, -0.7557830810546875, -0.7216720581054688, -0.68756103515625, -0.6534500122070312, -0.6193389892578125, -0.5852279663085938, -0.551116943359375, -0.5170059204101562, -0.4828948974609375, -0.44878387451171875, -0.4146728515625, -0.38056182861328125, -0.3464508056640625, -0.31233978271484375, -0.278228759765625, -0.24411773681640625, -0.2100067138671875, -0.17589569091796875, -0.14178466796875, -0.10767364501953125, -0.0735626220703125, -0.03945159912109375, -0.005340576171875, 0.02877044677734375, 0.0628814697265625, 0.09699249267578125, 0.131103515625, 0.16521453857421875, 0.1993255615234375, 0.23343658447265625, 0.267547607421875, 0.30165863037109375, 0.3357696533203125, 0.36988067626953125, 0.40399169921875, 0.43810272216796875, 0.4722137451171875, 0.5063247680664062, 0.540435791015625, 0.5745468139648438, 0.6086578369140625, 0.6427688598632812, 0.6768798828125, 0.7109909057617188, 0.7451019287109375, 0.7792129516601562, 0.813323974609375, 0.8474349975585938, 0.8815460205078125, 0.9156570434570312, 0.94976806640625, 0.9838790893554688, 1.0179901123046875, 1.0521011352539062, 1.086212158203125, 1.1203231811523438, 1.1544342041015625, 1.1885452270507812, 1.22265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 7.0, 7.0, 18.0, 27.0, 55.0, 118.0, 277.0, 784.0, 3485.0, 25270.0, 739294.0, 261240.0, 14530.0, 2395.0, 593.0, 204.0, 105.0, 51.0, 20.0, 23.0, 16.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1754150390625, -0.16806983947753906, -0.16072463989257812, -0.1533794403076172, -0.14603424072265625, -0.1386890411376953, -0.13134384155273438, -0.12399864196777344, -0.1166534423828125, -0.10930824279785156, -0.10196304321289062, -0.09461784362792969, -0.08727264404296875, -0.07992744445800781, -0.07258224487304688, -0.06523704528808594, -0.057891845703125, -0.05054664611816406, -0.043201446533203125, -0.03585624694824219, -0.02851104736328125, -0.021165847778320312, -0.013820648193359375, -0.0064754486083984375, 0.0008697509765625, 0.008214950561523438, 0.015560150146484375, 0.022905349731445312, 0.03025054931640625, 0.03759574890136719, 0.044940948486328125, 0.05228614807128906, 0.05963134765625, 0.06697654724121094, 0.07432174682617188, 0.08166694641113281, 0.08901214599609375, 0.09635734558105469, 0.10370254516601562, 0.11104774475097656, 0.1183929443359375, 0.12573814392089844, 0.13308334350585938, 0.1404285430908203, 0.14777374267578125, 0.1551189422607422, 0.16246414184570312, 0.16980934143066406, 0.177154541015625, 0.18449974060058594, 0.19184494018554688, 0.1991901397705078, 0.20653533935546875, 0.2138805389404297, 0.22122573852539062, 0.22857093811035156, 0.2359161376953125, 0.24326133728027344, 0.2506065368652344, 0.2579517364501953, 0.26529693603515625, 0.2726421356201172, 0.2799873352050781, 0.28733253479003906, 0.294677734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 4.0, 6.0, 10.0, 13.0, 27.0, 34.0, 52.0, 88.0, 190.0, 235.0, 138.0, 80.0, 45.0, 28.0, 15.0, 11.0, 9.0, 8.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.987550735473633e-05, -3.8953498005867004e-05, -3.803148865699768e-05, -3.710947930812836e-05, -3.618746995925903e-05, -3.526546061038971e-05, -3.4343451261520386e-05, -3.342144191265106e-05, -3.249943256378174e-05, -3.1577423214912415e-05, -3.065541386604309e-05, -2.9733404517173767e-05, -2.8811395168304443e-05, -2.788938581943512e-05, -2.6967376470565796e-05, -2.6045367121696472e-05, -2.512335777282715e-05, -2.4201348423957825e-05, -2.32793390750885e-05, -2.2357329726219177e-05, -2.1435320377349854e-05, -2.051331102848053e-05, -1.9591301679611206e-05, -1.8669292330741882e-05, -1.774728298187256e-05, -1.6825273633003235e-05, -1.590326428413391e-05, -1.4981254935264587e-05, -1.4059245586395264e-05, -1.313723623752594e-05, -1.2215226888656616e-05, -1.1293217539787292e-05, -1.0371208190917969e-05, -9.449198842048645e-06, -8.527189493179321e-06, -7.6051801443099976e-06, -6.683170795440674e-06, -5.76116144657135e-06, -4.839152097702026e-06, -3.917142748832703e-06, -2.995133399963379e-06, -2.073124051094055e-06, -1.1511147022247314e-06, -2.2910535335540771e-07, 6.92903995513916e-07, 1.6149133443832397e-06, 2.5369226932525635e-06, 3.458932042121887e-06, 4.380941390991211e-06, 5.302950739860535e-06, 6.224960088729858e-06, 7.146969437599182e-06, 8.068978786468506e-06, 8.99098813533783e-06, 9.912997484207153e-06, 1.0835006833076477e-05, 1.17570161819458e-05, 1.2679025530815125e-05, 1.3601034879684448e-05, 1.4523044228553772e-05, 1.5445053577423096e-05, 1.636706292629242e-05, 1.7289072275161743e-05, 1.8211081624031067e-05, 1.913309097290039e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 14.0, 17.0, 30.0, 39.0, 52.0, 86.0, 163.0, 208.0, 393.0, 635.0, 1269.0, 2275.0, 5073.0, 14546.0, 62822.0, 616921.0, 283752.0, 41108.0, 10561.0, 4167.0, 1936.0, 1021.0, 548.0, 321.0, 191.0, 128.0, 77.0, 51.0, 34.0, 27.0, 23.0, 16.0, 6.0, 8.0, 2.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.138671875, -0.13402938842773438, -0.12938690185546875, -0.12474441528320312, -0.1201019287109375, -0.11545944213867188, -0.11081695556640625, -0.10617446899414062, -0.101531982421875, -0.09688949584960938, -0.09224700927734375, -0.08760452270507812, -0.0829620361328125, -0.07831954956054688, -0.07367706298828125, -0.06903457641601562, -0.06439208984375, -0.059749603271484375, -0.05510711669921875, -0.050464630126953125, -0.0458221435546875, -0.041179656982421875, -0.03653717041015625, -0.031894683837890625, -0.027252197265625, -0.022609710693359375, -0.01796722412109375, -0.013324737548828125, -0.0086822509765625, -0.004039764404296875, 0.00060272216796875, 0.005245208740234375, 0.0098876953125, 0.014530181884765625, 0.01917266845703125, 0.023815155029296875, 0.0284576416015625, 0.033100128173828125, 0.03774261474609375, 0.042385101318359375, 0.047027587890625, 0.051670074462890625, 0.05631256103515625, 0.060955047607421875, 0.0655975341796875, 0.07024002075195312, 0.07488250732421875, 0.07952499389648438, 0.08416748046875, 0.08880996704101562, 0.09345245361328125, 0.09809494018554688, 0.1027374267578125, 0.10737991333007812, 0.11202239990234375, 0.11666488647460938, 0.121307373046875, 0.12594985961914062, 0.13059234619140625, 0.13523483276367188, 0.1398773193359375, 0.14451980590820312, 0.14916229248046875, 0.15380477905273438, 0.158447265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 0.0, 3.0, 3.0, 5.0, 1.0, 0.0, 6.0, 10.0, 9.0, 13.0, 34.0, 25.0, 45.0, 39.0, 43.0, 75.0, 115.0, 170.0, 118.0, 63.0, 41.0, 44.0, 31.0, 25.0, 15.0, 18.0, 18.0, 8.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.06292724609375, -0.0609898567199707, -0.059052467346191406, -0.05711507797241211, -0.05517768859863281, -0.053240299224853516, -0.05130290985107422, -0.04936552047729492, -0.047428131103515625, -0.04549074172973633, -0.04355335235595703, -0.041615962982177734, -0.03967857360839844, -0.03774118423461914, -0.035803794860839844, -0.03386640548706055, -0.03192901611328125, -0.029991626739501953, -0.028054237365722656, -0.02611684799194336, -0.024179458618164062, -0.022242069244384766, -0.02030467987060547, -0.018367290496826172, -0.016429901123046875, -0.014492511749267578, -0.012555122375488281, -0.010617733001708984, -0.008680343627929688, -0.006742954254150391, -0.004805564880371094, -0.002868175506591797, -0.0009307861328125, 0.0010066032409667969, 0.0029439926147460938, 0.004881381988525391, 0.0068187713623046875, 0.008756160736083984, 0.010693550109863281, 0.012630939483642578, 0.014568328857421875, 0.016505718231201172, 0.01844310760498047, 0.020380496978759766, 0.022317886352539062, 0.02425527572631836, 0.026192665100097656, 0.028130054473876953, 0.03006744384765625, 0.03200483322143555, 0.033942222595214844, 0.03587961196899414, 0.03781700134277344, 0.039754390716552734, 0.04169178009033203, 0.04362916946411133, 0.045566558837890625, 0.04750394821166992, 0.04944133758544922, 0.051378726959228516, 0.05331611633300781, 0.05525350570678711, 0.057190895080566406, 0.0591282844543457, 0.061065673828125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 26.0, 49.0, 167.0, 306.0, 263.0, 135.0, 41.0, 9.0, 8.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6782100200653076, -2.5941450595855713, -2.510079860687256, -2.4260149002075195, -2.341949701309204, -2.2578847408294678, -2.1738195419311523, -2.089754581451416, -2.0056896209716797, -1.9216245412826538, -1.837559461593628, -1.7534945011138916, -1.6694293022155762, -1.5853643417358398, -1.501299262046814, -1.417234182357788, -1.3331689834594727, -1.2491039037704468, -1.165038824081421, -1.0809738636016846, -0.9969087243080139, -0.912843644618988, -0.8287786245346069, -0.744713544845581, -0.6606484651565552, -0.5765833854675293, -0.4925183355808258, -0.4084532856941223, -0.32438820600509644, -0.24032312631607056, -0.15625810623168945, -0.07219302654266357, 0.011872053146362305, 0.09593711793422699, 0.18000218272209167, 0.26406723260879517, 0.34813231229782104, 0.4321973919868469, 0.516262412071228, 0.6003274917602539, 0.6843925714492798, 0.7684576511383057, 0.8525227308273315, 0.9365877509117126, 1.0206527709960938, 1.1047179698944092, 1.1887829303741455, 1.2728480100631714, 1.3569130897521973, 1.4409781694412231, 1.525043249130249, 1.6091082096099854, 1.6931734085083008, 1.777238368988037, 1.861303448677063, 1.9453685283660889, 2.0294337272644043, 2.1134986877441406, 2.197563886642456, 2.2816288471221924, 2.365694046020508, 2.449759006500244, 2.5338239669799805, 2.617889165878296, 2.7019541263580322]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 7.0, 8.0, 11.0, 23.0, 33.0, 31.0, 34.0, 64.0, 47.0, 49.0, 70.0, 61.0, 66.0, 51.0, 69.0, 64.0, 65.0, 41.0, 55.0, 35.0, 36.0, 29.0, 16.0, 11.0, 9.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.8740768432617188, -2.8042612075805664, -2.734445571899414, -2.6646299362182617, -2.5948143005371094, -2.524998664855957, -2.4551830291748047, -2.3853673934936523, -2.3155517578125, -2.2457361221313477, -2.1759204864501953, -2.106104850769043, -2.0362892150878906, -1.9664735794067383, -1.8966578245162964, -1.826842188835144, -1.7570264339447021, -1.6872107982635498, -1.6173951625823975, -1.5475795269012451, -1.4777638912200928, -1.4079482555389404, -1.3381325006484985, -1.2683168649673462, -1.1985012292861938, -1.1286855936050415, -1.0588699579238892, -0.989054262638092, -0.9192386269569397, -0.8494229912757874, -0.7796072959899902, -0.7097916603088379, -0.6399761438369751, -0.5701605081558228, -0.5003448724746704, -0.4305291771888733, -0.36071354150772095, -0.2908979058265686, -0.22108224034309387, -0.15126657485961914, -0.0814509391784668, -0.01163528859615326, 0.05818036198616028, 0.12799601256847382, 0.19781166315078735, 0.2676272988319397, 0.33744296431541443, 0.40725862979888916, 0.4770742654800415, 0.5468899011611938, 0.6167055368423462, 0.6865212321281433, 0.7563368678092957, 0.826152503490448, 0.8959681987762451, 0.9657838344573975, 1.0355994701385498, 1.1054151058197021, 1.1752307415008545, 1.2450463771820068, 1.3148620128631592, 1.3846776485443115, 1.4544934034347534, 1.5243090391159058, 1.594124674797058]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 6.0, 12.0, 10.0, 11.0, 31.0, 27.0, 49.0, 62.0, 113.0, 158.0, 380.0, 1171.0, 6245.0, 152055.0, 3998838.0, 28493.0, 4647.0, 1376.0, 284.0, 123.0, 67.0, 45.0, 16.0, 21.0, 11.0, 9.0, 10.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9306640625, -1.8726959228515625, -1.814727783203125, -1.7567596435546875, -1.69879150390625, -1.6408233642578125, -1.582855224609375, -1.5248870849609375, -1.4669189453125, -1.4089508056640625, -1.350982666015625, -1.2930145263671875, -1.23504638671875, -1.1770782470703125, -1.119110107421875, -1.0611419677734375, -1.003173828125, -0.9452056884765625, -0.887237548828125, -0.8292694091796875, -0.77130126953125, -0.7133331298828125, -0.655364990234375, -0.5973968505859375, -0.5394287109375, -0.4814605712890625, -0.423492431640625, -0.3655242919921875, -0.30755615234375, -0.2495880126953125, -0.191619873046875, -0.1336517333984375, -0.07568359375, -0.0177154541015625, 0.040252685546875, 0.0982208251953125, 0.15618896484375, 0.2141571044921875, 0.272125244140625, 0.3300933837890625, 0.3880615234375, 0.4460296630859375, 0.503997802734375, 0.5619659423828125, 0.61993408203125, 0.6779022216796875, 0.735870361328125, 0.7938385009765625, 0.851806640625, 0.9097747802734375, 0.967742919921875, 1.0257110595703125, 1.08367919921875, 1.1416473388671875, 1.199615478515625, 1.2575836181640625, 1.3155517578125, 1.3735198974609375, 1.431488037109375, 1.4894561767578125, 1.54742431640625, 1.6053924560546875, 1.663360595703125, 1.7213287353515625, 1.779296875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 12.0, 42.0, 80.0, 112.0, 150.0, 178.0, 153.0, 118.0, 73.0, 42.0, 20.0, 14.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.400390625, -1.368194580078125, -1.33599853515625, -1.303802490234375, -1.2716064453125, -1.239410400390625, -1.20721435546875, -1.175018310546875, -1.142822265625, -1.110626220703125, -1.07843017578125, -1.046234130859375, -1.0140380859375, -0.981842041015625, -0.94964599609375, -0.917449951171875, -0.88525390625, -0.853057861328125, -0.82086181640625, -0.788665771484375, -0.7564697265625, -0.724273681640625, -0.69207763671875, -0.659881591796875, -0.627685546875, -0.595489501953125, -0.56329345703125, -0.531097412109375, -0.4989013671875, -0.466705322265625, -0.43450927734375, -0.402313232421875, -0.3701171875, -0.337921142578125, -0.30572509765625, -0.273529052734375, -0.2413330078125, -0.209136962890625, -0.17694091796875, -0.144744873046875, -0.112548828125, -0.080352783203125, -0.04815673828125, -0.015960693359375, 0.0162353515625, 0.048431396484375, 0.08062744140625, 0.112823486328125, 0.14501953125, 0.177215576171875, 0.20941162109375, 0.241607666015625, 0.2738037109375, 0.305999755859375, 0.33819580078125, 0.370391845703125, 0.402587890625, 0.434783935546875, 0.46697998046875, 0.499176025390625, 0.5313720703125, 0.563568115234375, 0.59576416015625, 0.627960205078125, 0.66015625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 9.0, 4.0, 19.0, 54.0, 134.0, 793.0, 6655.0, 4129050.0, 55193.0, 1882.0, 295.0, 93.0, 35.0, 12.0, 11.0, 7.0, 6.0, 3.0, 1.0, 2.0, 7.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.14453125, -4.042816162109375, -3.94110107421875, -3.839385986328125, -3.7376708984375, -3.635955810546875, -3.53424072265625, -3.432525634765625, -3.330810546875, -3.229095458984375, -3.12738037109375, -3.025665283203125, -2.9239501953125, -2.822235107421875, -2.72052001953125, -2.618804931640625, -2.51708984375, -2.415374755859375, -2.31365966796875, -2.211944580078125, -2.1102294921875, -2.008514404296875, -1.90679931640625, -1.805084228515625, -1.703369140625, -1.601654052734375, -1.49993896484375, -1.398223876953125, -1.2965087890625, -1.194793701171875, -1.09307861328125, -0.991363525390625, -0.8896484375, -0.787933349609375, -0.68621826171875, -0.584503173828125, -0.4827880859375, -0.381072998046875, -0.27935791015625, -0.177642822265625, -0.075927734375, 0.025787353515625, 0.12750244140625, 0.229217529296875, 0.3309326171875, 0.432647705078125, 0.53436279296875, 0.636077880859375, 0.73779296875, 0.839508056640625, 0.94122314453125, 1.042938232421875, 1.1446533203125, 1.246368408203125, 1.34808349609375, 1.449798583984375, 1.551513671875, 1.653228759765625, 1.75494384765625, 1.856658935546875, 1.9583740234375, 2.060089111328125, 2.16180419921875, 2.263519287109375, 2.365234375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 0.0, 6.0, 3.0, 6.0, 9.0, 17.0, 29.0, 61.0, 162.0, 665.0, 1759.0, 975.0, 224.0, 78.0, 41.0, 10.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33154296875, -0.31810760498046875, -0.3046722412109375, -0.29123687744140625, -0.277801513671875, -0.26436614990234375, -0.2509307861328125, -0.23749542236328125, -0.22406005859375, -0.21062469482421875, -0.1971893310546875, -0.18375396728515625, -0.170318603515625, -0.15688323974609375, -0.1434478759765625, -0.13001251220703125, -0.1165771484375, -0.10314178466796875, -0.0897064208984375, -0.07627105712890625, -0.062835693359375, -0.04940032958984375, -0.0359649658203125, -0.02252960205078125, -0.00909423828125, 0.00434112548828125, 0.0177764892578125, 0.03121185302734375, 0.044647216796875, 0.05808258056640625, 0.0715179443359375, 0.08495330810546875, 0.098388671875, 0.11182403564453125, 0.1252593994140625, 0.13869476318359375, 0.152130126953125, 0.16556549072265625, 0.1790008544921875, 0.19243621826171875, 0.20587158203125, 0.21930694580078125, 0.2327423095703125, 0.24617767333984375, 0.259613037109375, 0.27304840087890625, 0.2864837646484375, 0.29991912841796875, 0.3133544921875, 0.32678985595703125, 0.3402252197265625, 0.35366058349609375, 0.367095947265625, 0.38053131103515625, 0.3939666748046875, 0.40740203857421875, 0.42083740234375, 0.43427276611328125, 0.4477081298828125, 0.46114349365234375, 0.474578857421875, 0.48801422119140625, 0.5014495849609375, 0.5148849487304688, 0.5283203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 12.0, 20.0, 16.0, 28.0, 26.0, 41.0, 52.0, 64.0, 91.0, 98.0, 112.0, 88.0, 72.0, 51.0, 59.0, 50.0, 34.0, 27.0, 25.0, 10.0, 11.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4316434860229492, -0.41458261013031006, -0.3975217640399933, -0.3804608881473541, -0.36340004205703735, -0.3463391661643982, -0.32927829027175903, -0.3122174143791199, -0.2951565682888031, -0.27809569239616394, -0.26103484630584717, -0.243973970413208, -0.22691310942173004, -0.20985224843025208, -0.19279137253761292, -0.17573051154613495, -0.15866965055465698, -0.14160878956317902, -0.12454792112112045, -0.10748705267906189, -0.09042619168758392, -0.07336533069610596, -0.056304462254047394, -0.03924359381198883, -0.022182732820510864, -0.0051218681037425995, 0.011938996613025665, 0.02899986132979393, 0.046060726046562195, 0.06312158703804016, 0.08018245548009872, 0.09724332392215729, 0.11430424451828003, 0.131365105509758, 0.14842596650123596, 0.16548684239387512, 0.1825477033853531, 0.19960856437683105, 0.21666944026947021, 0.23373030126094818, 0.25079116225242615, 0.2678520381450653, 0.2849128842353821, 0.30197376012802124, 0.3190346360206604, 0.3360954821109772, 0.35315635800361633, 0.3702172040939331, 0.38727807998657227, 0.4043389558792114, 0.4213998019695282, 0.43846067786216736, 0.45552152395248413, 0.4725823998451233, 0.48964327573776245, 0.5067041516304016, 0.523764967918396, 0.5408258438110352, 0.5578867197036743, 0.5749475359916687, 0.5920084118843079, 0.609069287776947, 0.6261301636695862, 0.6431910395622253, 0.6602519154548645]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 13.0, 22.0, 26.0, 22.0, 38.0, 51.0, 61.0, 57.0, 77.0, 86.0, 87.0, 80.0, 65.0, 70.0, 53.0, 48.0, 43.0, 27.0, 28.0, 15.0, 17.0, 7.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5584561228752136, -0.5387117862701416, -0.5189673900604248, -0.4992230236530304, -0.479478657245636, -0.4597342908382416, -0.43998992443084717, -0.42024555802345276, -0.40050119161605835, -0.38075682520866394, -0.36101245880126953, -0.3412680923938751, -0.3215237259864807, -0.3017793595790863, -0.2820349931716919, -0.2622906267642975, -0.24254626035690308, -0.22280189394950867, -0.20305752754211426, -0.18331316113471985, -0.16356879472732544, -0.14382442831993103, -0.12408006191253662, -0.10433569550514221, -0.0845913290977478, -0.0648469626903534, -0.045102596282958984, -0.025358229875564575, -0.005613863468170166, 0.014130502939224243, 0.03387486934661865, 0.05361923575401306, 0.07336366176605225, 0.09310802817344666, 0.11285239458084106, 0.13259676098823547, 0.15234112739562988, 0.1720854938030243, 0.1918298602104187, 0.2115742266178131, 0.23131859302520752, 0.25106295943260193, 0.27080732583999634, 0.29055169224739075, 0.31029605865478516, 0.33004042506217957, 0.349784791469574, 0.3695291578769684, 0.3892735242843628, 0.4090178906917572, 0.4287622570991516, 0.448506623506546, 0.46825098991394043, 0.48799535632133484, 0.5077397227287292, 0.5274840593338013, 0.5472284555435181, 0.5669728517532349, 0.5867171883583069, 0.6064615249633789, 0.6262059211730957, 0.6459503173828125, 0.6656946539878845, 0.6854389905929565, 0.7051833868026733]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 10.0, 15.0, 23.0, 60.0, 87.0, 128.0, 256.0, 489.0, 1196.0, 5889.0, 167497.0, 836595.0, 32276.0, 2421.0, 795.0, 358.0, 198.0, 107.0, 67.0, 33.0, 24.0, 13.0, 7.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2420654296875, -0.23456764221191406, -0.22706985473632812, -0.2195720672607422, -0.21207427978515625, -0.2045764923095703, -0.19707870483398438, -0.18958091735839844, -0.1820831298828125, -0.17458534240722656, -0.16708755493164062, -0.1595897674560547, -0.15209197998046875, -0.1445941925048828, -0.13709640502929688, -0.12959861755371094, -0.122100830078125, -0.11460304260253906, -0.10710525512695312, -0.09960746765136719, -0.09210968017578125, -0.08461189270019531, -0.07711410522460938, -0.06961631774902344, -0.0621185302734375, -0.05462074279785156, -0.047122955322265625, -0.03962516784667969, -0.03212738037109375, -0.024629592895507812, -0.017131805419921875, -0.009634017944335938, -0.00213623046875, 0.0053615570068359375, 0.012859344482421875, 0.020357131958007812, 0.02785491943359375, 0.03535270690917969, 0.042850494384765625, 0.05034828186035156, 0.0578460693359375, 0.06534385681152344, 0.07284164428710938, 0.08033943176269531, 0.08783721923828125, 0.09533500671386719, 0.10283279418945312, 0.11033058166503906, 0.117828369140625, 0.12532615661621094, 0.13282394409179688, 0.1403217315673828, 0.14781951904296875, 0.1553173065185547, 0.16281509399414062, 0.17031288146972656, 0.1778106689453125, 0.18530845642089844, 0.19280624389648438, 0.2003040313720703, 0.20780181884765625, 0.2152996063232422, 0.22279739379882812, 0.23029518127441406, 0.23779296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 9.0, 11.0, 13.0, 23.0, 30.0, 53.0, 51.0, 64.0, 78.0, 89.0, 98.0, 78.0, 67.0, 85.0, 70.0, 57.0, 40.0, 28.0, 23.0, 17.0, 9.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42138671875, -0.4077720642089844, -0.39415740966796875, -0.3805427551269531, -0.3669281005859375, -0.3533134460449219, -0.33969879150390625, -0.3260841369628906, -0.312469482421875, -0.2988548278808594, -0.28524017333984375, -0.2716255187988281, -0.2580108642578125, -0.24439620971679688, -0.23078155517578125, -0.21716690063476562, -0.20355224609375, -0.18993759155273438, -0.17632293701171875, -0.16270828247070312, -0.1490936279296875, -0.13547897338867188, -0.12186431884765625, -0.10824966430664062, -0.094635009765625, -0.08102035522460938, -0.06740570068359375, -0.053791046142578125, -0.0401763916015625, -0.026561737060546875, -0.01294708251953125, 0.000667572021484375, 0.0142822265625, 0.027896881103515625, 0.04151153564453125, 0.055126190185546875, 0.0687408447265625, 0.08235549926757812, 0.09597015380859375, 0.10958480834960938, 0.123199462890625, 0.13681411743164062, 0.15042877197265625, 0.16404342651367188, 0.1776580810546875, 0.19127273559570312, 0.20488739013671875, 0.21850204467773438, 0.23211669921875, 0.24573135375976562, 0.25934600830078125, 0.2729606628417969, 0.2865753173828125, 0.3001899719238281, 0.31380462646484375, 0.3274192810058594, 0.341033935546875, 0.3546485900878906, 0.36826324462890625, 0.3818778991699219, 0.3954925537109375, 0.4091072082519531, 0.42272186279296875, 0.4363365173339844, 0.449951171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 9.0, 8.0, 6.0, 16.0, 16.0, 44.0, 59.0, 84.0, 136.0, 201.0, 312.0, 503.0, 856.0, 1387.0, 2339.0, 4151.0, 7513.0, 13888.0, 26768.0, 53197.0, 105627.0, 190427.0, 248172.0, 183797.0, 101608.0, 51054.0, 25837.0, 13429.0, 7213.0, 4023.0, 2311.0, 1381.0, 829.0, 509.0, 289.0, 203.0, 129.0, 67.0, 52.0, 43.0, 33.0, 12.0, 8.0, 5.0, 6.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032928466796875, -0.03177165985107422, -0.030614852905273438, -0.029458045959472656, -0.028301239013671875, -0.027144432067871094, -0.025987625122070312, -0.02483081817626953, -0.02367401123046875, -0.02251720428466797, -0.021360397338867188, -0.020203590393066406, -0.019046783447265625, -0.017889976501464844, -0.016733169555664062, -0.015576362609863281, -0.0144195556640625, -0.013262748718261719, -0.012105941772460938, -0.010949134826660156, -0.009792327880859375, -0.008635520935058594, -0.0074787139892578125, -0.006321907043457031, -0.00516510009765625, -0.004008293151855469, -0.0028514862060546875, -0.0016946792602539062, -0.000537872314453125, 0.0006189346313476562, 0.0017757415771484375, 0.0029325485229492188, 0.00408935546875, 0.005246162414550781, 0.0064029693603515625, 0.007559776306152344, 0.008716583251953125, 0.009873390197753906, 0.011030197143554688, 0.012187004089355469, 0.01334381103515625, 0.014500617980957031, 0.015657424926757812, 0.016814231872558594, 0.017971038818359375, 0.019127845764160156, 0.020284652709960938, 0.02144145965576172, 0.0225982666015625, 0.02375507354736328, 0.024911880493164062, 0.026068687438964844, 0.027225494384765625, 0.028382301330566406, 0.029539108276367188, 0.03069591522216797, 0.03185272216796875, 0.03300952911376953, 0.03416633605957031, 0.035323143005371094, 0.036479949951171875, 0.037636756896972656, 0.03879356384277344, 0.03995037078857422, 0.041107177734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 7.0, 11.0, 8.0, 14.0, 18.0, 16.0, 9.0, 20.0, 27.0, 34.0, 44.0, 47.0, 41.0, 42.0, 41.0, 32.0, 36.0, 47.0, 46.0, 53.0, 47.0, 46.0, 39.0, 38.0, 42.0, 29.0, 30.0, 14.0, 22.0, 21.0, 15.0, 13.0, 12.0, 5.0, 7.0, 2.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.6357421875, -0.6165618896484375, -0.597381591796875, -0.5782012939453125, -0.55902099609375, -0.5398406982421875, -0.520660400390625, -0.5014801025390625, -0.4822998046875, -0.4631195068359375, -0.443939208984375, -0.4247589111328125, -0.40557861328125, -0.3863983154296875, -0.367218017578125, -0.3480377197265625, -0.328857421875, -0.3096771240234375, -0.290496826171875, -0.2713165283203125, -0.25213623046875, -0.2329559326171875, -0.213775634765625, -0.1945953369140625, -0.1754150390625, -0.1562347412109375, -0.137054443359375, -0.1178741455078125, -0.09869384765625, -0.0795135498046875, -0.060333251953125, -0.0411529541015625, -0.02197265625, -0.0027923583984375, 0.016387939453125, 0.0355682373046875, 0.05474853515625, 0.0739288330078125, 0.093109130859375, 0.1122894287109375, 0.1314697265625, 0.1506500244140625, 0.169830322265625, 0.1890106201171875, 0.20819091796875, 0.2273712158203125, 0.246551513671875, 0.2657318115234375, 0.284912109375, 0.3040924072265625, 0.323272705078125, 0.3424530029296875, 0.36163330078125, 0.3808135986328125, 0.399993896484375, 0.4191741943359375, 0.4383544921875, 0.4575347900390625, 0.476715087890625, 0.4958953857421875, 0.51507568359375, 0.5342559814453125, 0.553436279296875, 0.5726165771484375, 0.591796875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 5.0, 8.0, 10.0, 18.0, 24.0, 24.0, 50.0, 85.0, 142.0, 227.0, 443.0, 794.0, 1510.0, 3205.0, 8307.0, 27791.0, 139172.0, 628055.0, 187617.0, 34341.0, 9503.0, 3590.0, 1643.0, 809.0, 477.0, 270.0, 154.0, 108.0, 53.0, 37.0, 27.0, 16.0, 13.0, 7.0, 14.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007808685302734375, -0.007553279399871826, -0.007297873497009277, -0.0070424675941467285, -0.00678706169128418, -0.006531655788421631, -0.006276249885559082, -0.006020843982696533, -0.005765438079833984, -0.0055100321769714355, -0.005254626274108887, -0.004999220371246338, -0.004743814468383789, -0.00448840856552124, -0.004233002662658691, -0.003977596759796143, -0.0037221908569335938, -0.003466784954071045, -0.003211379051208496, -0.0029559731483459473, -0.0027005672454833984, -0.0024451613426208496, -0.0021897554397583008, -0.001934349536895752, -0.0016789436340332031, -0.0014235377311706543, -0.0011681318283081055, -0.0009127259254455566, -0.0006573200225830078, -0.000401914119720459, -0.00014650821685791016, 0.00010889768600463867, 0.0003643035888671875, 0.0006197094917297363, 0.0008751153945922852, 0.001130521297454834, 0.0013859272003173828, 0.0016413331031799316, 0.0018967390060424805, 0.0021521449089050293, 0.002407550811767578, 0.002662956714630127, 0.0029183626174926758, 0.0031737685203552246, 0.0034291744232177734, 0.0036845803260803223, 0.003939986228942871, 0.00419539213180542, 0.004450798034667969, 0.004706203937530518, 0.004961609840393066, 0.005217015743255615, 0.005472421646118164, 0.005727827548980713, 0.005983233451843262, 0.0062386393547058105, 0.006494045257568359, 0.006749451160430908, 0.007004857063293457, 0.007260262966156006, 0.007515668869018555, 0.0077710747718811035, 0.008026480674743652, 0.008281886577606201, 0.00853729248046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 4.0, 17.0, 10.0, 13.0, 33.0, 32.0, 68.0, 88.0, 155.0, 151.0, 143.0, 96.0, 65.0, 48.0, 24.0, 10.0, 10.0, 12.0, 12.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2814998626708984e-05, -1.2191012501716614e-05, -1.1567026376724243e-05, -1.0943040251731873e-05, -1.0319054126739502e-05, -9.695068001747131e-06, -9.07108187675476e-06, -8.44709575176239e-06, -7.82310962677002e-06, -7.199123501777649e-06, -6.575137376785278e-06, -5.951151251792908e-06, -5.327165126800537e-06, -4.7031790018081665e-06, -4.079192876815796e-06, -3.4552067518234253e-06, -2.8312206268310547e-06, -2.207234501838684e-06, -1.5832483768463135e-06, -9.592622518539429e-07, -3.3527612686157227e-07, 2.8870999813079834e-07, 9.126961231231689e-07, 1.5366822481155396e-06, 2.16066837310791e-06, 2.7846544981002808e-06, 3.4086406230926514e-06, 4.032626748085022e-06, 4.656612873077393e-06, 5.280598998069763e-06, 5.904585123062134e-06, 6.528571248054504e-06, 7.152557373046875e-06, 7.776543498039246e-06, 8.400529623031616e-06, 9.024515748023987e-06, 9.648501873016357e-06, 1.0272487998008728e-05, 1.0896474123001099e-05, 1.152046024799347e-05, 1.214444637298584e-05, 1.276843249797821e-05, 1.3392418622970581e-05, 1.4016404747962952e-05, 1.4640390872955322e-05, 1.5264376997947693e-05, 1.5888363122940063e-05, 1.6512349247932434e-05, 1.7136335372924805e-05, 1.7760321497917175e-05, 1.8384307622909546e-05, 1.9008293747901917e-05, 1.9632279872894287e-05, 2.0256265997886658e-05, 2.088025212287903e-05, 2.15042382478714e-05, 2.212822437286377e-05, 2.275221049785614e-05, 2.337619662284851e-05, 2.400018274784088e-05, 2.4624168872833252e-05, 2.5248154997825623e-05, 2.5872141122817993e-05, 2.6496127247810364e-05, 2.7120113372802734e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 11.0, 11.0, 9.0, 22.0, 28.0, 43.0, 74.0, 78.0, 121.0, 158.0, 244.0, 413.0, 506.0, 885.0, 1440.0, 2181.0, 4092.0, 7930.0, 17160.0, 43304.0, 136800.0, 423125.0, 275914.0, 79222.0, 28506.0, 12278.0, 5962.0, 3179.0, 1807.0, 1083.0, 638.0, 447.0, 273.0, 198.0, 129.0, 93.0, 59.0, 39.0, 19.0, 25.0, 20.0, 10.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00568389892578125, -0.005510449409484863, -0.0053369998931884766, -0.00516355037689209, -0.004990100860595703, -0.004816651344299316, -0.00464320182800293, -0.004469752311706543, -0.004296302795410156, -0.0041228532791137695, -0.003949403762817383, -0.003775954246520996, -0.0036025047302246094, -0.0034290552139282227, -0.003255605697631836, -0.0030821561813354492, -0.0029087066650390625, -0.0027352571487426758, -0.002561807632446289, -0.0023883581161499023, -0.0022149085998535156, -0.002041459083557129, -0.0018680095672607422, -0.0016945600509643555, -0.0015211105346679688, -0.001347661018371582, -0.0011742115020751953, -0.0010007619857788086, -0.0008273124694824219, -0.0006538629531860352, -0.00048041343688964844, -0.0003069639205932617, -0.000133514404296875, 3.993511199951172e-05, 0.00021338462829589844, 0.00038683414459228516, 0.0005602836608886719, 0.0007337331771850586, 0.0009071826934814453, 0.001080632209777832, 0.0012540817260742188, 0.0014275312423706055, 0.0016009807586669922, 0.001774430274963379, 0.0019478797912597656, 0.0021213293075561523, 0.002294778823852539, 0.0024682283401489258, 0.0026416778564453125, 0.0028151273727416992, 0.002988576889038086, 0.0031620264053344727, 0.0033354759216308594, 0.003508925437927246, 0.003682374954223633, 0.0038558244705200195, 0.004029273986816406, 0.004202723503112793, 0.00437617301940918, 0.004549622535705566, 0.004723072052001953, 0.00489652156829834, 0.0050699710845947266, 0.005243420600891113, 0.0054168701171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 6.0, 6.0, 5.0, 7.0, 11.0, 14.0, 12.0, 19.0, 34.0, 31.0, 67.0, 86.0, 108.0, 109.0, 105.0, 90.0, 77.0, 45.0, 52.0, 32.0, 22.0, 15.0, 8.0, 12.0, 6.0, 3.0, 4.0, 4.0, 4.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002147674560546875, -0.002077728509902954, -0.002007782459259033, -0.0019378364086151123, -0.0018678903579711914, -0.0017979443073272705, -0.0017279982566833496, -0.0016580522060394287, -0.0015881061553955078, -0.001518160104751587, -0.001448214054107666, -0.0013782680034637451, -0.0013083219528198242, -0.0012383759021759033, -0.0011684298515319824, -0.0010984838008880615, -0.0010285377502441406, -0.0009585916996002197, -0.0008886456489562988, -0.0008186995983123779, -0.000748753547668457, -0.0006788074970245361, -0.0006088614463806152, -0.0005389153957366943, -0.00046896934509277344, -0.00039902329444885254, -0.00032907724380493164, -0.00025913119316101074, -0.00018918514251708984, -0.00011923909187316895, -4.929304122924805e-05, 2.065300941467285e-05, 9.059906005859375e-05, 0.00016054511070251465, 0.00023049116134643555, 0.00030043721199035645, 0.00037038326263427734, 0.00044032931327819824, 0.0005102753639221191, 0.00058022141456604, 0.0006501674652099609, 0.0007201135158538818, 0.0007900595664978027, 0.0008600056171417236, 0.0009299516677856445, 0.0009998977184295654, 0.0010698437690734863, 0.0011397898197174072, 0.0012097358703613281, 0.001279681921005249, 0.00134962797164917, 0.0014195740222930908, 0.0014895200729370117, 0.0015594661235809326, 0.0016294121742248535, 0.0016993582248687744, 0.0017693042755126953, 0.0018392503261566162, 0.0019091963768005371, 0.001979142427444458, 0.002049088478088379, 0.0021190345287323, 0.0021889805793762207, 0.0022589266300201416, 0.0023288726806640625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 11.0, 16.0, 30.0, 37.0, 52.0, 78.0, 102.0, 149.0, 118.0, 121.0, 77.0, 76.0, 45.0, 33.0, 20.0, 19.0, 6.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3188175559043884, -0.3051067590713501, -0.2913959324359894, -0.27768513560295105, -0.26397430896759033, -0.250263512134552, -0.23655270040035248, -0.22284188866615295, -0.20913109183311462, -0.1954202800989151, -0.18170946836471558, -0.16799867153167725, -0.15428785979747772, -0.1405770480632782, -0.12686623632907867, -0.11315543204545975, -0.09944461286067963, -0.0857338011264801, -0.07202299684286118, -0.05831218510866165, -0.044601377099752426, -0.0308905690908432, -0.017179757356643677, -0.0034689530730247498, 0.010241858661174774, 0.023952666670084, 0.037663474678993225, 0.05137428641319275, 0.06508509814739227, 0.0787959024310112, 0.09250671416521072, 0.10621751844882965, 0.11992833018302917, 0.1336391419172287, 0.14734995365142822, 0.16106075048446655, 0.17477156221866608, 0.1884823739528656, 0.20219318568706512, 0.21590399742126465, 0.22961479425430298, 0.2433256059885025, 0.257036417722702, 0.27074721455574036, 0.2844580411911011, 0.2981688380241394, 0.31187963485717773, 0.32559046149253845, 0.33930128812789917, 0.3530120849609375, 0.3667229115962982, 0.38043370842933655, 0.39414453506469727, 0.4078553318977356, 0.4215661287307739, 0.43527695536613464, 0.448987752199173, 0.4626985490322113, 0.476409375667572, 0.49012017250061035, 0.5038309693336487, 0.517541766166687, 0.5312526226043701, 0.5449634194374084, 0.5586742162704468]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 11.0, 13.0, 20.0, 28.0, 32.0, 45.0, 62.0, 68.0, 69.0, 95.0, 85.0, 88.0, 81.0, 72.0, 54.0, 51.0, 45.0, 27.0, 21.0, 18.0, 10.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38540777564048767, -0.37241607904434204, -0.3594244122505188, -0.34643271565437317, -0.33344101905822754, -0.3204493224620819, -0.3074576258659363, -0.29446595907211304, -0.2814742624759674, -0.2684825658798218, -0.25549089908599854, -0.2424992024898529, -0.22950750589370728, -0.21651580929756165, -0.2035241276025772, -0.19053244590759277, -0.17754074931144714, -0.1645490527153015, -0.15155737102031708, -0.13856568932533264, -0.125573992729187, -0.11258230358362198, -0.09959061443805695, -0.08659892529249191, -0.07360723614692688, -0.06061554700136185, -0.047623857855796814, -0.03463216871023178, -0.021640479564666748, -0.008648790419101715, 0.004342898726463318, 0.01733458787202835, 0.030326247215270996, 0.04331793636083603, 0.05630962550640106, 0.0693013146519661, 0.08229300379753113, 0.09528469294309616, 0.1082763820886612, 0.12126807123422623, 0.13425976037979126, 0.1472514569759369, 0.16024313867092133, 0.17323482036590576, 0.1862265169620514, 0.19921821355819702, 0.21220989525318146, 0.2252015769481659, 0.23819327354431152, 0.25118497014045715, 0.2641766667366028, 0.277168333530426, 0.29016003012657166, 0.3031517267227173, 0.3161433935165405, 0.32913509011268616, 0.3421267867088318, 0.3551184833049774, 0.36811017990112305, 0.3811018466949463, 0.3940935432910919, 0.40708523988723755, 0.4200769066810608, 0.4330686032772064, 0.44606029987335205]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 2.0, 9.0, 5.0, 13.0, 27.0, 45.0, 65.0, 94.0, 200.0, 377.0, 757.0, 1723.0, 4207.0, 11567.0, 35761.0, 126837.0, 504472.0, 265874.0, 64660.0, 19900.0, 7030.0, 2662.0, 1149.0, 528.0, 244.0, 124.0, 84.0, 71.0, 33.0, 19.0, 10.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.395751953125, -0.3814888000488281, -0.36722564697265625, -0.3529624938964844, -0.3386993408203125, -0.3244361877441406, -0.31017303466796875, -0.2959098815917969, -0.281646728515625, -0.2673835754394531, -0.25312042236328125, -0.23885726928710938, -0.2245941162109375, -0.21033096313476562, -0.19606781005859375, -0.18180465698242188, -0.16754150390625, -0.15327835083007812, -0.13901519775390625, -0.12475204467773438, -0.1104888916015625, -0.09622573852539062, -0.08196258544921875, -0.06769943237304688, -0.053436279296875, -0.039173126220703125, -0.02490997314453125, -0.010646820068359375, 0.0036163330078125, 0.017879486083984375, 0.03214263916015625, 0.046405792236328125, 0.0606689453125, 0.07493209838867188, 0.08919525146484375, 0.10345840454101562, 0.1177215576171875, 0.13198471069335938, 0.14624786376953125, 0.16051101684570312, 0.174774169921875, 0.18903732299804688, 0.20330047607421875, 0.21756362915039062, 0.2318267822265625, 0.24608993530273438, 0.26035308837890625, 0.2746162414550781, 0.28887939453125, 0.3031425476074219, 0.31740570068359375, 0.3316688537597656, 0.3459320068359375, 0.3601951599121094, 0.37445831298828125, 0.3887214660644531, 0.402984619140625, 0.4172477722167969, 0.43151092529296875, 0.4457740783691406, 0.4600372314453125, 0.4743003845214844, 0.48856353759765625, 0.5028266906738281, 0.51708984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 6.0, 7.0, 9.0, 11.0, 16.0, 20.0, 26.0, 34.0, 41.0, 44.0, 55.0, 55.0, 51.0, 69.0, 67.0, 66.0, 58.0, 55.0, 65.0, 46.0, 42.0, 31.0, 32.0, 27.0, 19.0, 13.0, 10.0, 13.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.335693359375, -0.3195610046386719, -0.30342864990234375, -0.2872962951660156, -0.2711639404296875, -0.2550315856933594, -0.23889923095703125, -0.22276687622070312, -0.206634521484375, -0.19050216674804688, -0.17436981201171875, -0.15823745727539062, -0.1421051025390625, -0.12597274780273438, -0.10984039306640625, -0.09370803833007812, -0.07757568359375, -0.061443328857421875, -0.04531097412109375, -0.029178619384765625, -0.0130462646484375, 0.003086090087890625, 0.01921844482421875, 0.035350799560546875, 0.051483154296875, 0.06761550903320312, 0.08374786376953125, 0.09988021850585938, 0.1160125732421875, 0.13214492797851562, 0.14827728271484375, 0.16440963745117188, 0.1805419921875, 0.19667434692382812, 0.21280670166015625, 0.22893905639648438, 0.2450714111328125, 0.2612037658691406, 0.27733612060546875, 0.2934684753417969, 0.309600830078125, 0.3257331848144531, 0.34186553955078125, 0.3579978942871094, 0.3741302490234375, 0.3902626037597656, 0.40639495849609375, 0.4225273132324219, 0.43865966796875, 0.4547920227050781, 0.47092437744140625, 0.4870567321777344, 0.5031890869140625, 0.5193214416503906, 0.5354537963867188, 0.5515861511230469, 0.567718505859375, 0.5838508605957031, 0.5999832153320312, 0.6161155700683594, 0.6322479248046875, 0.6483802795410156, 0.6645126342773438, 0.6806449890136719, 0.69677734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 10.0, 8.0, 18.0, 17.0, 45.0, 72.0, 127.0, 279.0, 569.0, 1305.0, 4040.0, 15575.0, 87739.0, 656139.0, 238691.0, 32900.0, 7208.0, 2205.0, 838.0, 353.0, 191.0, 91.0, 53.0, 31.0, 18.0, 7.0, 7.0, 9.0, 3.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70068359375, -0.6771163940429688, -0.6535491943359375, -0.6299819946289062, -0.606414794921875, -0.5828475952148438, -0.5592803955078125, -0.5357131958007812, -0.51214599609375, -0.48857879638671875, -0.4650115966796875, -0.44144439697265625, -0.417877197265625, -0.39430999755859375, -0.3707427978515625, -0.34717559814453125, -0.3236083984375, -0.30004119873046875, -0.2764739990234375, -0.25290679931640625, -0.229339599609375, -0.20577239990234375, -0.1822052001953125, -0.15863800048828125, -0.13507080078125, -0.11150360107421875, -0.0879364013671875, -0.06436920166015625, -0.040802001953125, -0.01723480224609375, 0.0063323974609375, 0.02989959716796875, 0.053466796875, 0.07703399658203125, 0.1006011962890625, 0.12416839599609375, 0.147735595703125, 0.17130279541015625, 0.1948699951171875, 0.21843719482421875, 0.24200439453125, 0.26557159423828125, 0.2891387939453125, 0.31270599365234375, 0.336273193359375, 0.35984039306640625, 0.3834075927734375, 0.40697479248046875, 0.4305419921875, 0.45410919189453125, 0.4776763916015625, 0.5012435913085938, 0.524810791015625, 0.5483779907226562, 0.5719451904296875, 0.5955123901367188, 0.61907958984375, 0.6426467895507812, 0.6662139892578125, 0.6897811889648438, 0.713348388671875, 0.7369155883789062, 0.7604827880859375, 0.7840499877929688, 0.8076171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 8.0, 3.0, 12.0, 16.0, 25.0, 40.0, 45.0, 73.0, 85.0, 79.0, 93.0, 114.0, 93.0, 88.0, 55.0, 49.0, 47.0, 27.0, 17.0, 11.0, 5.0, 11.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.05078125, -1.02239990234375, -0.9940185546875, -0.96563720703125, -0.937255859375, -0.90887451171875, -0.8804931640625, -0.85211181640625, -0.82373046875, -0.79534912109375, -0.7669677734375, -0.73858642578125, -0.710205078125, -0.68182373046875, -0.6534423828125, -0.62506103515625, -0.5966796875, -0.56829833984375, -0.5399169921875, -0.51153564453125, -0.483154296875, -0.45477294921875, -0.4263916015625, -0.39801025390625, -0.36962890625, -0.34124755859375, -0.3128662109375, -0.28448486328125, -0.256103515625, -0.22772216796875, -0.1993408203125, -0.17095947265625, -0.142578125, -0.11419677734375, -0.0858154296875, -0.05743408203125, -0.029052734375, -0.00067138671875, 0.0277099609375, 0.05609130859375, 0.08447265625, 0.11285400390625, 0.1412353515625, 0.16961669921875, 0.197998046875, 0.22637939453125, 0.2547607421875, 0.28314208984375, 0.3115234375, 0.33990478515625, 0.3682861328125, 0.39666748046875, 0.425048828125, 0.45343017578125, 0.4818115234375, 0.51019287109375, 0.53857421875, 0.56695556640625, 0.5953369140625, 0.62371826171875, 0.652099609375, 0.68048095703125, 0.7088623046875, 0.73724365234375, 0.765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 4.0, 8.0, 13.0, 7.0, 17.0, 32.0, 32.0, 39.0, 58.0, 107.0, 135.0, 200.0, 360.0, 607.0, 1171.0, 2261.0, 4507.0, 9922.0, 23467.0, 62381.0, 199644.0, 487414.0, 165309.0, 53028.0, 20442.0, 8693.0, 4109.0, 1976.0, 1079.0, 577.0, 321.0, 197.0, 126.0, 80.0, 60.0, 50.0, 35.0, 23.0, 11.0, 16.0, 12.0, 9.0, 8.0, 1.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.047943115234375, -0.04646444320678711, -0.04498577117919922, -0.04350709915161133, -0.04202842712402344, -0.04054975509643555, -0.039071083068847656, -0.037592411041259766, -0.036113739013671875, -0.034635066986083984, -0.033156394958496094, -0.0316777229309082, -0.030199050903320312, -0.028720378875732422, -0.02724170684814453, -0.02576303482055664, -0.02428436279296875, -0.02280569076538086, -0.02132701873779297, -0.019848346710205078, -0.018369674682617188, -0.016891002655029297, -0.015412330627441406, -0.013933658599853516, -0.012454986572265625, -0.010976314544677734, -0.009497642517089844, -0.008018970489501953, -0.0065402984619140625, -0.005061626434326172, -0.0035829544067382812, -0.0021042823791503906, -0.0006256103515625, 0.0008530616760253906, 0.0023317337036132812, 0.003810405731201172, 0.0052890777587890625, 0.006767749786376953, 0.008246421813964844, 0.009725093841552734, 0.011203765869140625, 0.012682437896728516, 0.014161109924316406, 0.015639781951904297, 0.017118453979492188, 0.018597126007080078, 0.02007579803466797, 0.02155447006225586, 0.02303314208984375, 0.02451181411743164, 0.02599048614501953, 0.027469158172607422, 0.028947830200195312, 0.030426502227783203, 0.031905174255371094, 0.033383846282958984, 0.034862518310546875, 0.036341190338134766, 0.037819862365722656, 0.03929853439331055, 0.04077720642089844, 0.04225587844848633, 0.04373455047607422, 0.04521322250366211, 0.04669189453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 7.0, 8.0, 12.0, 16.0, 24.0, 18.0, 26.0, 38.0, 47.0, 70.0, 70.0, 92.0, 137.0, 97.0, 75.0, 48.0, 45.0, 36.0, 36.0, 31.0, 18.0, 14.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.6450881958007812e-05, -1.604389399290085e-05, -1.5636906027793884e-05, -1.522991806268692e-05, -1.4822930097579956e-05, -1.4415942132472992e-05, -1.4008954167366028e-05, -1.3601966202259064e-05, -1.31949782371521e-05, -1.2787990272045135e-05, -1.2381002306938171e-05, -1.1974014341831207e-05, -1.1567026376724243e-05, -1.1160038411617279e-05, -1.0753050446510315e-05, -1.034606248140335e-05, -9.939074516296387e-06, -9.532086551189423e-06, -9.125098586082458e-06, -8.718110620975494e-06, -8.31112265586853e-06, -7.904134690761566e-06, -7.497146725654602e-06, -7.090158760547638e-06, -6.683170795440674e-06, -6.27618283033371e-06, -5.869194865226746e-06, -5.4622069001197815e-06, -5.055218935012817e-06, -4.648230969905853e-06, -4.241243004798889e-06, -3.834255039691925e-06, -3.427267074584961e-06, -3.020279109477997e-06, -2.6132911443710327e-06, -2.2063031792640686e-06, -1.7993152141571045e-06, -1.3923272490501404e-06, -9.853392839431763e-07, -5.783513188362122e-07, -1.7136335372924805e-07, 2.3562461137771606e-07, 6.426125764846802e-07, 1.0496005415916443e-06, 1.4565885066986084e-06, 1.8635764718055725e-06, 2.2705644369125366e-06, 2.6775524020195007e-06, 3.084540367126465e-06, 3.491528332233429e-06, 3.898516297340393e-06, 4.305504262447357e-06, 4.712492227554321e-06, 5.119480192661285e-06, 5.5264681577682495e-06, 5.933456122875214e-06, 6.340444087982178e-06, 6.747432053089142e-06, 7.154420018196106e-06, 7.56140798330307e-06, 7.968395948410034e-06, 8.375383913516998e-06, 8.782371878623962e-06, 9.189359843730927e-06, 9.59634780883789e-06]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 9.0, 5.0, 23.0, 16.0, 17.0, 18.0, 31.0, 48.0, 85.0, 99.0, 180.0, 309.0, 633.0, 1202.0, 2635.0, 7330.0, 30766.0, 260703.0, 664896.0, 60449.0, 11904.0, 3799.0, 1584.0, 789.0, 404.0, 206.0, 138.0, 77.0, 49.0, 35.0, 21.0, 21.0, 18.0, 9.0, 9.0, 3.0, 6.0, 7.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1353759765625, -0.13103485107421875, -0.1266937255859375, -0.12235260009765625, -0.118011474609375, -0.11367034912109375, -0.1093292236328125, -0.10498809814453125, -0.10064697265625, -0.09630584716796875, -0.0919647216796875, -0.08762359619140625, -0.083282470703125, -0.07894134521484375, -0.0746002197265625, -0.07025909423828125, -0.06591796875, -0.06157684326171875, -0.0572357177734375, -0.05289459228515625, -0.048553466796875, -0.04421234130859375, -0.0398712158203125, -0.03553009033203125, -0.03118896484375, -0.02684783935546875, -0.0225067138671875, -0.01816558837890625, -0.013824462890625, -0.00948333740234375, -0.0051422119140625, -0.00080108642578125, 0.0035400390625, 0.00788116455078125, 0.0122222900390625, 0.01656341552734375, 0.020904541015625, 0.02524566650390625, 0.0295867919921875, 0.03392791748046875, 0.03826904296875, 0.04261016845703125, 0.0469512939453125, 0.05129241943359375, 0.055633544921875, 0.05997467041015625, 0.0643157958984375, 0.06865692138671875, 0.072998046875, 0.07733917236328125, 0.0816802978515625, 0.08602142333984375, 0.090362548828125, 0.09470367431640625, 0.0990447998046875, 0.10338592529296875, 0.10772705078125, 0.11206817626953125, 0.1164093017578125, 0.12075042724609375, 0.125091552734375, 0.12943267822265625, 0.1337738037109375, 0.13811492919921875, 0.1424560546875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 4.0, 8.0, 11.0, 29.0, 26.0, 51.0, 74.0, 104.0, 219.0, 156.0, 107.0, 69.0, 45.0, 31.0, 21.0, 12.0, 13.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0767822265625, -0.07451820373535156, -0.07225418090820312, -0.06999015808105469, -0.06772613525390625, -0.06546211242675781, -0.06319808959960938, -0.06093406677246094, -0.0586700439453125, -0.05640602111816406, -0.054141998291015625, -0.05187797546386719, -0.04961395263671875, -0.04734992980957031, -0.045085906982421875, -0.04282188415527344, -0.040557861328125, -0.03829383850097656, -0.036029815673828125, -0.03376579284667969, -0.03150177001953125, -0.029237747192382812, -0.026973724365234375, -0.024709701538085938, -0.0224456787109375, -0.020181655883789062, -0.017917633056640625, -0.015653610229492188, -0.01338958740234375, -0.011125564575195312, -0.008861541748046875, -0.0065975189208984375, -0.00433349609375, -0.0020694732666015625, 0.000194549560546875, 0.0024585723876953125, 0.00472259521484375, 0.0069866180419921875, 0.009250640869140625, 0.011514663696289062, 0.0137786865234375, 0.016042709350585938, 0.018306732177734375, 0.020570755004882812, 0.02283477783203125, 0.025098800659179688, 0.027362823486328125, 0.029626846313476562, 0.031890869140625, 0.03415489196777344, 0.036418914794921875, 0.03868293762207031, 0.04094696044921875, 0.04321098327636719, 0.045475006103515625, 0.04773902893066406, 0.0500030517578125, 0.05226707458496094, 0.054531097412109375, 0.05679512023925781, 0.05905914306640625, 0.06132316589355469, 0.06358718872070312, 0.06585121154785156, 0.068115234375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 10.0, 13.0, 24.0, 43.0, 78.0, 110.0, 164.0, 185.0, 125.0, 105.0, 57.0, 39.0, 19.0, 7.0, 9.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6336028575897217, -0.5988421440124512, -0.5640814304351807, -0.5293207168579102, -0.49456000328063965, -0.45979928970336914, -0.42503857612609863, -0.3902778625488281, -0.3555171489715576, -0.3207564353942871, -0.2859957218170166, -0.2512350082397461, -0.21647429466247559, -0.18171358108520508, -0.14695286750793457, -0.11219215393066406, -0.07743144035339355, -0.04267072677612305, -0.007910013198852539, 0.02685070037841797, 0.06161141395568848, 0.09637212753295898, 0.1311328411102295, 0.1658935546875, 0.2006542682647705, 0.23541498184204102, 0.2701756954193115, 0.30493640899658203, 0.33969712257385254, 0.37445783615112305, 0.40921854972839355, 0.44397926330566406, 0.4787400960922241, 0.5135008096694946, 0.5482615232467651, 0.5830222368240356, 0.6177829504013062, 0.6525436639785767, 0.6873043775558472, 0.7220650911331177, 0.7568258047103882, 0.7915865182876587, 0.8263472318649292, 0.8611079454421997, 0.8958686590194702, 0.9306293725967407, 0.9653900861740112, 1.0001507997512817, 1.0349115133285522, 1.0696722269058228, 1.1044329404830933, 1.1391936540603638, 1.1739543676376343, 1.2087150812149048, 1.2434757947921753, 1.2782365083694458, 1.3129972219467163, 1.3477579355239868, 1.3825186491012573, 1.4172793626785278, 1.4520400762557983, 1.4868007898330688, 1.5215615034103394, 1.5563222169876099, 1.5910829305648804]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 11.0, 7.0, 7.0, 18.0, 14.0, 23.0, 20.0, 19.0, 29.0, 25.0, 40.0, 54.0, 48.0, 38.0, 49.0, 41.0, 58.0, 61.0, 50.0, 58.0, 35.0, 30.0, 46.0, 40.0, 32.0, 27.0, 29.0, 17.0, 16.0, 11.0, 13.0, 10.0, 5.0, 12.0, 8.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6061323285102844, -0.5808848738670349, -0.5556374192237854, -0.5303899645805359, -0.5051425099372864, -0.47989505529403687, -0.45464757084846497, -0.42940011620521545, -0.40415266156196594, -0.37890520691871643, -0.3536577522754669, -0.328410267829895, -0.3031628131866455, -0.277915358543396, -0.2526679039001465, -0.22742044925689697, -0.20217299461364746, -0.17692553997039795, -0.15167808532714844, -0.12643061578273773, -0.10118316113948822, -0.07593570649623871, -0.050688236951828, -0.02544078230857849, -0.0001933276653289795, 0.02505413070321083, 0.05030158907175064, 0.07554905116558075, 0.10079650580883026, 0.12604396045207977, 0.15129142999649048, 0.17653888463974, 0.20178639888763428, 0.2270338535308838, 0.2522813081741333, 0.2775287628173828, 0.3027762174606323, 0.32802367210388184, 0.35327115654945374, 0.37851861119270325, 0.40376606583595276, 0.42901352047920227, 0.4542609751224518, 0.4795084595680237, 0.5047559142112732, 0.5300033688545227, 0.5552508234977722, 0.5804982781410217, 0.6057457327842712, 0.6309931874275208, 0.6562406420707703, 0.6814880967140198, 0.7067355513572693, 0.7319830060005188, 0.7572305202484131, 0.7824779748916626, 0.8077254295349121, 0.8329728841781616, 0.8582203388214111, 0.8834677934646606, 0.9087152481079102, 0.9339627027511597, 0.9592101573944092, 0.9844576120376587, 1.0097050666809082]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 10.0, 9.0, 28.0, 25.0, 51.0, 52.0, 67.0, 81.0, 118.0, 143.0, 182.0, 227.0, 342.0, 431.0, 644.0, 1045357.0, 736.0, 540.0, 360.0, 300.0, 210.0, 164.0, 123.0, 94.0, 78.0, 71.0, 32.0, 42.0, 25.0, 22.0, 11.0, 10.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0399229526519775, -1.0011014938354492, -0.9622799754142761, -0.923458456993103, -0.8846369981765747, -0.8458155393600464, -0.8069940209388733, -0.7681725025177002, -0.7293510437011719, -0.6905295848846436, -0.6517080664634705, -0.6128865480422974, -0.574065089225769, -0.5352436304092407, -0.4964221119880676, -0.4576006233692169, -0.4187791347503662, -0.3799576461315155, -0.3411361575126648, -0.3023146688938141, -0.2634931802749634, -0.22467169165611267, -0.18585020303726196, -0.14702871441841125, -0.10820722579956055, -0.06938573718070984, -0.03056424856185913, 0.008257240056991577, 0.047078728675842285, 0.085900217294693, 0.1247217059135437, 0.1635431945323944, 0.20236468315124512, 0.24118617177009583, 0.28000766038894653, 0.31882914900779724, 0.35765063762664795, 0.39647212624549866, 0.43529361486434937, 0.4741151034832001, 0.5129365921020508, 0.5517580509185791, 0.5905795693397522, 0.6294010877609253, 0.6682225465774536, 0.7070440053939819, 0.745865523815155, 0.7846870422363281, 0.8235085010528564, 0.8623299598693848, 0.9011514782905579, 0.939972996711731, 0.9787944555282593, 1.0176159143447876, 1.0564374923706055, 1.0952589511871338, 1.134080410003662, 1.1729018688201904, 1.2117233276367188, 1.2505449056625366, 1.289366364479065, 1.3281878232955933, 1.3670094013214111, 1.4058308601379395, 1.4446523189544678]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 12.0, 10.0, 18.0, 21.0, 47.0, 133.0, 820.0, 19471.0, 51449104.0, 1349.0, 197.0, 92.0, 28.0, 24.0, 7.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.8125, -21.06201171875, -20.3115234375, -19.56103515625, -18.810546875, -18.06005859375, -17.3095703125, -16.55908203125, -15.80859375, -15.05810546875, -14.3076171875, -13.55712890625, -12.806640625, -12.05615234375, -11.3056640625, -10.55517578125, -9.8046875, -9.05419921875, -8.3037109375, -7.55322265625, -6.802734375, -6.05224609375, -5.3017578125, -4.55126953125, -3.80078125, -3.05029296875, -2.2998046875, -1.54931640625, -0.798828125, -0.04833984375, 0.7021484375, 1.45263671875, 2.203125, 2.95361328125, 3.7041015625, 4.45458984375, 5.205078125, 5.95556640625, 6.7060546875, 7.45654296875, 8.20703125, 8.95751953125, 9.7080078125, 10.45849609375, 11.208984375, 11.95947265625, 12.7099609375, 13.46044921875, 14.2109375, 14.96142578125, 15.7119140625, 16.46240234375, 17.212890625, 17.96337890625, 18.7138671875, 19.46435546875, 20.21484375, 20.96533203125, 21.7158203125, 22.46630859375, 23.216796875, 23.96728515625, 24.7177734375, 25.46826171875, 26.21875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 4.0, 14.0, 16.0, 27.0, 27.0, 46.0, 67.0, 106.0, 136.0, 216.0, 332.0, 475.0, 653.0, 1005.0, 1401.0, 2056.0, 3020.0, 4246.0, 6245.0, 9389.0, 14179.0, 21157.0, 33039.0, 52466.0, 83307.0, 134180.0, 213739.0, 327931.0, 474813.0, 3626868.0, 442617.0, 305854.0, 196876.0, 122663.0, 75747.0, 47256.0, 30178.0, 19444.0, 12973.0, 8435.0, 5811.0, 3864.0, 2613.0, 1829.0, 1249.0, 905.0, 644.0, 409.0, 265.0, 226.0, 127.0, 101.0, 70.0, 39.0, 37.0, 22.0, 6.0, 13.0, 6.0, 5.0, 2.0], "bins": [-0.295654296875, -0.2865333557128906, -0.27741241455078125, -0.2682914733886719, -0.2591705322265625, -0.2500495910644531, -0.24092864990234375, -0.23180770874023438, -0.222686767578125, -0.21356582641601562, -0.20444488525390625, -0.19532394409179688, -0.1862030029296875, -0.17708206176757812, -0.16796112060546875, -0.15884017944335938, -0.14971923828125, -0.14059829711914062, -0.13147735595703125, -0.12235641479492188, -0.1132354736328125, -0.10411453247070312, -0.09499359130859375, -0.08587265014648438, -0.076751708984375, -0.06763076782226562, -0.05850982666015625, -0.049388885498046875, -0.0402679443359375, -0.031147003173828125, -0.02202606201171875, -0.012905120849609375, -0.0037841796875, 0.005336761474609375, 0.01445770263671875, 0.023578643798828125, 0.0326995849609375, 0.041820526123046875, 0.05094146728515625, 0.060062408447265625, 0.069183349609375, 0.07830429077148438, 0.08742523193359375, 0.09654617309570312, 0.1056671142578125, 0.11478805541992188, 0.12390899658203125, 0.13302993774414062, 0.14215087890625, 0.15127182006835938, 0.16039276123046875, 0.16951370239257812, 0.1786346435546875, 0.18775558471679688, 0.19687652587890625, 0.20599746704101562, 0.215118408203125, 0.22423934936523438, 0.23336029052734375, 0.24248123168945312, 0.2516021728515625, 0.2607231140136719, 0.26984405517578125, 0.2789649963378906, 0.2880859375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 7.0, 19.0, 14.0, 16.0, 19.0, 16.0, 26.0, 26.0, 25.0, 26.0, 38.0, 38.0, 26.0, 38.0, 36.0, 43.0, 314.0, 774.0, 32.0, 41.0, 26.0, 32.0, 49.0, 47.0, 37.0, 25.0, 31.0, 36.0, 25.0, 23.0, 16.0, 8.0, 10.0, 12.0, 5.0, 11.0, 9.0, 9.0, 4.0, 2.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.7265625, -5.5533447265625, -5.380126953125, -5.2069091796875, -5.03369140625, -4.8604736328125, -4.687255859375, -4.5140380859375, -4.3408203125, -4.1676025390625, -3.994384765625, -3.8211669921875, -3.64794921875, -3.4747314453125, -3.301513671875, -3.1282958984375, -2.955078125, -2.7818603515625, -2.608642578125, -2.4354248046875, -2.26220703125, -2.0889892578125, -1.915771484375, -1.7425537109375, -1.5693359375, -1.3961181640625, -1.222900390625, -1.0496826171875, -0.87646484375, -0.7032470703125, -0.530029296875, -0.3568115234375, -0.18359375, -0.0103759765625, 0.162841796875, 0.3360595703125, 0.50927734375, 0.6824951171875, 0.855712890625, 1.0289306640625, 1.2021484375, 1.3753662109375, 1.548583984375, 1.7218017578125, 1.89501953125, 2.0682373046875, 2.241455078125, 2.4146728515625, 2.587890625, 2.7611083984375, 2.934326171875, 3.1075439453125, 3.28076171875, 3.4539794921875, 3.627197265625, 3.8004150390625, 3.9736328125, 4.1468505859375, 4.320068359375, 4.4932861328125, 4.66650390625, 4.8397216796875, 5.012939453125, 5.1861572265625, 5.359375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 9.0, 7.0, 25.0, 38.0, 40.0, 60.0, 128.0, 168.0, 241.0, 419.0, 539.0, 993.0, 1505.0, 2242.0, 3672.0, 5888.0, 9281.0, 15479.0, 26471.0, 45266.0, 80694.0, 148053.0, 272979.0, 473011.0, 3738840.0, 626932.0, 372236.0, 205549.0, 111690.0, 61973.0, 34641.0, 20394.0, 12218.0, 7405.0, 4487.0, 2822.0, 1798.0, 1145.0, 698.0, 491.0, 316.0, 195.0, 154.0, 91.0, 52.0, 37.0, 16.0, 11.0, 15.0, 10.0, 10.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.348876953125, -0.3378944396972656, -0.32691192626953125, -0.3159294128417969, -0.3049468994140625, -0.2939643859863281, -0.28298187255859375, -0.2719993591308594, -0.261016845703125, -0.2500343322753906, -0.23905181884765625, -0.22806930541992188, -0.2170867919921875, -0.20610427856445312, -0.19512176513671875, -0.18413925170898438, -0.17315673828125, -0.16217422485351562, -0.15119171142578125, -0.14020919799804688, -0.1292266845703125, -0.11824417114257812, -0.10726165771484375, -0.09627914428710938, -0.085296630859375, -0.07431411743164062, -0.06333160400390625, -0.052349090576171875, -0.0413665771484375, -0.030384063720703125, -0.01940155029296875, -0.008419036865234375, 0.0025634765625, 0.013545989990234375, 0.02452850341796875, 0.035511016845703125, 0.0464935302734375, 0.057476043701171875, 0.06845855712890625, 0.07944107055664062, 0.090423583984375, 0.10140609741210938, 0.11238861083984375, 0.12337112426757812, 0.1343536376953125, 0.14533615112304688, 0.15631866455078125, 0.16730117797851562, 0.17828369140625, 0.18926620483398438, 0.20024871826171875, 0.21123123168945312, 0.2222137451171875, 0.23319625854492188, 0.24417877197265625, 0.2551612854003906, 0.266143798828125, 0.2771263122558594, 0.28810882568359375, 0.2990913391113281, 0.3100738525390625, 0.3210563659667969, 0.33203887939453125, 0.3430213928222656, 0.35400390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 4.0, 4.0, 5.0, 5.0, 7.0, 8.0, 7.0, 12.0, 21.0, 15.0, 16.0, 19.0, 21.0, 18.0, 28.0, 31.0, 28.0, 35.0, 33.0, 35.0, 42.0, 34.0, 46.0, 1026.0, 82.0, 38.0, 43.0, 37.0, 24.0, 31.0, 40.0, 39.0, 28.0, 26.0, 23.0, 15.0, 20.0, 18.0, 12.0, 9.0, 9.0, 11.0, 7.0, 8.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.9296875, -4.77374267578125, -4.6177978515625, -4.46185302734375, -4.305908203125, -4.14996337890625, -3.9940185546875, -3.83807373046875, -3.68212890625, -3.52618408203125, -3.3702392578125, -3.21429443359375, -3.058349609375, -2.90240478515625, -2.7464599609375, -2.59051513671875, -2.4345703125, -2.27862548828125, -2.1226806640625, -1.96673583984375, -1.810791015625, -1.65484619140625, -1.4989013671875, -1.34295654296875, -1.18701171875, -1.03106689453125, -0.8751220703125, -0.71917724609375, -0.563232421875, -0.40728759765625, -0.2513427734375, -0.09539794921875, 0.060546875, 0.21649169921875, 0.3724365234375, 0.52838134765625, 0.684326171875, 0.84027099609375, 0.9962158203125, 1.15216064453125, 1.30810546875, 1.46405029296875, 1.6199951171875, 1.77593994140625, 1.931884765625, 2.08782958984375, 2.2437744140625, 2.39971923828125, 2.5556640625, 2.71160888671875, 2.8675537109375, 3.02349853515625, 3.179443359375, 3.33538818359375, 3.4913330078125, 3.64727783203125, 3.80322265625, 3.95916748046875, 4.1151123046875, 4.27105712890625, 4.427001953125, 4.58294677734375, 4.7388916015625, 4.89483642578125, 5.05078125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 6.0, 6.0, 12.0, 16.0, 25.0, 38.0, 53.0, 79.0, 106.0, 195.0, 240.0, 395.0, 639.0, 1030.0, 1763.0, 3285.0, 6345.0, 12765.0, 26945.0, 63537.0, 169643.0, 525290.0, 4307596.0, 766840.0, 246805.0, 88013.0, 35863.0, 16332.0, 7939.0, 4121.0, 2241.0, 1249.0, 720.0, 454.0, 267.0, 178.0, 126.0, 78.0, 60.0, 32.0, 33.0, 20.0, 14.0, 11.0, 13.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.72119140625, -0.7009735107421875, -0.680755615234375, -0.6605377197265625, -0.64031982421875, -0.6201019287109375, -0.599884033203125, -0.5796661376953125, -0.5594482421875, -0.5392303466796875, -0.519012451171875, -0.4987945556640625, -0.47857666015625, -0.4583587646484375, -0.438140869140625, -0.4179229736328125, -0.397705078125, -0.3774871826171875, -0.357269287109375, -0.3370513916015625, -0.31683349609375, -0.2966156005859375, -0.276397705078125, -0.2561798095703125, -0.2359619140625, -0.2157440185546875, -0.195526123046875, -0.1753082275390625, -0.15509033203125, -0.1348724365234375, -0.114654541015625, -0.0944366455078125, -0.07421875, -0.0540008544921875, -0.033782958984375, -0.0135650634765625, 0.00665283203125, 0.0268707275390625, 0.047088623046875, 0.0673065185546875, 0.0875244140625, 0.1077423095703125, 0.127960205078125, 0.1481781005859375, 0.16839599609375, 0.1886138916015625, 0.208831787109375, 0.2290496826171875, 0.249267578125, 0.2694854736328125, 0.289703369140625, 0.3099212646484375, 0.33013916015625, 0.3503570556640625, 0.370574951171875, 0.3907928466796875, 0.4110107421875, 0.4312286376953125, 0.451446533203125, 0.4716644287109375, 0.49188232421875, 0.5121002197265625, 0.532318115234375, 0.5525360107421875, 0.57275390625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 3.0, 12.0, 12.0, 19.0, 9.0, 19.0, 18.0, 26.0, 34.0, 35.0, 39.0, 26.0, 49.0, 46.0, 49.0, 57.0, 1056.0, 76.0, 61.0, 44.0, 36.0, 47.0, 32.0, 39.0, 29.0, 20.0, 25.0, 17.0, 21.0, 16.0, 9.0, 7.0, 5.0, 9.0, 3.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.2734375, -6.101806640625, -5.93017578125, -5.758544921875, -5.5869140625, -5.415283203125, -5.24365234375, -5.072021484375, -4.900390625, -4.728759765625, -4.55712890625, -4.385498046875, -4.2138671875, -4.042236328125, -3.87060546875, -3.698974609375, -3.52734375, -3.355712890625, -3.18408203125, -3.012451171875, -2.8408203125, -2.669189453125, -2.49755859375, -2.325927734375, -2.154296875, -1.982666015625, -1.81103515625, -1.639404296875, -1.4677734375, -1.296142578125, -1.12451171875, -0.952880859375, -0.78125, -0.609619140625, -0.43798828125, -0.266357421875, -0.0947265625, 0.076904296875, 0.24853515625, 0.420166015625, 0.591796875, 0.763427734375, 0.93505859375, 1.106689453125, 1.2783203125, 1.449951171875, 1.62158203125, 1.793212890625, 1.96484375, 2.136474609375, 2.30810546875, 2.479736328125, 2.6513671875, 2.822998046875, 2.99462890625, 3.166259765625, 3.337890625, 3.509521484375, 3.68115234375, 3.852783203125, 4.0244140625, 4.196044921875, 4.36767578125, 4.539306640625, 4.7109375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 9.0, 6.0, 12.0, 28.0, 52.0, 125.0, 234.0, 248.0, 123.0, 66.0, 35.0, 23.0, 20.0, 8.0, 2.0, 7.0, 4.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3906078338623047, -2.1903767585754395, -1.9901455640792847, -1.7899144887924194, -1.5896832942962646, -1.3894522190093994, -1.1892211437225342, -0.9889899492263794, -0.7887588739395142, -0.5885277390480042, -0.38829663395881653, -0.1880655288696289, 0.012165606021881104, 0.2123967409133911, 0.41262781620025635, 0.6128590106964111, 0.8130900859832764, 1.0133211612701416, 1.2135523557662964, 1.4137834310531616, 1.6140146255493164, 1.8142457008361816, 2.014476776123047, 2.214707851409912, 2.4149389266967773, 2.6151700019836426, 2.815401077270508, 3.015632152557373, 3.2158634662628174, 3.4160945415496826, 3.616325616836548, 3.816556930541992, 4.016788005828857, 4.217019081115723, 4.417250156402588, 4.617481231689453, 4.817712306976318, 5.017943382263184, 5.218174934387207, 5.418406009674072, 5.6186370849609375, 5.818868160247803, 6.019099235534668, 6.219330310821533, 6.419561386108398, 6.619792938232422, 6.820023536682129, 7.020255088806152, 7.220485687255859, 7.420716762542725, 7.62094783782959, 7.821178913116455, 8.02140998840332, 8.221641540527344, 8.42187213897705, 8.622103691101074, 8.822335243225098, 9.022566795349121, 9.222797393798828, 9.423028945922852, 9.623259544372559, 9.823491096496582, 10.023721694946289, 10.223953247070312, 10.42418384552002]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 8.0, 7.0, 15.0, 17.0, 22.0, 38.0, 38.0, 38.0, 53.0, 63.0, 62.0, 55.0, 73.0, 84.0, 52.0, 56.0, 61.0, 54.0, 46.0, 40.0, 35.0, 25.0, 19.0, 9.0, 15.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.291414260864258, -8.857199668884277, -8.422985076904297, -7.988770484924316, -7.554555892944336, -7.1203413009643555, -6.686126708984375, -6.2519121170043945, -5.817697525024414, -5.383482933044434, -4.949268341064453, -4.515053749084473, -4.080839157104492, -3.646624803543091, -3.2124102115631104, -2.77819561958313, -2.3439812660217285, -1.909766674041748, -1.4755520820617676, -1.0413376092910767, -0.6071230173110962, -0.17290854454040527, 0.2613060474395752, 0.6955206394195557, 1.1297352313995361, 1.5639498233795166, 1.998164415359497, 2.4323787689208984, 2.866593360900879, 3.3008079528808594, 3.73502254486084, 4.16923713684082, 4.603451728820801, 5.037666320800781, 5.471880912780762, 5.906095504760742, 6.340310096740723, 6.774524688720703, 7.208739280700684, 7.642953872680664, 8.077168464660645, 8.511383056640625, 8.945597648620605, 9.379812240600586, 9.814026832580566, 10.248241424560547, 10.682456016540527, 11.116670608520508, 11.550884246826172, 11.985098838806152, 12.419313430786133, 12.853528022766113, 13.287742614746094, 13.721957206726074, 14.156171798706055, 14.590386390686035, 15.024600982666016, 15.458815574645996, 15.893030166625977, 16.32724380493164, 16.761459350585938, 17.1956729888916, 17.6298885345459, 18.064102172851562, 18.49831771850586]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 9.0, 11.0, 9.0, 18.0, 26.0, 44.0, 84.0, 237.0, 721.0, 2149.0, 8179.0, 37161.0, 1675566.0, 2421822.0, 35888.0, 8155.0, 2291.0, 827.0, 323.0, 197.0, 137.0, 108.0, 96.0, 61.0, 42.0, 42.0, 29.0, 21.0, 17.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.260009765625, -0.24473190307617188, -0.22945404052734375, -0.21417617797851562, -0.1988983154296875, -0.18362045288085938, -0.16834259033203125, -0.15306472778320312, -0.137786865234375, -0.12250900268554688, -0.10723114013671875, -0.09195327758789062, -0.0766754150390625, -0.061397552490234375, -0.04611968994140625, -0.030841827392578125, -0.01556396484375, -0.000286102294921875, 0.01499176025390625, 0.030269622802734375, 0.0455474853515625, 0.060825347900390625, 0.07610321044921875, 0.09138107299804688, 0.106658935546875, 0.12193679809570312, 0.13721466064453125, 0.15249252319335938, 0.1677703857421875, 0.18304824829101562, 0.19832611083984375, 0.21360397338867188, 0.2288818359375, 0.24415969848632812, 0.25943756103515625, 0.2747154235839844, 0.2899932861328125, 0.3052711486816406, 0.32054901123046875, 0.3358268737792969, 0.351104736328125, 0.3663825988769531, 0.38166046142578125, 0.3969383239746094, 0.4122161865234375, 0.4274940490722656, 0.44277191162109375, 0.4580497741699219, 0.47332763671875, 0.4886054992675781, 0.5038833618164062, 0.5191612243652344, 0.5344390869140625, 0.5497169494628906, 0.5649948120117188, 0.5802726745605469, 0.595550537109375, 0.6108283996582031, 0.6261062622070312, 0.6413841247558594, 0.6566619873046875, 0.6719398498535156, 0.6872177124023438, 0.7024955749511719, 0.7177734375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 9.0, 20.0, 26.0, 32.0, 33.0, 68.0, 100.0, 97.0, 116.0, 108.0, 81.0, 96.0, 61.0, 43.0, 25.0, 25.0, 19.0, 9.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058349609375, -0.054920196533203125, -0.05149078369140625, -0.048061370849609375, -0.0446319580078125, -0.041202545166015625, -0.03777313232421875, -0.034343719482421875, -0.030914306640625, -0.027484893798828125, -0.02405548095703125, -0.020626068115234375, -0.0171966552734375, -0.013767242431640625, -0.01033782958984375, -0.006908416748046875, -0.00347900390625, -4.9591064453125e-05, 0.00337982177734375, 0.006809234619140625, 0.0102386474609375, 0.013668060302734375, 0.01709747314453125, 0.020526885986328125, 0.023956298828125, 0.027385711669921875, 0.03081512451171875, 0.034244537353515625, 0.0376739501953125, 0.041103363037109375, 0.04453277587890625, 0.047962188720703125, 0.0513916015625, 0.054821014404296875, 0.05825042724609375, 0.061679840087890625, 0.0651092529296875, 0.06853866577148438, 0.07196807861328125, 0.07539749145507812, 0.078826904296875, 0.08225631713867188, 0.08568572998046875, 0.08911514282226562, 0.0925445556640625, 0.09597396850585938, 0.09940338134765625, 0.10283279418945312, 0.10626220703125, 0.10969161987304688, 0.11312103271484375, 0.11655044555664062, 0.1199798583984375, 0.12340927124023438, 0.12683868408203125, 0.13026809692382812, 0.133697509765625, 0.13712692260742188, 0.14055633544921875, 0.14398574829101562, 0.1474151611328125, 0.15084457397460938, 0.15427398681640625, 0.15770339965820312, 0.1611328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 5.0, 10.0, 7.0, 9.0, 11.0, 13.0, 10.0, 39.0, 60.0, 112.0, 390.0, 5389.0, 4146810.0, 40203.0, 748.0, 145.0, 68.0, 59.0, 33.0, 20.0, 22.0, 18.0, 16.0, 9.0, 15.0, 12.0, 8.0, 7.0, 2.0, 11.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.304931640625, -0.2902030944824219, -0.27547454833984375, -0.2607460021972656, -0.2460174560546875, -0.23128890991210938, -0.21656036376953125, -0.20183181762695312, -0.187103271484375, -0.17237472534179688, -0.15764617919921875, -0.14291763305664062, -0.1281890869140625, -0.11346054077148438, -0.09873199462890625, -0.08400344848632812, -0.06927490234375, -0.054546356201171875, -0.03981781005859375, -0.025089263916015625, -0.0103607177734375, 0.004367828369140625, 0.01909637451171875, 0.033824920654296875, 0.048553466796875, 0.06328201293945312, 0.07801055908203125, 0.09273910522460938, 0.1074676513671875, 0.12219619750976562, 0.13692474365234375, 0.15165328979492188, 0.1663818359375, 0.18111038208007812, 0.19583892822265625, 0.21056747436523438, 0.2252960205078125, 0.24002456665039062, 0.25475311279296875, 0.2694816589355469, 0.284210205078125, 0.2989387512207031, 0.31366729736328125, 0.3283958435058594, 0.3431243896484375, 0.3578529357910156, 0.37258148193359375, 0.3873100280761719, 0.40203857421875, 0.4167671203613281, 0.43149566650390625, 0.4462242126464844, 0.4609527587890625, 0.4756813049316406, 0.49040985107421875, 0.5051383972167969, 0.519866943359375, 0.5345954895019531, 0.5493240356445312, 0.5640525817871094, 0.5787811279296875, 0.5935096740722656, 0.6082382202148438, 0.6229667663574219, 0.6376953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 6.0, 8.0, 7.0, 13.0, 7.0, 9.0, 9.0, 16.0, 13.0, 15.0, 21.0, 33.0, 34.0, 52.0, 83.0, 127.0, 280.0, 1000.0, 1478.0, 431.0, 176.0, 91.0, 53.0, 29.0, 15.0, 13.0, 12.0, 6.0, 9.0, 5.0, 5.0, 5.0, 7.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0], "bins": [-0.15771484375, -0.15405941009521484, -0.1504039764404297, -0.14674854278564453, -0.14309310913085938, -0.13943767547607422, -0.13578224182128906, -0.1321268081665039, -0.12847137451171875, -0.1248159408569336, -0.12116050720214844, -0.11750507354736328, -0.11384963989257812, -0.11019420623779297, -0.10653877258300781, -0.10288333892822266, -0.0992279052734375, -0.09557247161865234, -0.09191703796386719, -0.08826160430908203, -0.08460617065429688, -0.08095073699951172, -0.07729530334472656, -0.0736398696899414, -0.06998443603515625, -0.0663290023803711, -0.06267356872558594, -0.05901813507080078, -0.055362701416015625, -0.05170726776123047, -0.04805183410644531, -0.044396400451660156, -0.040740966796875, -0.037085533142089844, -0.03343009948730469, -0.02977466583251953, -0.026119232177734375, -0.02246379852294922, -0.018808364868164062, -0.015152931213378906, -0.01149749755859375, -0.007842063903808594, -0.0041866302490234375, -0.0005311965942382812, 0.003124237060546875, 0.006779670715332031, 0.010435104370117188, 0.014090538024902344, 0.0177459716796875, 0.021401405334472656, 0.025056838989257812, 0.02871227264404297, 0.032367706298828125, 0.03602313995361328, 0.03967857360839844, 0.043334007263183594, 0.04698944091796875, 0.050644874572753906, 0.05430030822753906, 0.05795574188232422, 0.061611175537109375, 0.06526660919189453, 0.06892204284667969, 0.07257747650146484, 0.07623291015625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 67.0, 943.0, 8.0, 1.0], "bins": [-10.233671188354492, -10.066451072692871, -9.89923095703125, -9.732009887695312, -9.564789772033691, -9.39756965637207, -9.23034954071045, -9.063129425048828, -8.89590835571289, -8.72868824005127, -8.561468124389648, -8.394247055053711, -8.22702693939209, -8.059806823730469, -7.892586708068848, -7.725366115570068, -7.558145999908447, -7.390925884246826, -7.223705291748047, -7.056485176086426, -6.8892645835876465, -6.722044467926025, -6.554823875427246, -6.387603759765625, -6.220383644104004, -6.053163528442383, -5.8859429359436035, -5.718722820281982, -5.551502227783203, -5.384282112121582, -5.217061996459961, -5.049841403961182, -4.882620811462402, -4.715400695800781, -4.548180103302002, -4.380959987640381, -4.213739395141602, -4.0465192794799805, -3.8792989253997803, -3.71207857131958, -3.544858455657959, -3.377638101577759, -3.2104177474975586, -3.0431976318359375, -2.875977039337158, -2.708756923675537, -2.541536569595337, -2.3743162155151367, -2.2070958614349365, -2.0398755073547363, -1.8726551532745361, -1.7054349184036255, -1.5382145643234253, -1.370994210243225, -1.2037739753723145, -1.0365536212921143, -0.8693332672119141, -0.7021129131317139, -0.5348926186561584, -0.367672324180603, -0.20045197010040283, -0.03323161602020264, 0.133988618850708, 0.3012089729309082, 0.4684293270111084]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 13.0, 8.0, 10.0, 24.0, 32.0, 31.0, 47.0, 64.0, 68.0, 62.0, 77.0, 70.0, 68.0, 74.0, 71.0, 64.0, 57.0, 27.0, 35.0, 35.0, 18.0, 12.0, 14.0, 12.0, 5.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9026329517364502, -0.8802474737167358, -0.8578620553016663, -0.8354765772819519, -0.8130910992622375, -0.790705680847168, -0.7683202028274536, -0.7459347248077393, -0.7235493063926697, -0.7011638283729553, -0.6787784099578857, -0.6563929319381714, -0.634007453918457, -0.6116220355033875, -0.5892365574836731, -0.5668511390686035, -0.5444656610488892, -0.5220801830291748, -0.49969473481178284, -0.47730928659439087, -0.4549238383769989, -0.43253839015960693, -0.4101529121398926, -0.3877674639225006, -0.36538195610046387, -0.3429965078830719, -0.32061102986335754, -0.2982255816459656, -0.2758401334285736, -0.25345468521118164, -0.23106920719146729, -0.20868375897407532, -0.18629831075668335, -0.1639128476381302, -0.14152739942073822, -0.11914193630218506, -0.0967564806342125, -0.07437102496623993, -0.05198556184768677, -0.0296001136302948, -0.007214650511741638, 0.015170807018876076, 0.03755626454949379, 0.05994172394275665, 0.08232717961072922, 0.10471263527870178, 0.12709809839725494, 0.1494835466146469, 0.17186900973320007, 0.19425447285175323, 0.2166399210691452, 0.23902538418769836, 0.26141083240509033, 0.2837963104248047, 0.30618175864219666, 0.3285672068595886, 0.350952684879303, 0.37333813309669495, 0.3957236111164093, 0.41810905933380127, 0.44049450755119324, 0.4628799557685852, 0.48526543378829956, 0.5076508522033691, 0.5300363302230835]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 9.0, 15.0, 20.0, 37.0, 69.0, 141.0, 278.0, 758.0, 1971.0, 8253.0, 739466.0, 287015.0, 7374.0, 1865.0, 656.0, 279.0, 138.0, 80.0, 38.0, 25.0, 14.0, 11.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.9599609375, -1.914337158203125, -1.86871337890625, -1.823089599609375, -1.7774658203125, -1.731842041015625, -1.68621826171875, -1.640594482421875, -1.594970703125, -1.549346923828125, -1.50372314453125, -1.458099365234375, -1.4124755859375, -1.366851806640625, -1.32122802734375, -1.275604248046875, -1.22998046875, -1.184356689453125, -1.13873291015625, -1.093109130859375, -1.0474853515625, -1.001861572265625, -0.95623779296875, -0.910614013671875, -0.864990234375, -0.819366455078125, -0.77374267578125, -0.728118896484375, -0.6824951171875, -0.636871337890625, -0.59124755859375, -0.545623779296875, -0.5, -0.454376220703125, -0.40875244140625, -0.363128662109375, -0.3175048828125, -0.271881103515625, -0.22625732421875, -0.180633544921875, -0.135009765625, -0.089385986328125, -0.04376220703125, 0.001861572265625, 0.0474853515625, 0.093109130859375, 0.13873291015625, 0.184356689453125, 0.22998046875, 0.275604248046875, 0.32122802734375, 0.366851806640625, 0.4124755859375, 0.458099365234375, 0.50372314453125, 0.549346923828125, 0.594970703125, 0.640594482421875, 0.68621826171875, 0.731842041015625, 0.7774658203125, 0.823089599609375, 0.86871337890625, 0.914337158203125, 0.9599609375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 3.0, 7.0, 15.0, 17.0, 27.0, 29.0, 54.0, 83.0, 103.0, 107.0, 132.0, 95.0, 102.0, 73.0, 42.0, 30.0, 35.0, 15.0, 15.0, 7.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06396484375, -0.0603179931640625, -0.056671142578125, -0.0530242919921875, -0.04937744140625, -0.0457305908203125, -0.042083740234375, -0.0384368896484375, -0.0347900390625, -0.0311431884765625, -0.027496337890625, -0.0238494873046875, -0.02020263671875, -0.0165557861328125, -0.012908935546875, -0.0092620849609375, -0.005615234375, -0.0019683837890625, 0.001678466796875, 0.0053253173828125, 0.00897216796875, 0.0126190185546875, 0.016265869140625, 0.0199127197265625, 0.0235595703125, 0.0272064208984375, 0.030853271484375, 0.0345001220703125, 0.03814697265625, 0.0417938232421875, 0.045440673828125, 0.0490875244140625, 0.052734375, 0.0563812255859375, 0.060028076171875, 0.0636749267578125, 0.06732177734375, 0.0709686279296875, 0.074615478515625, 0.0782623291015625, 0.0819091796875, 0.0855560302734375, 0.089202880859375, 0.0928497314453125, 0.09649658203125, 0.1001434326171875, 0.103790283203125, 0.1074371337890625, 0.111083984375, 0.1147308349609375, 0.118377685546875, 0.1220245361328125, 0.12567138671875, 0.1293182373046875, 0.132965087890625, 0.1366119384765625, 0.1402587890625, 0.1439056396484375, 0.147552490234375, 0.1511993408203125, 0.15484619140625, 0.1584930419921875, 0.162139892578125, 0.1657867431640625, 0.16943359375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 7.0, 6.0, 5.0, 6.0, 13.0, 15.0, 13.0, 22.0, 18.0, 30.0, 50.0, 59.0, 67.0, 105.0, 230.0, 404.0, 915.0, 2115.0, 5757.0, 17983.0, 73392.0, 488720.0, 374095.0, 60308.0, 15561.0, 5077.0, 1845.0, 794.0, 341.0, 226.0, 107.0, 57.0, 53.0, 32.0, 33.0, 18.0, 17.0, 15.0, 14.0, 7.0, 9.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1617431640625, -0.1568317413330078, -0.15192031860351562, -0.14700889587402344, -0.14209747314453125, -0.13718605041503906, -0.13227462768554688, -0.1273632049560547, -0.1224517822265625, -0.11754035949707031, -0.11262893676757812, -0.10771751403808594, -0.10280609130859375, -0.09789466857910156, -0.09298324584960938, -0.08807182312011719, -0.083160400390625, -0.07824897766113281, -0.07333755493164062, -0.06842613220214844, -0.06351470947265625, -0.05860328674316406, -0.053691864013671875, -0.04878044128417969, -0.0438690185546875, -0.03895759582519531, -0.034046173095703125, -0.029134750366210938, -0.02422332763671875, -0.019311904907226562, -0.014400482177734375, -0.009489059448242188, -0.00457763671875, 0.0003337860107421875, 0.005245208740234375, 0.010156631469726562, 0.01506805419921875, 0.019979476928710938, 0.024890899658203125, 0.029802322387695312, 0.0347137451171875, 0.03962516784667969, 0.044536590576171875, 0.04944801330566406, 0.05435943603515625, 0.05927085876464844, 0.06418228149414062, 0.06909370422363281, 0.074005126953125, 0.07891654968261719, 0.08382797241210938, 0.08873939514160156, 0.09365081787109375, 0.09856224060058594, 0.10347366333007812, 0.10838508605957031, 0.1132965087890625, 0.11820793151855469, 0.12311935424804688, 0.12803077697753906, 0.13294219970703125, 0.13785362243652344, 0.14276504516601562, 0.1476764678955078, 0.152587890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 5.0, 15.0, 9.0, 9.0, 19.0, 17.0, 19.0, 20.0, 16.0, 29.0, 32.0, 33.0, 22.0, 40.0, 44.0, 40.0, 47.0, 39.0, 45.0, 51.0, 40.0, 34.0, 37.0, 32.0, 44.0, 25.0, 22.0, 39.0, 26.0, 26.0, 14.0, 15.0, 24.0, 8.0, 6.0, 9.0, 6.0, 5.0, 10.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1234130859375, -0.11910629272460938, -0.11479949951171875, -0.11049270629882812, -0.1061859130859375, -0.10187911987304688, -0.09757232666015625, -0.09326553344726562, -0.088958740234375, -0.08465194702148438, -0.08034515380859375, -0.07603836059570312, -0.0717315673828125, -0.06742477416992188, -0.06311798095703125, -0.058811187744140625, -0.05450439453125, -0.050197601318359375, -0.04589080810546875, -0.041584014892578125, -0.0372772216796875, -0.032970428466796875, -0.02866363525390625, -0.024356842041015625, -0.020050048828125, -0.015743255615234375, -0.01143646240234375, -0.007129669189453125, -0.0028228759765625, 0.001483917236328125, 0.00579071044921875, 0.010097503662109375, 0.014404296875, 0.018711090087890625, 0.02301788330078125, 0.027324676513671875, 0.0316314697265625, 0.035938262939453125, 0.04024505615234375, 0.044551849365234375, 0.048858642578125, 0.053165435791015625, 0.05747222900390625, 0.061779022216796875, 0.0660858154296875, 0.07039260864257812, 0.07469940185546875, 0.07900619506835938, 0.08331298828125, 0.08761978149414062, 0.09192657470703125, 0.09623336791992188, 0.1005401611328125, 0.10484695434570312, 0.10915374755859375, 0.11346054077148438, 0.117767333984375, 0.12207412719726562, 0.12638092041015625, 0.13068771362304688, 0.1349945068359375, 0.13930130004882812, 0.14360809326171875, 0.14791488647460938, 0.1522216796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 8.0, 13.0, 18.0, 21.0, 24.0, 52.0, 54.0, 80.0, 149.0, 241.0, 420.0, 740.0, 1323.0, 2695.0, 5537.0, 13926.0, 59414.0, 859553.0, 76041.0, 15765.0, 6125.0, 2876.0, 1464.0, 821.0, 432.0, 282.0, 156.0, 98.0, 60.0, 45.0, 27.0, 18.0, 14.0, 10.0, 9.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.056396484375, -0.0545506477355957, -0.052704811096191406, -0.05085897445678711, -0.04901313781738281, -0.047167301177978516, -0.04532146453857422, -0.04347562789916992, -0.041629791259765625, -0.03978395462036133, -0.03793811798095703, -0.036092281341552734, -0.03424644470214844, -0.03240060806274414, -0.030554771423339844, -0.028708934783935547, -0.02686309814453125, -0.025017261505126953, -0.023171424865722656, -0.02132558822631836, -0.019479751586914062, -0.017633914947509766, -0.01578807830810547, -0.013942241668701172, -0.012096405029296875, -0.010250568389892578, -0.008404731750488281, -0.006558895111083984, -0.0047130584716796875, -0.0028672218322753906, -0.0010213851928710938, 0.0008244514465332031, 0.0026702880859375, 0.004516124725341797, 0.006361961364746094, 0.00820779800415039, 0.010053634643554688, 0.011899471282958984, 0.013745307922363281, 0.015591144561767578, 0.017436981201171875, 0.019282817840576172, 0.02112865447998047, 0.022974491119384766, 0.024820327758789062, 0.02666616439819336, 0.028512001037597656, 0.030357837677001953, 0.03220367431640625, 0.03404951095581055, 0.035895347595214844, 0.03774118423461914, 0.03958702087402344, 0.041432857513427734, 0.04327869415283203, 0.04512453079223633, 0.046970367431640625, 0.04881620407104492, 0.05066204071044922, 0.052507877349853516, 0.05435371398925781, 0.05619955062866211, 0.058045387268066406, 0.0598912239074707, 0.061737060546875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 9.0, 13.0, 128.0, 471.0, 293.0, 49.0, 11.0, 2.0, 4.0, 2.0, 1.0, 6.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5616416931152344e-05, -1.5032477676868439e-05, -1.4448538422584534e-05, -1.3864599168300629e-05, -1.3280659914016724e-05, -1.2696720659732819e-05, -1.2112781405448914e-05, -1.1528842151165009e-05, -1.0944902896881104e-05, -1.0360963642597198e-05, -9.777024388313293e-06, -9.193085134029388e-06, -8.609145879745483e-06, -8.025206625461578e-06, -7.441267371177673e-06, -6.857328116893768e-06, -6.273388862609863e-06, -5.689449608325958e-06, -5.105510354042053e-06, -4.521571099758148e-06, -3.937631845474243e-06, -3.353692591190338e-06, -2.769753336906433e-06, -2.185814082622528e-06, -1.601874828338623e-06, -1.017935574054718e-06, -4.33996319770813e-07, 1.4994293451309204e-07, 7.338821887969971e-07, 1.317821443080902e-06, 1.9017606973648071e-06, 2.485699951648712e-06, 3.069639205932617e-06, 3.6535784602165222e-06, 4.237517714500427e-06, 4.821456968784332e-06, 5.405396223068237e-06, 5.989335477352142e-06, 6.573274731636047e-06, 7.157213985919952e-06, 7.741153240203857e-06, 8.325092494487762e-06, 8.909031748771667e-06, 9.492971003055573e-06, 1.0076910257339478e-05, 1.0660849511623383e-05, 1.1244788765907288e-05, 1.1828728020191193e-05, 1.2412667274475098e-05, 1.2996606528759003e-05, 1.3580545783042908e-05, 1.4164485037326813e-05, 1.4748424291610718e-05, 1.5332363545894623e-05, 1.5916302800178528e-05, 1.6500242054462433e-05, 1.7084181308746338e-05, 1.7668120563030243e-05, 1.8252059817314148e-05, 1.8835999071598053e-05, 1.9419938325881958e-05, 2.0003877580165863e-05, 2.0587816834449768e-05, 2.1171756088733673e-05, 2.1755695343017578e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 9.0, 13.0, 29.0, 101.0, 376.0, 2002.0, 16393.0, 959578.0, 63984.0, 5022.0, 782.0, 151.0, 55.0, 17.0, 7.0, 7.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1646728515625, -0.1587352752685547, -0.15279769897460938, -0.14686012268066406, -0.14092254638671875, -0.13498497009277344, -0.12904739379882812, -0.12310981750488281, -0.1171722412109375, -0.11123466491699219, -0.10529708862304688, -0.09935951232910156, -0.09342193603515625, -0.08748435974121094, -0.08154678344726562, -0.07560920715332031, -0.069671630859375, -0.06373405456542969, -0.057796478271484375, -0.05185890197753906, -0.04592132568359375, -0.03998374938964844, -0.034046173095703125, -0.028108596801757812, -0.0221710205078125, -0.016233444213867188, -0.010295867919921875, -0.0043582916259765625, 0.00157928466796875, 0.0075168609619140625, 0.013454437255859375, 0.019392013549804688, 0.02532958984375, 0.03126716613769531, 0.037204742431640625, 0.04314231872558594, 0.04907989501953125, 0.05501747131347656, 0.060955047607421875, 0.06689262390136719, 0.0728302001953125, 0.07876777648925781, 0.08470535278320312, 0.09064292907714844, 0.09658050537109375, 0.10251808166503906, 0.10845565795898438, 0.11439323425292969, 0.120330810546875, 0.1262683868408203, 0.13220596313476562, 0.13814353942871094, 0.14408111572265625, 0.15001869201660156, 0.15595626831054688, 0.1618938446044922, 0.1678314208984375, 0.1737689971923828, 0.17970657348632812, 0.18564414978027344, 0.19158172607421875, 0.19751930236816406, 0.20345687866210938, 0.2093944549560547, 0.21533203125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 9.0, 6.0, 11.0, 29.0, 27.0, 60.0, 160.0, 309.0, 183.0, 88.0, 41.0, 21.0, 9.0, 10.0, 6.0, 1.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.15946483612060547, -0.15511131286621094, -0.1507577896118164, -0.14640426635742188, -0.14205074310302734, -0.1376972198486328, -0.13334369659423828, -0.12899017333984375, -0.12463665008544922, -0.12028312683105469, -0.11592960357666016, -0.11157608032226562, -0.1072225570678711, -0.10286903381347656, -0.09851551055908203, -0.0941619873046875, -0.08980846405029297, -0.08545494079589844, -0.0811014175415039, -0.07674789428710938, -0.07239437103271484, -0.06804084777832031, -0.06368732452392578, -0.05933380126953125, -0.05498027801513672, -0.05062675476074219, -0.046273231506347656, -0.041919708251953125, -0.037566184997558594, -0.03321266174316406, -0.02885913848876953, -0.024505615234375, -0.02015209197998047, -0.015798568725585938, -0.011445045471191406, -0.007091522216796875, -0.0027379989624023438, 0.0016155242919921875, 0.005969047546386719, 0.01032257080078125, 0.014676094055175781, 0.019029617309570312, 0.023383140563964844, 0.027736663818359375, 0.032090187072753906, 0.03644371032714844, 0.04079723358154297, 0.0451507568359375, 0.04950428009033203, 0.05385780334472656, 0.058211326599121094, 0.06256484985351562, 0.06691837310791016, 0.07127189636230469, 0.07562541961669922, 0.07997894287109375, 0.08433246612548828, 0.08868598937988281, 0.09303951263427734, 0.09739303588867188, 0.1017465591430664, 0.10610008239746094, 0.11045360565185547, 0.11480712890625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [4.0, 8.0, 27.0, 82.0, 361.0, 357.0, 116.0, 42.0, 11.0, 8.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32920947670936584, -0.26328980922698975, -0.19737014174461365, -0.13145047426223755, -0.06553080677986145, 0.00038886070251464844, 0.06630852818489075, 0.13222819566726685, 0.19814786314964294, 0.26406753063201904, 0.32998719811439514, 0.39590686559677124, 0.46182653307914734, 0.5277462005615234, 0.5936658382415771, 0.6595855355262756, 0.7255052328109741, 0.7914248704910278, 0.8573445677757263, 0.9232642650604248, 0.9891839027404785, 1.0551035404205322, 1.121023178100586, 1.1869429349899292, 1.252862572669983, 1.3187822103500366, 1.3847019672393799, 1.4506216049194336, 1.5165412425994873, 1.582460880279541, 1.6483805179595947, 1.714300274848938, 1.7802197933197021, 1.8461394309997559, 1.9120590686798096, 1.9779788255691528, 2.043898582458496, 2.10981822013855, 2.1757378578186035, 2.2416574954986572, 2.307577133178711, 2.3734967708587646, 2.4394164085388184, 2.505336046218872, 2.571255683898926, 2.6371755599975586, 2.7030951976776123, 2.769014835357666, 2.8349344730377197, 2.9008541107177734, 2.966773748397827, 3.032693386077881, 3.0986132621765137, 3.1645328998565674, 3.230452537536621, 3.296372175216675, 3.3622918128967285, 3.4282114505767822, 3.494131088256836, 3.5600507259368896, 3.6259703636169434, 3.691890239715576, 3.75780987739563, 3.8237295150756836, 3.8896491527557373]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 11.0, 8.0, 8.0, 12.0, 16.0, 22.0, 16.0, 22.0, 27.0, 24.0, 28.0, 34.0, 44.0, 26.0, 48.0, 62.0, 37.0, 41.0, 44.0, 38.0, 45.0, 41.0, 42.0, 43.0, 36.0, 31.0, 30.0, 18.0, 25.0, 19.0, 20.0, 11.0, 14.0, 14.0, 7.0, 11.0, 3.0, 6.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8024653792381287, -0.7776053547859192, -0.7527453899383545, -0.727885365486145, -0.7030253410339355, -0.6781653165817261, -0.6533053517341614, -0.6284453272819519, -0.6035853028297424, -0.578725278377533, -0.5538653135299683, -0.5290052890777588, -0.5041452646255493, -0.47928526997566223, -0.45442527532577515, -0.4295652508735657, -0.4047052562236786, -0.3798452615737915, -0.35498523712158203, -0.33012524247169495, -0.3052652180194855, -0.2804052233695984, -0.2555451989173889, -0.23068520426750183, -0.20582519471645355, -0.18096518516540527, -0.156105175614357, -0.13124516606330872, -0.10638516396284103, -0.08152515441179276, -0.05666515231132507, -0.031805142760276794, -0.006945133209228516, 0.017914874479174614, 0.042774882167577744, 0.06763488799333572, 0.092494897544384, 0.11735490709543228, 0.14221490919589996, 0.16707491874694824, 0.19193492829799652, 0.2167949378490448, 0.24165494740009308, 0.26651495695114136, 0.29137495160102844, 0.3162349760532379, 0.341094970703125, 0.3659549951553345, 0.39081498980522156, 0.41567498445510864, 0.4405350089073181, 0.4653950035572052, 0.4902550280094147, 0.5151150226593018, 0.5399750471115112, 0.5648350715637207, 0.5896950364112854, 0.6145550608634949, 0.6394150257110596, 0.664275050163269, 0.6891350746154785, 0.713995099067688, 0.7388550639152527, 0.7637150883674622, 0.7885751128196716]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 1.0, 9.0, 10.0, 15.0, 58.0, 95.0, 171.0, 321.0, 715.0, 1672.0, 5009.0, 41429.0, 4110607.0, 26525.0, 4629.0, 1550.0, 675.0, 327.0, 193.0, 98.0, 54.0, 34.0, 13.0, 21.0, 11.0, 6.0, 10.0, 3.0, 2.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.260986328125, -0.24512100219726562, -0.22925567626953125, -0.21339035034179688, -0.1975250244140625, -0.18165969848632812, -0.16579437255859375, -0.14992904663085938, -0.134063720703125, -0.11819839477539062, -0.10233306884765625, -0.08646774291992188, -0.0706024169921875, -0.054737091064453125, -0.03887176513671875, -0.023006439208984375, -0.00714111328125, 0.008724212646484375, 0.02458953857421875, 0.040454864501953125, 0.0563201904296875, 0.07218551635742188, 0.08805084228515625, 0.10391616821289062, 0.119781494140625, 0.13564682006835938, 0.15151214599609375, 0.16737747192382812, 0.1832427978515625, 0.19910812377929688, 0.21497344970703125, 0.23083877563476562, 0.2467041015625, 0.2625694274902344, 0.27843475341796875, 0.2943000793457031, 0.3101654052734375, 0.3260307312011719, 0.34189605712890625, 0.3577613830566406, 0.373626708984375, 0.3894920349121094, 0.40535736083984375, 0.4212226867675781, 0.4370880126953125, 0.4529533386230469, 0.46881866455078125, 0.4846839904785156, 0.50054931640625, 0.5164146423339844, 0.5322799682617188, 0.5481452941894531, 0.5640106201171875, 0.5798759460449219, 0.5957412719726562, 0.6116065979003906, 0.627471923828125, 0.6433372497558594, 0.6592025756835938, 0.6750679016113281, 0.6909332275390625, 0.7067985534667969, 0.7226638793945312, 0.7385292053222656, 0.75439453125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 7.0, 5.0, 8.0, 18.0, 19.0, 26.0, 31.0, 64.0, 76.0, 108.0, 103.0, 111.0, 89.0, 83.0, 70.0, 52.0, 46.0, 30.0, 24.0, 13.0, 8.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04913330078125, -0.045752525329589844, -0.04237174987792969, -0.03899097442626953, -0.035610198974609375, -0.03222942352294922, -0.028848648071289062, -0.025467872619628906, -0.02208709716796875, -0.018706321716308594, -0.015325546264648438, -0.011944770812988281, -0.008563995361328125, -0.005183219909667969, -0.0018024444580078125, 0.0015783309936523438, 0.0049591064453125, 0.008339881896972656, 0.011720657348632812, 0.015101432800292969, 0.018482208251953125, 0.02186298370361328, 0.025243759155273438, 0.028624534606933594, 0.03200531005859375, 0.035386085510253906, 0.03876686096191406, 0.04214763641357422, 0.045528411865234375, 0.04890918731689453, 0.05228996276855469, 0.055670738220214844, 0.059051513671875, 0.062432289123535156, 0.06581306457519531, 0.06919384002685547, 0.07257461547851562, 0.07595539093017578, 0.07933616638183594, 0.0827169418334961, 0.08609771728515625, 0.0894784927368164, 0.09285926818847656, 0.09624004364013672, 0.09962081909179688, 0.10300159454345703, 0.10638236999511719, 0.10976314544677734, 0.1131439208984375, 0.11652469635009766, 0.11990547180175781, 0.12328624725341797, 0.12666702270507812, 0.13004779815673828, 0.13342857360839844, 0.1368093490600586, 0.14019012451171875, 0.1435708999633789, 0.14695167541503906, 0.15033245086669922, 0.15371322631835938, 0.15709400177001953, 0.1604747772216797, 0.16385555267333984, 0.167236328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 5.0, 9.0, 10.0, 11.0, 24.0, 18.0, 53.0, 112.0, 283.0, 783.0, 3025.0, 18791.0, 408263.0, 3699512.0, 54774.0, 6366.0, 1457.0, 424.0, 156.0, 79.0, 32.0, 19.0, 14.0, 7.0, 5.0, 4.0, 8.0, 4.0, 3.0, 5.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2335205078125, -0.22579383850097656, -0.21806716918945312, -0.2103404998779297, -0.20261383056640625, -0.1948871612548828, -0.18716049194335938, -0.17943382263183594, -0.1717071533203125, -0.16398048400878906, -0.15625381469726562, -0.1485271453857422, -0.14080047607421875, -0.1330738067626953, -0.12534713745117188, -0.11762046813964844, -0.109893798828125, -0.10216712951660156, -0.09444046020507812, -0.08671379089355469, -0.07898712158203125, -0.07126045227050781, -0.06353378295898438, -0.05580711364746094, -0.0480804443359375, -0.04035377502441406, -0.032627105712890625, -0.024900436401367188, -0.01717376708984375, -0.009447097778320312, -0.001720428466796875, 0.0060062408447265625, 0.01373291015625, 0.021459579467773438, 0.029186248779296875, 0.03691291809082031, 0.04463958740234375, 0.05236625671386719, 0.060092926025390625, 0.06781959533691406, 0.0755462646484375, 0.08327293395996094, 0.09099960327148438, 0.09872627258300781, 0.10645294189453125, 0.11417961120605469, 0.12190628051757812, 0.12963294982910156, 0.137359619140625, 0.14508628845214844, 0.15281295776367188, 0.1605396270751953, 0.16826629638671875, 0.1759929656982422, 0.18371963500976562, 0.19144630432128906, 0.1991729736328125, 0.20689964294433594, 0.21462631225585938, 0.2223529815673828, 0.23007965087890625, 0.2378063201904297, 0.24553298950195312, 0.25325965881347656, 0.260986328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 5.0, 5.0, 3.0, 10.0, 3.0, 7.0, 12.0, 16.0, 17.0, 36.0, 46.0, 52.0, 61.0, 133.0, 304.0, 846.0, 1146.0, 560.0, 272.0, 159.0, 99.0, 67.0, 60.0, 37.0, 32.0, 20.0, 15.0, 9.0, 9.0, 5.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0703125, -0.06806182861328125, -0.0658111572265625, -0.06356048583984375, -0.061309814453125, -0.05905914306640625, -0.0568084716796875, -0.05455780029296875, -0.05230712890625, -0.05005645751953125, -0.0478057861328125, -0.04555511474609375, -0.043304443359375, -0.04105377197265625, -0.0388031005859375, -0.03655242919921875, -0.0343017578125, -0.03205108642578125, -0.0298004150390625, -0.02754974365234375, -0.025299072265625, -0.02304840087890625, -0.0207977294921875, -0.01854705810546875, -0.01629638671875, -0.01404571533203125, -0.0117950439453125, -0.00954437255859375, -0.007293701171875, -0.00504302978515625, -0.0027923583984375, -0.00054168701171875, 0.001708984375, 0.00395965576171875, 0.0062103271484375, 0.00846099853515625, 0.010711669921875, 0.01296234130859375, 0.0152130126953125, 0.01746368408203125, 0.01971435546875, 0.02196502685546875, 0.0242156982421875, 0.02646636962890625, 0.028717041015625, 0.03096771240234375, 0.0332183837890625, 0.03546905517578125, 0.0377197265625, 0.03997039794921875, 0.0422210693359375, 0.04447174072265625, 0.046722412109375, 0.04897308349609375, 0.0512237548828125, 0.05347442626953125, 0.05572509765625, 0.05797576904296875, 0.0602264404296875, 0.06247711181640625, 0.064727783203125, 0.06697845458984375, 0.0692291259765625, 0.07147979736328125, 0.07373046875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 17.0, 102.0, 636.0, 208.0, 40.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1958421766757965, -0.15244601666927338, -0.10904984921216965, -0.06565368175506592, -0.022257521748542786, 0.021138638257980347, 0.06453481316566467, 0.10793095827102661, 0.15132713317871094, 0.19472329318523407, 0.2381194531917572, 0.28151562809944153, 0.32491177320480347, 0.3683079481124878, 0.4117041230201721, 0.45510026812553406, 0.4984964430332184, 0.5418925881385803, 0.5852887630462646, 0.628684937953949, 0.6720811128616333, 0.7154772281646729, 0.758873462677002, 0.8022695779800415, 0.8456657528877258, 0.8890619277954102, 0.9324581027030945, 0.9758542776107788, 1.0192503929138184, 1.0626466274261475, 1.106042742729187, 1.1494388580322266, 1.1928349733352661, 1.2362310886383057, 1.2796273231506348, 1.3230234384536743, 1.3664196729660034, 1.409815788269043, 1.453212022781372, 1.4966081380844116, 1.5400042533874512, 1.5834003686904907, 1.6267966032028198, 1.6701927185058594, 1.7135889530181885, 1.756985068321228, 1.8003811836242676, 1.8437774181365967, 1.8871736526489258, 1.9305697679519653, 1.9739660024642944, 2.017362117767334, 2.060758352279663, 2.104154586791992, 2.147550582885742, 2.1909468173980713, 2.2343428134918213, 2.2777390480041504, 2.3211350440979004, 2.3645312786102295, 2.4079275131225586, 2.4513235092163086, 2.4947197437286377, 2.538115978240967, 2.581512212753296]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 5.0, 6.0, 11.0, 11.0, 12.0, 19.0, 19.0, 22.0, 29.0, 31.0, 38.0, 34.0, 41.0, 43.0, 44.0, 46.0, 52.0, 50.0, 48.0, 31.0, 52.0, 57.0, 31.0, 46.0, 30.0, 25.0, 32.0, 21.0, 21.0, 14.0, 22.0, 7.0, 10.0, 16.0, 10.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.2670629620552063, -0.25954505801200867, -0.25202712416648865, -0.24450920522212982, -0.236991286277771, -0.22947336733341217, -0.22195544838905334, -0.2144375443458557, -0.2069196105003357, -0.19940169155597687, -0.19188377261161804, -0.18436585366725922, -0.1768479347229004, -0.16933001577854156, -0.16181209683418274, -0.1542941927909851, -0.14677627384662628, -0.13925835490226746, -0.13174043595790863, -0.1242225170135498, -0.11670459806919098, -0.10918667912483215, -0.10166876763105392, -0.0941508486866951, -0.08663292974233627, -0.07911501079797745, -0.07159709185361862, -0.0640791803598404, -0.05656125769019127, -0.04904333874583244, -0.041525423526763916, -0.03400750458240509, -0.026489585638046265, -0.01897166669368744, -0.011453749611973763, -0.003935832530260086, 0.0035820864140987396, 0.011100005358457565, 0.018617920577526093, 0.026135839521884918, 0.033653758466243744, 0.04117167741060257, 0.048689596354961395, 0.05620751157402992, 0.06372542679309845, 0.07124334573745728, 0.0787612646818161, 0.08627918362617493, 0.09379710257053375, 0.10131502151489258, 0.1088329404592514, 0.11635085940361023, 0.12386877834796906, 0.13138669729232788, 0.1389046013355255, 0.14642253518104553, 0.15394043922424316, 0.161458358168602, 0.16897627711296082, 0.17649419605731964, 0.18401211500167847, 0.1915300339460373, 0.19904795289039612, 0.20656585693359375, 0.21408379077911377]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 9.0, 4.0, 8.0, 8.0, 5.0, 12.0, 6.0, 13.0, 23.0, 21.0, 31.0, 28.0, 37.0, 67.0, 92.0, 164.0, 292.0, 607.0, 1420.0, 3390.0, 9286.0, 28998.0, 114052.0, 610962.0, 210650.0, 45945.0, 13826.0, 4864.0, 1845.0, 894.0, 422.0, 166.0, 110.0, 73.0, 55.0, 37.0, 22.0, 23.0, 19.0, 18.0, 10.0, 7.0, 7.0, 5.0, 3.0, 4.0, 9.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.41552734375, -0.4035453796386719, -0.39156341552734375, -0.3795814514160156, -0.3675994873046875, -0.3556175231933594, -0.34363555908203125, -0.3316535949707031, -0.319671630859375, -0.3076896667480469, -0.29570770263671875, -0.2837257385253906, -0.2717437744140625, -0.2597618103027344, -0.24777984619140625, -0.23579788208007812, -0.22381591796875, -0.21183395385742188, -0.19985198974609375, -0.18787002563476562, -0.1758880615234375, -0.16390609741210938, -0.15192413330078125, -0.13994216918945312, -0.127960205078125, -0.11597824096679688, -0.10399627685546875, -0.09201431274414062, -0.0800323486328125, -0.06805038452148438, -0.05606842041015625, -0.044086456298828125, -0.0321044921875, -0.020122528076171875, -0.00814056396484375, 0.003841400146484375, 0.0158233642578125, 0.027805328369140625, 0.03978729248046875, 0.051769256591796875, 0.063751220703125, 0.07573318481445312, 0.08771514892578125, 0.09969711303710938, 0.1116790771484375, 0.12366104125976562, 0.13564300537109375, 0.14762496948242188, 0.15960693359375, 0.17158889770507812, 0.18357086181640625, 0.19555282592773438, 0.2075347900390625, 0.21951675415039062, 0.23149871826171875, 0.24348068237304688, 0.255462646484375, 0.2674446105957031, 0.27942657470703125, 0.2914085388183594, 0.3033905029296875, 0.3153724670410156, 0.32735443115234375, 0.3393363952636719, 0.351318359375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 4.0, 1.0, 7.0, 8.0, 16.0, 21.0, 26.0, 35.0, 56.0, 75.0, 77.0, 86.0, 117.0, 96.0, 92.0, 72.0, 55.0, 40.0, 42.0, 36.0, 12.0, 11.0, 9.0, 7.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0513916015625, -0.04816627502441406, -0.044940948486328125, -0.04171562194824219, -0.03849029541015625, -0.03526496887207031, -0.032039642333984375, -0.028814315795898438, -0.0255889892578125, -0.022363662719726562, -0.019138336181640625, -0.015913009643554688, -0.01268768310546875, -0.009462356567382812, -0.006237030029296875, -0.0030117034912109375, 0.000213623046875, 0.0034389495849609375, 0.006664276123046875, 0.009889602661132812, 0.01311492919921875, 0.016340255737304688, 0.019565582275390625, 0.022790908813476562, 0.0260162353515625, 0.029241561889648438, 0.032466888427734375, 0.03569221496582031, 0.03891754150390625, 0.04214286804199219, 0.045368194580078125, 0.04859352111816406, 0.05181884765625, 0.05504417419433594, 0.058269500732421875, 0.06149482727050781, 0.06472015380859375, 0.06794548034667969, 0.07117080688476562, 0.07439613342285156, 0.0776214599609375, 0.08084678649902344, 0.08407211303710938, 0.08729743957519531, 0.09052276611328125, 0.09374809265136719, 0.09697341918945312, 0.10019874572753906, 0.103424072265625, 0.10664939880371094, 0.10987472534179688, 0.11310005187988281, 0.11632537841796875, 0.11955070495605469, 0.12277603149414062, 0.12600135803222656, 0.1292266845703125, 0.13245201110839844, 0.13567733764648438, 0.1389026641845703, 0.14212799072265625, 0.1453533172607422, 0.14857864379882812, 0.15180397033691406, 0.155029296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 1.0, 5.0, 18.0, 6.0, 12.0, 22.0, 20.0, 33.0, 28.0, 26.0, 43.0, 51.0, 91.0, 151.0, 483.0, 2281.0, 15675.0, 150646.0, 768316.0, 97138.0, 10995.0, 1679.0, 349.0, 135.0, 88.0, 62.0, 43.0, 31.0, 27.0, 20.0, 15.0, 15.0, 10.0, 12.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43017578125, -0.4169044494628906, -0.40363311767578125, -0.3903617858886719, -0.3770904541015625, -0.3638191223144531, -0.35054779052734375, -0.3372764587402344, -0.324005126953125, -0.3107337951660156, -0.29746246337890625, -0.2841911315917969, -0.2709197998046875, -0.2576484680175781, -0.24437713623046875, -0.23110580444335938, -0.21783447265625, -0.20456314086914062, -0.19129180908203125, -0.17802047729492188, -0.1647491455078125, -0.15147781372070312, -0.13820648193359375, -0.12493515014648438, -0.111663818359375, -0.09839248657226562, -0.08512115478515625, -0.07184982299804688, -0.0585784912109375, -0.045307159423828125, -0.03203582763671875, -0.018764495849609375, -0.0054931640625, 0.007778167724609375, 0.02104949951171875, 0.034320831298828125, 0.0475921630859375, 0.060863494873046875, 0.07413482666015625, 0.08740615844726562, 0.100677490234375, 0.11394882202148438, 0.12722015380859375, 0.14049148559570312, 0.1537628173828125, 0.16703414916992188, 0.18030548095703125, 0.19357681274414062, 0.20684814453125, 0.22011947631835938, 0.23339080810546875, 0.24666213989257812, 0.2599334716796875, 0.2732048034667969, 0.28647613525390625, 0.2997474670410156, 0.313018798828125, 0.3262901306152344, 0.33956146240234375, 0.3528327941894531, 0.3661041259765625, 0.3793754577636719, 0.39264678955078125, 0.4059181213378906, 0.419189453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 3.0, 5.0, 4.0, 4.0, 3.0, 7.0, 10.0, 11.0, 12.0, 17.0, 17.0, 19.0, 26.0, 19.0, 26.0, 28.0, 23.0, 35.0, 33.0, 34.0, 57.0, 35.0, 33.0, 37.0, 45.0, 44.0, 38.0, 31.0, 24.0, 41.0, 44.0, 38.0, 28.0, 18.0, 20.0, 37.0, 18.0, 11.0, 10.0, 13.0, 16.0, 10.0, 9.0, 7.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.12396240234375, -0.12045001983642578, -0.11693763732910156, -0.11342525482177734, -0.10991287231445312, -0.1064004898071289, -0.10288810729980469, -0.09937572479248047, -0.09586334228515625, -0.09235095977783203, -0.08883857727050781, -0.0853261947631836, -0.08181381225585938, -0.07830142974853516, -0.07478904724121094, -0.07127666473388672, -0.0677642822265625, -0.06425189971923828, -0.06073951721191406, -0.057227134704589844, -0.053714752197265625, -0.050202369689941406, -0.04668998718261719, -0.04317760467529297, -0.03966522216796875, -0.03615283966064453, -0.03264045715332031, -0.029128074645996094, -0.025615692138671875, -0.022103309631347656, -0.018590927124023438, -0.015078544616699219, -0.011566162109375, -0.008053779602050781, -0.0045413970947265625, -0.0010290145874023438, 0.002483367919921875, 0.005995750427246094, 0.009508132934570312, 0.013020515441894531, 0.01653289794921875, 0.02004528045654297, 0.023557662963867188, 0.027070045471191406, 0.030582427978515625, 0.034094810485839844, 0.03760719299316406, 0.04111957550048828, 0.0446319580078125, 0.04814434051513672, 0.05165672302246094, 0.055169105529785156, 0.058681488037109375, 0.062193870544433594, 0.06570625305175781, 0.06921863555908203, 0.07273101806640625, 0.07624340057373047, 0.07975578308105469, 0.0832681655883789, 0.08678054809570312, 0.09029293060302734, 0.09380531311035156, 0.09731769561767578, 0.100830078125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 8.0, 2.0, 6.0, 10.0, 8.0, 17.0, 21.0, 32.0, 26.0, 57.0, 105.0, 187.0, 382.0, 901.0, 2476.0, 9786.0, 113552.0, 873734.0, 38376.0, 5719.0, 1751.0, 665.0, 307.0, 152.0, 81.0, 42.0, 37.0, 30.0, 18.0, 15.0, 12.0, 8.0, 5.0, 9.0, 3.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2176513671875, -0.21166038513183594, -0.20566940307617188, -0.1996784210205078, -0.19368743896484375, -0.1876964569091797, -0.18170547485351562, -0.17571449279785156, -0.1697235107421875, -0.16373252868652344, -0.15774154663085938, -0.1517505645751953, -0.14575958251953125, -0.1397686004638672, -0.13377761840820312, -0.12778663635253906, -0.121795654296875, -0.11580467224121094, -0.10981369018554688, -0.10382270812988281, -0.09783172607421875, -0.09184074401855469, -0.08584976196289062, -0.07985877990722656, -0.0738677978515625, -0.06787681579589844, -0.061885833740234375, -0.05589485168457031, -0.04990386962890625, -0.04391288757324219, -0.037921905517578125, -0.03193092346191406, -0.02593994140625, -0.019948959350585938, -0.013957977294921875, -0.007966995239257812, -0.00197601318359375, 0.0040149688720703125, 0.010005950927734375, 0.015996932983398438, 0.0219879150390625, 0.027978897094726562, 0.033969879150390625, 0.03996086120605469, 0.04595184326171875, 0.05194282531738281, 0.057933807373046875, 0.06392478942871094, 0.069915771484375, 0.07590675354003906, 0.08189773559570312, 0.08788871765136719, 0.09387969970703125, 0.09987068176269531, 0.10586166381835938, 0.11185264587402344, 0.1178436279296875, 0.12383460998535156, 0.12982559204101562, 0.1358165740966797, 0.14180755615234375, 0.1477985382080078, 0.15378952026367188, 0.15978050231933594, 0.165771484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 10.0, 16.0, 19.0, 38.0, 59.0, 96.0, 173.0, 179.0, 156.0, 92.0, 48.0, 31.0, 13.0, 16.0, 11.0, 5.0, 4.0, 4.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0623207092285156e-05, -1.9963830709457397e-05, -1.930445432662964e-05, -1.864507794380188e-05, -1.798570156097412e-05, -1.7326325178146362e-05, -1.6666948795318604e-05, -1.6007572412490845e-05, -1.5348196029663086e-05, -1.4688819646835327e-05, -1.4029443264007568e-05, -1.337006688117981e-05, -1.271069049835205e-05, -1.2051314115524292e-05, -1.1391937732696533e-05, -1.0732561349868774e-05, -1.0073184967041016e-05, -9.413808584213257e-06, -8.754432201385498e-06, -8.09505581855774e-06, -7.4356794357299805e-06, -6.776303052902222e-06, -6.116926670074463e-06, -5.457550287246704e-06, -4.798173904418945e-06, -4.1387975215911865e-06, -3.4794211387634277e-06, -2.820044755935669e-06, -2.16066837310791e-06, -1.5012919902801514e-06, -8.419156074523926e-07, -1.825392246246338e-07, 4.76837158203125e-07, 1.1362135410308838e-06, 1.7955899238586426e-06, 2.4549663066864014e-06, 3.11434268951416e-06, 3.773719072341919e-06, 4.433095455169678e-06, 5.0924718379974365e-06, 5.751848220825195e-06, 6.411224603652954e-06, 7.070600986480713e-06, 7.729977369308472e-06, 8.38935375213623e-06, 9.04873013496399e-06, 9.708106517791748e-06, 1.0367482900619507e-05, 1.1026859283447266e-05, 1.1686235666275024e-05, 1.2345612049102783e-05, 1.3004988431930542e-05, 1.36643648147583e-05, 1.432374119758606e-05, 1.4983117580413818e-05, 1.5642493963241577e-05, 1.6301870346069336e-05, 1.6961246728897095e-05, 1.7620623111724854e-05, 1.8279999494552612e-05, 1.893937587738037e-05, 1.959875226020813e-05, 2.025812864303589e-05, 2.0917505025863647e-05, 2.1576881408691406e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 10.0, 9.0, 25.0, 31.0, 54.0, 62.0, 165.0, 579.0, 3110.0, 35865.0, 852142.0, 147407.0, 7480.0, 1036.0, 308.0, 99.0, 53.0, 37.0, 24.0, 13.0, 14.0, 10.0, 3.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10589599609375, -0.102447509765625, -0.0989990234375, -0.095550537109375, -0.09210205078125, -0.088653564453125, -0.085205078125, -0.081756591796875, -0.07830810546875, -0.074859619140625, -0.0714111328125, -0.067962646484375, -0.06451416015625, -0.061065673828125, -0.0576171875, -0.054168701171875, -0.05072021484375, -0.047271728515625, -0.0438232421875, -0.040374755859375, -0.03692626953125, -0.033477783203125, -0.030029296875, -0.026580810546875, -0.02313232421875, -0.019683837890625, -0.0162353515625, -0.012786865234375, -0.00933837890625, -0.005889892578125, -0.00244140625, 0.001007080078125, 0.00445556640625, 0.007904052734375, 0.0113525390625, 0.014801025390625, 0.01824951171875, 0.021697998046875, 0.025146484375, 0.028594970703125, 0.03204345703125, 0.035491943359375, 0.0389404296875, 0.042388916015625, 0.04583740234375, 0.049285888671875, 0.052734375, 0.056182861328125, 0.05963134765625, 0.063079833984375, 0.0665283203125, 0.069976806640625, 0.07342529296875, 0.076873779296875, 0.080322265625, 0.083770751953125, 0.08721923828125, 0.090667724609375, 0.0941162109375, 0.097564697265625, 0.10101318359375, 0.104461669921875, 0.10791015625, 0.111358642578125, 0.11480712890625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 8.0, 12.0, 4.0, 18.0, 15.0, 17.0, 25.0, 26.0, 41.0, 34.0, 55.0, 62.0, 82.0, 92.0, 89.0, 90.0, 68.0, 58.0, 32.0, 39.0, 22.0, 15.0, 20.0, 21.0, 15.0, 8.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0269012451171875, -0.026081562042236328, -0.025261878967285156, -0.024442195892333984, -0.023622512817382812, -0.02280282974243164, -0.02198314666748047, -0.021163463592529297, -0.020343780517578125, -0.019524097442626953, -0.01870441436767578, -0.01788473129272461, -0.017065048217773438, -0.016245365142822266, -0.015425682067871094, -0.014605998992919922, -0.01378631591796875, -0.012966632843017578, -0.012146949768066406, -0.011327266693115234, -0.010507583618164062, -0.00968790054321289, -0.008868217468261719, -0.008048534393310547, -0.007228851318359375, -0.006409168243408203, -0.005589485168457031, -0.004769802093505859, -0.0039501190185546875, -0.0031304359436035156, -0.0023107528686523438, -0.0014910697937011719, -0.00067138671875, 0.00014829635620117188, 0.0009679794311523438, 0.0017876625061035156, 0.0026073455810546875, 0.0034270286560058594, 0.004246711730957031, 0.005066394805908203, 0.005886077880859375, 0.006705760955810547, 0.007525444030761719, 0.00834512710571289, 0.009164810180664062, 0.009984493255615234, 0.010804176330566406, 0.011623859405517578, 0.01244354248046875, 0.013263225555419922, 0.014082908630371094, 0.014902591705322266, 0.015722274780273438, 0.01654195785522461, 0.01736164093017578, 0.018181324005126953, 0.019001007080078125, 0.019820690155029297, 0.02064037322998047, 0.02146005630493164, 0.022279739379882812, 0.023099422454833984, 0.023919105529785156, 0.024738788604736328, 0.0255584716796875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 16.0, 820.0, 179.0, 7.0], "bins": [-11.810188293457031, -11.61910629272461, -11.428024291992188, -11.236943244934082, -11.04586124420166, -10.854779243469238, -10.663697242736816, -10.472616195678711, -10.281534194946289, -10.090452194213867, -9.899370193481445, -9.70828914642334, -9.517207145690918, -9.326125144958496, -9.135043144226074, -8.943962097167969, -8.752880096435547, -8.561798095703125, -8.370716094970703, -8.179635047912598, -7.988553047180176, -7.797471046447754, -7.60638952255249, -7.415307521820068, -7.2242255210876465, -7.033143520355225, -6.842061996459961, -6.650979995727539, -6.459898471832275, -6.2688164710998535, -6.07773494720459, -5.886652946472168, -5.695570945739746, -5.504488945007324, -5.3134074211120605, -5.122325420379639, -4.931243896484375, -4.740161895751953, -4.5490803718566895, -4.357998371124268, -4.166916847229004, -3.975835084915161, -3.7847533226013184, -3.5936715602874756, -3.402589797973633, -3.21150803565979, -3.0204262733459473, -2.8293442726135254, -2.6382627487182617, -2.447180986404419, -2.256099224090576, -2.0650174617767334, -1.8739356994628906, -1.6828539371490479, -1.4917720556259155, -1.3006902933120728, -1.10960853099823, -0.9185267686843872, -0.7274450063705444, -0.5363631844520569, -0.3452814221382141, -0.15419965982437134, 0.03688216209411621, 0.22796392440795898, 0.41904568672180176]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 10.0, 3.0, 9.0, 16.0, 20.0, 12.0, 22.0, 16.0, 23.0, 23.0, 33.0, 26.0, 38.0, 36.0, 39.0, 30.0, 36.0, 53.0, 60.0, 53.0, 50.0, 43.0, 52.0, 35.0, 37.0, 24.0, 45.0, 26.0, 21.0, 17.0, 18.0, 13.0, 11.0, 7.0, 8.0, 10.0, 7.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43452364206314087, -0.4203079640865326, -0.4060923159122467, -0.3918766379356384, -0.37766098976135254, -0.36344531178474426, -0.349229633808136, -0.3350139856338501, -0.3207983374595642, -0.30658265948295593, -0.29236701130867004, -0.27815133333206177, -0.2639356851577759, -0.2497200071811676, -0.23550434410572052, -0.22128868103027344, -0.20707300305366516, -0.19285733997821808, -0.178641676902771, -0.16442599892616272, -0.15021035075187683, -0.13599467277526855, -0.12177900969982147, -0.10756334662437439, -0.09334768354892731, -0.07913202047348022, -0.06491635739803314, -0.05070068687200546, -0.03648502379655838, -0.022269360721111298, -0.008053690195083618, 0.006161972880363464, 0.020377635955810547, 0.03459329903125763, 0.04880896583199501, 0.06302463263273239, 0.07724029570817947, 0.09145595878362656, 0.10567162930965424, 0.11988729238510132, 0.1341029554605484, 0.14831861853599548, 0.16253428161144257, 0.17674994468688965, 0.19096562266349792, 0.2051812708377838, 0.2193969488143921, 0.23361261188983917, 0.24782827496528625, 0.26204395294189453, 0.2762596011161804, 0.2904752790927887, 0.3046909272670746, 0.31890660524368286, 0.33312225341796875, 0.347337931394577, 0.3615536093711853, 0.3757692873477936, 0.38998493552207947, 0.40420061349868774, 0.41841626167297363, 0.4326319396495819, 0.4468476176261902, 0.4610632658004761, 0.47527891397476196]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 8.0, 18.0, 40.0, 51.0, 107.0, 194.0, 515.0, 1785.0, 16375.0, 3826851.0, 337467.0, 8401.0, 1464.0, 502.0, 215.0, 133.0, 62.0, 30.0, 30.0, 11.0, 10.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3017578125, -0.2827301025390625, -0.263702392578125, -0.2446746826171875, -0.22564697265625, -0.2066192626953125, -0.187591552734375, -0.1685638427734375, -0.1495361328125, -0.1305084228515625, -0.111480712890625, -0.0924530029296875, -0.07342529296875, -0.0543975830078125, -0.035369873046875, -0.0163421630859375, 0.002685546875, 0.0217132568359375, 0.040740966796875, 0.0597686767578125, 0.07879638671875, 0.0978240966796875, 0.116851806640625, 0.1358795166015625, 0.1549072265625, 0.1739349365234375, 0.192962646484375, 0.2119903564453125, 0.23101806640625, 0.2500457763671875, 0.269073486328125, 0.2881011962890625, 0.30712890625, 0.3261566162109375, 0.345184326171875, 0.3642120361328125, 0.38323974609375, 0.4022674560546875, 0.421295166015625, 0.4403228759765625, 0.4593505859375, 0.4783782958984375, 0.497406005859375, 0.5164337158203125, 0.53546142578125, 0.5544891357421875, 0.573516845703125, 0.5925445556640625, 0.611572265625, 0.6305999755859375, 0.649627685546875, 0.6686553955078125, 0.68768310546875, 0.7067108154296875, 0.725738525390625, 0.7447662353515625, 0.7637939453125, 0.7828216552734375, 0.801849365234375, 0.8208770751953125, 0.83990478515625, 0.8589324951171875, 0.877960205078125, 0.8969879150390625, 0.916015625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 8.0, 16.0, 19.0, 32.0, 35.0, 62.0, 61.0, 71.0, 89.0, 101.0, 96.0, 95.0, 81.0, 63.0, 57.0, 35.0, 21.0, 20.0, 17.0, 7.0, 11.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054718017578125, -0.05131673812866211, -0.04791545867919922, -0.04451417922973633, -0.04111289978027344, -0.03771162033081055, -0.034310340881347656, -0.030909061431884766, -0.027507781982421875, -0.024106502532958984, -0.020705223083496094, -0.017303943634033203, -0.013902664184570312, -0.010501384735107422, -0.007100105285644531, -0.0036988258361816406, -0.00029754638671875, 0.0031037330627441406, 0.006505012512207031, 0.009906291961669922, 0.013307571411132812, 0.016708850860595703, 0.020110130310058594, 0.023511409759521484, 0.026912689208984375, 0.030313968658447266, 0.033715248107910156, 0.03711652755737305, 0.04051780700683594, 0.04391908645629883, 0.04732036590576172, 0.05072164535522461, 0.0541229248046875, 0.05752420425415039, 0.06092548370361328, 0.06432676315307617, 0.06772804260253906, 0.07112932205200195, 0.07453060150146484, 0.07793188095092773, 0.08133316040039062, 0.08473443984985352, 0.0881357192993164, 0.0915369987487793, 0.09493827819824219, 0.09833955764770508, 0.10174083709716797, 0.10514211654663086, 0.10854339599609375, 0.11194467544555664, 0.11534595489501953, 0.11874723434448242, 0.12214851379394531, 0.1255497932434082, 0.1289510726928711, 0.13235235214233398, 0.13575363159179688, 0.13915491104125977, 0.14255619049072266, 0.14595746994018555, 0.14935874938964844, 0.15276002883911133, 0.15616130828857422, 0.1595625877380371, 0.1629638671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 8.0, 15.0, 28.0, 36.0, 75.0, 114.0, 250.0, 523.0, 1215.0, 4002.0, 20604.0, 221038.0, 3656645.0, 259910.0, 22898.0, 4334.0, 1393.0, 551.0, 290.0, 126.0, 99.0, 36.0, 23.0, 17.0, 17.0, 14.0, 1.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2626953125, -0.25348663330078125, -0.2442779541015625, -0.23506927490234375, -0.225860595703125, -0.21665191650390625, -0.2074432373046875, -0.19823455810546875, -0.18902587890625, -0.17981719970703125, -0.1706085205078125, -0.16139984130859375, -0.152191162109375, -0.14298248291015625, -0.1337738037109375, -0.12456512451171875, -0.1153564453125, -0.10614776611328125, -0.0969390869140625, -0.08773040771484375, -0.078521728515625, -0.06931304931640625, -0.0601043701171875, -0.05089569091796875, -0.04168701171875, -0.03247833251953125, -0.0232696533203125, -0.01406097412109375, -0.004852294921875, 0.00435638427734375, 0.0135650634765625, 0.02277374267578125, 0.031982421875, 0.04119110107421875, 0.0503997802734375, 0.05960845947265625, 0.068817138671875, 0.07802581787109375, 0.0872344970703125, 0.09644317626953125, 0.10565185546875, 0.11486053466796875, 0.1240692138671875, 0.13327789306640625, 0.142486572265625, 0.15169525146484375, 0.1609039306640625, 0.17011260986328125, 0.1793212890625, 0.18852996826171875, 0.1977386474609375, 0.20694732666015625, 0.216156005859375, 0.22536468505859375, 0.2345733642578125, 0.24378204345703125, 0.25299072265625, 0.26219940185546875, 0.2714080810546875, 0.28061676025390625, 0.289825439453125, 0.29903411865234375, 0.3082427978515625, 0.31745147705078125, 0.32666015625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 9.0, 11.0, 24.0, 29.0, 66.0, 58.0, 82.0, 109.0, 165.0, 288.0, 540.0, 1134.0, 683.0, 302.0, 171.0, 113.0, 72.0, 51.0, 56.0, 27.0, 15.0, 13.0, 11.0, 12.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11175537109375, -0.10785579681396484, -0.10395622253417969, -0.10005664825439453, -0.09615707397460938, -0.09225749969482422, -0.08835792541503906, -0.0844583511352539, -0.08055877685546875, -0.0766592025756836, -0.07275962829589844, -0.06886005401611328, -0.06496047973632812, -0.06106090545654297, -0.05716133117675781, -0.053261756896972656, -0.0493621826171875, -0.045462608337402344, -0.04156303405761719, -0.03766345977783203, -0.033763885498046875, -0.02986431121826172, -0.025964736938476562, -0.022065162658691406, -0.01816558837890625, -0.014266014099121094, -0.010366439819335938, -0.006466865539550781, -0.002567291259765625, 0.0013322830200195312, 0.0052318572998046875, 0.009131431579589844, 0.013031005859375, 0.016930580139160156, 0.020830154418945312, 0.02472972869873047, 0.028629302978515625, 0.03252887725830078, 0.03642845153808594, 0.040328025817871094, 0.04422760009765625, 0.048127174377441406, 0.05202674865722656, 0.05592632293701172, 0.059825897216796875, 0.06372547149658203, 0.06762504577636719, 0.07152462005615234, 0.0754241943359375, 0.07932376861572266, 0.08322334289550781, 0.08712291717529297, 0.09102249145507812, 0.09492206573486328, 0.09882164001464844, 0.1027212142944336, 0.10662078857421875, 0.1105203628540039, 0.11441993713378906, 0.11831951141357422, 0.12221908569335938, 0.12611865997314453, 0.1300182342529297, 0.13391780853271484, 0.1378173828125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 6.0, 30.0, 37.0, 132.0, 273.0, 263.0, 142.0, 57.0, 34.0, 16.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22763663530349731, -0.20282776653766632, -0.17801889777183533, -0.15321002900600433, -0.12840116024017334, -0.10359229147434235, -0.07878342270851135, -0.05397455394268036, -0.029165685176849365, -0.004356816411018372, 0.020452052354812622, 0.045260921120643616, 0.07006978988647461, 0.0948786586523056, 0.1196875274181366, 0.1444963961839676, 0.16930526494979858, 0.19411413371562958, 0.21892300248146057, 0.24373187124729156, 0.26854074001312256, 0.29334962368011475, 0.31815847754478455, 0.34296733140945435, 0.36777621507644653, 0.3925850987434387, 0.4173939526081085, 0.4422028064727783, 0.4670116901397705, 0.4918205738067627, 0.5166294574737549, 0.5414382815361023, 0.5662472248077393, 0.5910561084747314, 0.6158649921417236, 0.640673816204071, 0.6654826998710632, 0.6902915835380554, 0.7151004076004028, 0.739909291267395, 0.7647181749343872, 0.7895270586013794, 0.8143359422683716, 0.839144766330719, 0.8639536499977112, 0.8887625336647034, 0.9135713577270508, 0.938380241394043, 0.9631891250610352, 0.9879980087280273, 1.0128068923950195, 1.0376157760620117, 1.062424659729004, 1.0872334241867065, 1.1120423078536987, 1.136851191520691, 1.161660075187683, 1.1864689588546753, 1.2112778425216675, 1.2360867261886597, 1.2608954906463623, 1.2857043743133545, 1.3105132579803467, 1.3353221416473389, 1.360131025314331]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 6.0, 9.0, 26.0, 31.0, 40.0, 32.0, 49.0, 70.0, 58.0, 60.0, 72.0, 79.0, 86.0, 67.0, 71.0, 51.0, 39.0, 33.0, 27.0, 25.0, 27.0, 14.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4593002200126648, -0.4430868923664093, -0.4268735647201538, -0.4106602370738983, -0.3944469094276428, -0.3782336115837097, -0.3620202839374542, -0.34580695629119873, -0.32959362864494324, -0.31338030099868774, -0.29716697335243225, -0.28095364570617676, -0.26474034786224365, -0.24852700531482697, -0.23231369256973267, -0.21610036492347717, -0.19988703727722168, -0.1836737096309662, -0.1674603819847107, -0.1512470692396164, -0.1350337415933609, -0.11882041394710541, -0.10260709375143051, -0.08639377355575562, -0.07018044590950012, -0.05396712198853493, -0.03775379806756973, -0.021540474146604538, -0.005327150225639343, 0.01088617742061615, 0.027099497616291046, 0.04331281781196594, 0.05952608585357666, 0.07573941349983215, 0.09195273369550705, 0.10816605389118195, 0.12437938153743744, 0.14059270918369293, 0.15680602192878723, 0.17301934957504272, 0.18923267722129822, 0.2054460048675537, 0.2216593325138092, 0.2378726452589035, 0.2540859580039978, 0.2702993154525757, 0.2865126132965088, 0.3027259409427643, 0.3189392685890198, 0.33515259623527527, 0.35136592388153076, 0.36757925152778625, 0.38379257917404175, 0.40000587701797485, 0.41621920466423035, 0.43243253231048584, 0.44864585995674133, 0.4648591876029968, 0.4810725152492523, 0.4972858428955078, 0.5134991407394409, 0.5297124981880188, 0.5459257960319519, 0.5621391534805298, 0.5783524513244629]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 1.0, 7.0, 4.0, 3.0, 13.0, 16.0, 23.0, 37.0, 47.0, 54.0, 71.0, 168.0, 404.0, 1055.0, 3505.0, 15947.0, 95990.0, 663828.0, 227224.0, 31000.0, 6374.0, 1646.0, 543.0, 224.0, 123.0, 72.0, 44.0, 41.0, 17.0, 18.0, 10.0, 5.0, 17.0, 8.0, 6.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.388671875, -0.3767852783203125, -0.364898681640625, -0.3530120849609375, -0.34112548828125, -0.3292388916015625, -0.317352294921875, -0.3054656982421875, -0.2935791015625, -0.2816925048828125, -0.269805908203125, -0.2579193115234375, -0.24603271484375, -0.2341461181640625, -0.222259521484375, -0.2103729248046875, -0.198486328125, -0.1865997314453125, -0.174713134765625, -0.1628265380859375, -0.15093994140625, -0.1390533447265625, -0.127166748046875, -0.1152801513671875, -0.1033935546875, -0.0915069580078125, -0.079620361328125, -0.0677337646484375, -0.05584716796875, -0.0439605712890625, -0.032073974609375, -0.0201873779296875, -0.00830078125, 0.0035858154296875, 0.015472412109375, 0.0273590087890625, 0.03924560546875, 0.0511322021484375, 0.063018798828125, 0.0749053955078125, 0.0867919921875, 0.0986785888671875, 0.110565185546875, 0.1224517822265625, 0.13433837890625, 0.1462249755859375, 0.158111572265625, 0.1699981689453125, 0.181884765625, 0.1937713623046875, 0.205657958984375, 0.2175445556640625, 0.22943115234375, 0.2413177490234375, 0.253204345703125, 0.2650909423828125, 0.2769775390625, 0.2888641357421875, 0.300750732421875, 0.3126373291015625, 0.32452392578125, 0.3364105224609375, 0.348297119140625, 0.3601837158203125, 0.3720703125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 7.0, 3.0, 21.0, 26.0, 40.0, 36.0, 57.0, 75.0, 92.0, 113.0, 112.0, 97.0, 79.0, 67.0, 59.0, 42.0, 32.0, 17.0, 19.0, 9.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051727294921875, -0.04815530776977539, -0.04458332061767578, -0.04101133346557617, -0.03743934631347656, -0.03386735916137695, -0.030295372009277344, -0.026723384857177734, -0.023151397705078125, -0.019579410552978516, -0.016007423400878906, -0.012435436248779297, -0.008863449096679688, -0.005291461944580078, -0.0017194747924804688, 0.0018525123596191406, 0.00542449951171875, 0.00899648666381836, 0.012568473815917969, 0.016140460968017578, 0.019712448120117188, 0.023284435272216797, 0.026856422424316406, 0.030428409576416016, 0.034000396728515625, 0.037572383880615234, 0.041144371032714844, 0.04471635818481445, 0.04828834533691406, 0.05186033248901367, 0.05543231964111328, 0.05900430679321289, 0.0625762939453125, 0.06614828109741211, 0.06972026824951172, 0.07329225540161133, 0.07686424255371094, 0.08043622970581055, 0.08400821685791016, 0.08758020401000977, 0.09115219116210938, 0.09472417831420898, 0.0982961654663086, 0.1018681526184082, 0.10544013977050781, 0.10901212692260742, 0.11258411407470703, 0.11615610122680664, 0.11972808837890625, 0.12330007553100586, 0.12687206268310547, 0.13044404983520508, 0.1340160369873047, 0.1375880241394043, 0.1411600112915039, 0.14473199844360352, 0.14830398559570312, 0.15187597274780273, 0.15544795989990234, 0.15901994705200195, 0.16259193420410156, 0.16616392135620117, 0.16973590850830078, 0.1733078956604004, 0.1768798828125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 9.0, 4.0, 12.0, 15.0, 24.0, 52.0, 69.0, 129.0, 193.0, 419.0, 892.0, 1939.0, 4947.0, 14072.0, 45562.0, 190537.0, 527129.0, 193289.0, 46346.0, 13993.0, 5103.0, 2077.0, 835.0, 415.0, 202.0, 105.0, 58.0, 48.0, 27.0, 21.0, 9.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26708984375, -0.2595672607421875, -0.252044677734375, -0.2445220947265625, -0.23699951171875, -0.2294769287109375, -0.221954345703125, -0.2144317626953125, -0.2069091796875, -0.1993865966796875, -0.191864013671875, -0.1843414306640625, -0.17681884765625, -0.1692962646484375, -0.161773681640625, -0.1542510986328125, -0.146728515625, -0.1392059326171875, -0.131683349609375, -0.1241607666015625, -0.11663818359375, -0.1091156005859375, -0.101593017578125, -0.0940704345703125, -0.0865478515625, -0.0790252685546875, -0.071502685546875, -0.0639801025390625, -0.05645751953125, -0.0489349365234375, -0.041412353515625, -0.0338897705078125, -0.0263671875, -0.0188446044921875, -0.011322021484375, -0.0037994384765625, 0.00372314453125, 0.0112457275390625, 0.018768310546875, 0.0262908935546875, 0.0338134765625, 0.0413360595703125, 0.048858642578125, 0.0563812255859375, 0.06390380859375, 0.0714263916015625, 0.078948974609375, 0.0864715576171875, 0.093994140625, 0.1015167236328125, 0.109039306640625, 0.1165618896484375, 0.12408447265625, 0.1316070556640625, 0.139129638671875, 0.1466522216796875, 0.1541748046875, 0.1616973876953125, 0.169219970703125, 0.1767425537109375, 0.18426513671875, 0.1917877197265625, 0.199310302734375, 0.2068328857421875, 0.21435546875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 9.0, 4.0, 16.0, 15.0, 13.0, 21.0, 21.0, 22.0, 33.0, 30.0, 35.0, 61.0, 44.0, 49.0, 60.0, 61.0, 64.0, 52.0, 53.0, 54.0, 49.0, 37.0, 35.0, 29.0, 25.0, 31.0, 14.0, 12.0, 13.0, 13.0, 8.0, 7.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1279296875, -0.1227874755859375, -0.117645263671875, -0.1125030517578125, -0.10736083984375, -0.1022186279296875, -0.097076416015625, -0.0919342041015625, -0.0867919921875, -0.0816497802734375, -0.076507568359375, -0.0713653564453125, -0.06622314453125, -0.0610809326171875, -0.055938720703125, -0.0507965087890625, -0.045654296875, -0.0405120849609375, -0.035369873046875, -0.0302276611328125, -0.02508544921875, -0.0199432373046875, -0.014801025390625, -0.0096588134765625, -0.0045166015625, 0.0006256103515625, 0.005767822265625, 0.0109100341796875, 0.01605224609375, 0.0211944580078125, 0.026336669921875, 0.0314788818359375, 0.03662109375, 0.0417633056640625, 0.046905517578125, 0.0520477294921875, 0.05718994140625, 0.0623321533203125, 0.067474365234375, 0.0726165771484375, 0.0777587890625, 0.0829010009765625, 0.088043212890625, 0.0931854248046875, 0.09832763671875, 0.1034698486328125, 0.108612060546875, 0.1137542724609375, 0.118896484375, 0.1240386962890625, 0.129180908203125, 0.1343231201171875, 0.13946533203125, 0.1446075439453125, 0.149749755859375, 0.1548919677734375, 0.1600341796875, 0.1651763916015625, 0.170318603515625, 0.1754608154296875, 0.18060302734375, 0.1857452392578125, 0.190887451171875, 0.1960296630859375, 0.201171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 3.0, 8.0, 12.0, 11.0, 17.0, 23.0, 35.0, 57.0, 86.0, 132.0, 197.0, 398.0, 785.0, 1551.0, 3769.0, 13057.0, 74744.0, 725484.0, 193914.0, 23935.0, 5973.0, 2129.0, 999.0, 491.0, 296.0, 169.0, 90.0, 45.0, 43.0, 26.0, 12.0, 12.0, 12.0, 4.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.193115234375, -0.18799209594726562, -0.18286895751953125, -0.17774581909179688, -0.1726226806640625, -0.16749954223632812, -0.16237640380859375, -0.15725326538085938, -0.152130126953125, -0.14700698852539062, -0.14188385009765625, -0.13676071166992188, -0.1316375732421875, -0.12651443481445312, -0.12139129638671875, -0.11626815795898438, -0.11114501953125, -0.10602188110351562, -0.10089874267578125, -0.09577560424804688, -0.0906524658203125, -0.08552932739257812, -0.08040618896484375, -0.07528305053710938, -0.070159912109375, -0.06503677368164062, -0.05991363525390625, -0.054790496826171875, -0.0496673583984375, -0.044544219970703125, -0.03942108154296875, -0.034297943115234375, -0.0291748046875, -0.024051666259765625, -0.01892852783203125, -0.013805389404296875, -0.0086822509765625, -0.003559112548828125, 0.00156402587890625, 0.006687164306640625, 0.011810302734375, 0.016933441162109375, 0.02205657958984375, 0.027179718017578125, 0.0323028564453125, 0.037425994873046875, 0.04254913330078125, 0.047672271728515625, 0.05279541015625, 0.057918548583984375, 0.06304168701171875, 0.06816482543945312, 0.0732879638671875, 0.07841110229492188, 0.08353424072265625, 0.08865737915039062, 0.093780517578125, 0.09890365600585938, 0.10402679443359375, 0.10914993286132812, 0.1142730712890625, 0.11939620971679688, 0.12451934814453125, 0.12964248657226562, 0.134765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 3.0, 4.0, 6.0, 5.0, 10.0, 16.0, 27.0, 23.0, 40.0, 59.0, 121.0, 136.0, 138.0, 103.0, 106.0, 57.0, 34.0, 28.0, 19.0, 15.0, 15.0, 8.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0371208190917969e-05, -9.981915354728699e-06, -9.592622518539429e-06, -9.203329682350159e-06, -8.814036846160889e-06, -8.424744009971619e-06, -8.035451173782349e-06, -7.646158337593079e-06, -7.256865501403809e-06, -6.8675726652145386e-06, -6.4782798290252686e-06, -6.0889869928359985e-06, -5.6996941566467285e-06, -5.3104013204574585e-06, -4.9211084842681885e-06, -4.5318156480789185e-06, -4.1425228118896484e-06, -3.7532299757003784e-06, -3.3639371395111084e-06, -2.9746443033218384e-06, -2.5853514671325684e-06, -2.1960586309432983e-06, -1.8067657947540283e-06, -1.4174729585647583e-06, -1.0281801223754883e-06, -6.388872861862183e-07, -2.4959444999694824e-07, 1.3969838619232178e-07, 5.289912223815918e-07, 9.182840585708618e-07, 1.3075768947601318e-06, 1.6968697309494019e-06, 2.086162567138672e-06, 2.475455403327942e-06, 2.864748239517212e-06, 3.254041075706482e-06, 3.643333911895752e-06, 4.032626748085022e-06, 4.421919584274292e-06, 4.811212420463562e-06, 5.200505256652832e-06, 5.589798092842102e-06, 5.979090929031372e-06, 6.368383765220642e-06, 6.757676601409912e-06, 7.146969437599182e-06, 7.536262273788452e-06, 7.925555109977722e-06, 8.314847946166992e-06, 8.704140782356262e-06, 9.093433618545532e-06, 9.482726454734802e-06, 9.872019290924072e-06, 1.0261312127113342e-05, 1.0650604963302612e-05, 1.1039897799491882e-05, 1.1429190635681152e-05, 1.1818483471870422e-05, 1.2207776308059692e-05, 1.2597069144248962e-05, 1.2986361980438232e-05, 1.3375654816627502e-05, 1.3764947652816772e-05, 1.4154240489006042e-05, 1.4543533325195312e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 9.0, 10.0, 17.0, 22.0, 26.0, 37.0, 65.0, 125.0, 210.0, 316.0, 572.0, 1027.0, 1962.0, 3560.0, 7220.0, 15066.0, 34462.0, 92405.0, 321039.0, 381736.0, 113342.0, 40575.0, 17397.0, 8176.0, 4192.0, 2155.0, 1184.0, 671.0, 388.0, 210.0, 133.0, 75.0, 50.0, 35.0, 20.0, 25.0, 12.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0662841796875, -0.06421852111816406, -0.062152862548828125, -0.06008720397949219, -0.05802154541015625, -0.05595588684082031, -0.053890228271484375, -0.05182456970214844, -0.0497589111328125, -0.04769325256347656, -0.045627593994140625, -0.04356193542480469, -0.04149627685546875, -0.03943061828613281, -0.037364959716796875, -0.03529930114746094, -0.033233642578125, -0.031167984008789062, -0.029102325439453125, -0.027036666870117188, -0.02497100830078125, -0.022905349731445312, -0.020839691162109375, -0.018774032592773438, -0.0167083740234375, -0.014642715454101562, -0.012577056884765625, -0.010511398315429688, -0.00844573974609375, -0.0063800811767578125, -0.004314422607421875, -0.0022487640380859375, -0.00018310546875, 0.0018825531005859375, 0.003948211669921875, 0.0060138702392578125, 0.00807952880859375, 0.010145187377929688, 0.012210845947265625, 0.014276504516601562, 0.0163421630859375, 0.018407821655273438, 0.020473480224609375, 0.022539138793945312, 0.02460479736328125, 0.026670455932617188, 0.028736114501953125, 0.030801773071289062, 0.032867431640625, 0.03493309020996094, 0.036998748779296875, 0.03906440734863281, 0.04113006591796875, 0.04319572448730469, 0.045261383056640625, 0.04732704162597656, 0.0493927001953125, 0.05145835876464844, 0.053524017333984375, 0.05558967590332031, 0.05765533447265625, 0.05972099304199219, 0.061786651611328125, 0.06385231018066406, 0.06591796875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 7.0, 8.0, 6.0, 10.0, 14.0, 16.0, 9.0, 16.0, 22.0, 33.0, 39.0, 36.0, 34.0, 45.0, 51.0, 53.0, 82.0, 74.0, 69.0, 58.0, 57.0, 45.0, 37.0, 44.0, 16.0, 22.0, 18.0, 15.0, 11.0, 14.0, 6.0, 6.0, 4.0, 2.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044342041015625, -0.042922019958496094, -0.04150199890136719, -0.04008197784423828, -0.038661956787109375, -0.03724193572998047, -0.03582191467285156, -0.034401893615722656, -0.03298187255859375, -0.031561851501464844, -0.030141830444335938, -0.02872180938720703, -0.027301788330078125, -0.02588176727294922, -0.024461746215820312, -0.023041725158691406, -0.0216217041015625, -0.020201683044433594, -0.018781661987304688, -0.01736164093017578, -0.015941619873046875, -0.014521598815917969, -0.013101577758789062, -0.011681556701660156, -0.01026153564453125, -0.008841514587402344, -0.0074214935302734375, -0.006001472473144531, -0.004581451416015625, -0.0031614303588867188, -0.0017414093017578125, -0.00032138824462890625, 0.0010986328125, 0.0025186538696289062, 0.0039386749267578125, 0.005358695983886719, 0.006778717041015625, 0.008198738098144531, 0.009618759155273438, 0.011038780212402344, 0.01245880126953125, 0.013878822326660156, 0.015298843383789062, 0.01671886444091797, 0.018138885498046875, 0.01955890655517578, 0.020978927612304688, 0.022398948669433594, 0.0238189697265625, 0.025238990783691406, 0.026659011840820312, 0.02807903289794922, 0.029499053955078125, 0.03091907501220703, 0.03233909606933594, 0.033759117126464844, 0.03517913818359375, 0.036599159240722656, 0.03801918029785156, 0.03943920135498047, 0.040859222412109375, 0.04227924346923828, 0.04369926452636719, 0.045119285583496094, 0.046539306640625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 26.0, 170.0, 699.0, 102.0, 10.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.88085412979126, -4.787600994110107, -4.694348335266113, -4.601095199584961, -4.507842063903809, -4.414588928222656, -4.321336269378662, -4.22808313369751, -4.134829998016357, -4.041576862335205, -3.948323965072632, -3.8550710678100586, -3.7618179321289062, -3.668565034866333, -3.5753121376037598, -3.4820590019226074, -3.388806104660034, -3.295553207397461, -3.2023000717163086, -3.1090471744537354, -3.015794038772583, -2.9225411415100098, -2.8292880058288574, -2.736035108566284, -2.642782211303711, -2.5495293140411377, -2.4562761783599854, -2.363023281097412, -2.2697701454162598, -2.1765172481536865, -2.0832643508911133, -1.990011215209961, -1.8967578411102295, -1.8035048246383667, -1.710251808166504, -1.6169989109039307, -1.5237457752227783, -1.430492877960205, -1.3372398614883423, -1.2439868450164795, -1.1507338285446167, -1.057480812072754, -0.9642277956008911, -0.8709748387336731, -0.7777218222618103, -0.6844688057899475, -0.5912158489227295, -0.4979628324508667, -0.4047098159790039, -0.3114567995071411, -0.2182038128376007, -0.1249508261680603, -0.03169780969619751, 0.06155520677566528, 0.1548081636428833, 0.2480611801147461, 0.3413141965866089, 0.4345672130584717, 0.5278202295303345, 0.6210731863975525, 0.7143262028694153, 0.8075792193412781, 0.9008321762084961, 0.9940851926803589, 1.0873382091522217]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 4.0, 7.0, 9.0, 11.0, 15.0, 22.0, 18.0, 25.0, 32.0, 36.0, 31.0, 38.0, 61.0, 50.0, 60.0, 48.0, 55.0, 54.0, 44.0, 48.0, 34.0, 37.0, 48.0, 29.0, 31.0, 27.0, 35.0, 18.0, 16.0, 11.0, 8.0, 6.0, 11.0, 8.0, 4.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4297906756401062, -0.4140566289424896, -0.39832255244255066, -0.3825885057449341, -0.3668544590473175, -0.3511204123497009, -0.33538633584976196, -0.3196522891521454, -0.3039182424545288, -0.28818419575691223, -0.27245011925697327, -0.2567160725593567, -0.2409820258617401, -0.22524796426296234, -0.20951390266418457, -0.193779855966568, -0.17804577946662903, -0.16231171786785126, -0.14657767117023468, -0.1308436095714569, -0.11510955542325974, -0.09937550127506256, -0.08364143967628479, -0.06790738552808762, -0.05217333137989044, -0.03643927723169327, -0.020705219358205795, -0.004971161484718323, 0.010762892663478851, 0.026496946811676025, 0.042231008410453796, 0.05796506255865097, 0.07369911670684814, 0.08943317085504532, 0.10516722500324249, 0.12090128660202026, 0.13663533329963684, 0.1523693948984146, 0.16810345649719238, 0.18383750319480896, 0.19957156479358673, 0.2153056263923645, 0.23103967308998108, 0.24677373468875885, 0.2625077962875366, 0.2782418429851532, 0.2939758896827698, 0.30970996618270874, 0.3254440128803253, 0.3411780595779419, 0.35691213607788086, 0.37264618277549744, 0.388380229473114, 0.404114305973053, 0.41984835267066956, 0.43558239936828613, 0.4513164758682251, 0.4670505225658417, 0.48278459906578064, 0.4985186457633972, 0.5142527222633362, 0.5299867391586304, 0.5457208156585693, 0.5614548921585083, 0.5771889090538025]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 8.0, 16.0, 23.0, 37.0, 45.0, 106.0, 201.0, 458.0, 1109.0, 3710.0, 14390.0, 67733.0, 805854.0, 3111697.0, 151774.0, 25506.0, 6654.0, 2225.0, 1044.0, 565.0, 327.0, 236.0, 146.0, 109.0, 84.0, 53.0, 54.0, 29.0, 23.0, 15.0, 14.0, 10.0, 7.0, 6.0, 5.0, 6.0, 5.0, 3.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1051025390625, -0.09862709045410156, -0.09215164184570312, -0.08567619323730469, -0.07920074462890625, -0.07272529602050781, -0.06624984741210938, -0.05977439880371094, -0.0532989501953125, -0.04682350158691406, -0.040348052978515625, -0.03387260437011719, -0.02739715576171875, -0.020921707153320312, -0.014446258544921875, -0.007970809936523438, -0.001495361328125, 0.0049800872802734375, 0.011455535888671875, 0.017930984497070312, 0.02440643310546875, 0.030881881713867188, 0.037357330322265625, 0.04383277893066406, 0.0503082275390625, 0.05678367614746094, 0.06325912475585938, 0.06973457336425781, 0.07621002197265625, 0.08268547058105469, 0.08916091918945312, 0.09563636779785156, 0.10211181640625, 0.10858726501464844, 0.11506271362304688, 0.12153816223144531, 0.12801361083984375, 0.1344890594482422, 0.14096450805664062, 0.14743995666503906, 0.1539154052734375, 0.16039085388183594, 0.16686630249023438, 0.1733417510986328, 0.17981719970703125, 0.1862926483154297, 0.19276809692382812, 0.19924354553222656, 0.205718994140625, 0.21219444274902344, 0.21866989135742188, 0.2251453399658203, 0.23162078857421875, 0.2380962371826172, 0.24457168579101562, 0.25104713439941406, 0.2575225830078125, 0.26399803161621094, 0.2704734802246094, 0.2769489288330078, 0.28342437744140625, 0.2898998260498047, 0.2963752746582031, 0.30285072326660156, 0.309326171875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 8.0, 12.0, 6.0, 24.0, 34.0, 43.0, 62.0, 74.0, 73.0, 87.0, 103.0, 111.0, 104.0, 74.0, 52.0, 53.0, 34.0, 23.0, 15.0, 8.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05010986328125, -0.04619121551513672, -0.04227256774902344, -0.038353919982910156, -0.034435272216796875, -0.030516624450683594, -0.026597976684570312, -0.02267932891845703, -0.01876068115234375, -0.014842033386230469, -0.010923385620117188, -0.007004737854003906, -0.003086090087890625, 0.0008325576782226562, 0.0047512054443359375, 0.008669853210449219, 0.0125885009765625, 0.01650714874267578, 0.020425796508789062, 0.024344444274902344, 0.028263092041015625, 0.032181739807128906, 0.03610038757324219, 0.04001903533935547, 0.04393768310546875, 0.04785633087158203, 0.05177497863769531, 0.055693626403808594, 0.059612274169921875, 0.06353092193603516, 0.06744956970214844, 0.07136821746826172, 0.075286865234375, 0.07920551300048828, 0.08312416076660156, 0.08704280853271484, 0.09096145629882812, 0.0948801040649414, 0.09879875183105469, 0.10271739959716797, 0.10663604736328125, 0.11055469512939453, 0.11447334289550781, 0.1183919906616211, 0.12231063842773438, 0.12622928619384766, 0.13014793395996094, 0.13406658172607422, 0.1379852294921875, 0.14190387725830078, 0.14582252502441406, 0.14974117279052734, 0.15365982055664062, 0.1575784683227539, 0.1614971160888672, 0.16541576385498047, 0.16933441162109375, 0.17325305938720703, 0.1771717071533203, 0.1810903549194336, 0.18500900268554688, 0.18892765045166016, 0.19284629821777344, 0.19676494598388672, 0.20068359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 12.0, 19.0, 14.0, 31.0, 47.0, 53.0, 91.0, 123.0, 225.0, 357.0, 783.0, 2465.0, 12328.0, 157512.0, 3500547.0, 489704.0, 23796.0, 3780.0, 1151.0, 504.0, 244.0, 165.0, 112.0, 85.0, 33.0, 36.0, 23.0, 15.0, 12.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.321533203125, -0.3116874694824219, -0.30184173583984375, -0.2919960021972656, -0.2821502685546875, -0.2723045349121094, -0.26245880126953125, -0.2526130676269531, -0.242767333984375, -0.23292160034179688, -0.22307586669921875, -0.21323013305664062, -0.2033843994140625, -0.19353866577148438, -0.18369293212890625, -0.17384719848632812, -0.16400146484375, -0.15415573120117188, -0.14430999755859375, -0.13446426391601562, -0.1246185302734375, -0.11477279663085938, -0.10492706298828125, -0.09508132934570312, -0.085235595703125, -0.07538986206054688, -0.06554412841796875, -0.055698394775390625, -0.0458526611328125, -0.036006927490234375, -0.02616119384765625, -0.016315460205078125, -0.0064697265625, 0.003376007080078125, 0.01322174072265625, 0.023067474365234375, 0.0329132080078125, 0.042758941650390625, 0.05260467529296875, 0.062450408935546875, 0.072296142578125, 0.08214187622070312, 0.09198760986328125, 0.10183334350585938, 0.1116790771484375, 0.12152481079101562, 0.13137054443359375, 0.14121627807617188, 0.15106201171875, 0.16090774536132812, 0.17075347900390625, 0.18059921264648438, 0.1904449462890625, 0.20029067993164062, 0.21013641357421875, 0.21998214721679688, 0.229827880859375, 0.23967361450195312, 0.24951934814453125, 0.2593650817871094, 0.2692108154296875, 0.2790565490722656, 0.28890228271484375, 0.2987480163574219, 0.30859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 13.0, 21.0, 27.0, 54.0, 83.0, 164.0, 284.0, 465.0, 782.0, 958.0, 576.0, 315.0, 148.0, 80.0, 33.0, 22.0, 18.0, 10.0, 12.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.137451171875, -0.12945175170898438, -0.12145233154296875, -0.11345291137695312, -0.1054534912109375, -0.09745407104492188, -0.08945465087890625, -0.08145523071289062, -0.073455810546875, -0.06545639038085938, -0.05745697021484375, -0.049457550048828125, -0.0414581298828125, -0.033458709716796875, -0.02545928955078125, -0.017459869384765625, -0.00946044921875, -0.001461029052734375, 0.00653839111328125, 0.014537811279296875, 0.0225372314453125, 0.030536651611328125, 0.03853607177734375, 0.046535491943359375, 0.054534912109375, 0.06253433227539062, 0.07053375244140625, 0.07853317260742188, 0.0865325927734375, 0.09453201293945312, 0.10253143310546875, 0.11053085327148438, 0.1185302734375, 0.12652969360351562, 0.13452911376953125, 0.14252853393554688, 0.1505279541015625, 0.15852737426757812, 0.16652679443359375, 0.17452621459960938, 0.182525634765625, 0.19052505493164062, 0.19852447509765625, 0.20652389526367188, 0.2145233154296875, 0.22252273559570312, 0.23052215576171875, 0.23852157592773438, 0.24652099609375, 0.2545204162597656, 0.26251983642578125, 0.2705192565917969, 0.2785186767578125, 0.2865180969238281, 0.29451751708984375, 0.3025169372558594, 0.310516357421875, 0.3185157775878906, 0.32651519775390625, 0.3345146179199219, 0.3425140380859375, 0.3505134582519531, 0.35851287841796875, 0.3665122985839844, 0.37451171875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 13.0, 8.0, 19.0, 45.0, 64.0, 118.0, 138.0, 169.0, 146.0, 106.0, 57.0, 36.0, 28.0, 17.0, 9.0, 13.0, 7.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40134763717651367, -0.3755206763744354, -0.3496937155723572, -0.3238667845726013, -0.29803982377052307, -0.2722128629684448, -0.24638590216636658, -0.22055895626544952, -0.19473199546337128, -0.16890503466129303, -0.14307808876037598, -0.11725112795829773, -0.09142417460680008, -0.06559722125530243, -0.03977026045322418, -0.013943314552307129, 0.011883646249771118, 0.03771059960126877, 0.06353755295276642, 0.08936451375484467, 0.11519146710634232, 0.14101842045783997, 0.1668453812599182, 0.19267232716083527, 0.2184992879629135, 0.24432624876499176, 0.2701531946659088, 0.29598015546798706, 0.3218071162700653, 0.34763407707214355, 0.3734610080718994, 0.39928796887397766, 0.4251149296760559, 0.45094189047813416, 0.4767688512802124, 0.5025957822799683, 0.5284227728843689, 0.5542497038841248, 0.5800766944885254, 0.6059036254882812, 0.6317305564880371, 0.657557487487793, 0.6833844780921936, 0.7092114090919495, 0.7350383996963501, 0.760865330696106, 0.7866922616958618, 0.8125192523002625, 0.8383462429046631, 0.864173173904419, 0.8900001645088196, 0.9158270955085754, 0.9416540861129761, 0.9674810171127319, 0.9933079481124878, 1.0191348791122437, 1.0449618101119995, 1.0707887411117554, 1.0966156721115112, 1.1224427223205566, 1.1482696533203125, 1.1740965843200684, 1.1999235153198242, 1.22575044631958, 1.2515774965286255]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 8.0, 8.0, 11.0, 10.0, 15.0, 16.0, 25.0, 25.0, 25.0, 30.0, 37.0, 20.0, 36.0, 48.0, 55.0, 45.0, 40.0, 49.0, 50.0, 52.0, 53.0, 45.0, 42.0, 36.0, 34.0, 24.0, 21.0, 29.0, 14.0, 13.0, 11.0, 9.0, 4.0, 10.0, 13.0, 5.0, 9.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.5966930389404297, -0.5800929665565491, -0.5634929537773132, -0.5468928813934326, -0.5302928686141968, -0.5136927962303162, -0.49709275364875793, -0.4804927110671997, -0.4638926386833191, -0.44729259610176086, -0.43069255352020264, -0.414092481136322, -0.3974924385547638, -0.38089239597320557, -0.36429235339164734, -0.3476923108100891, -0.3310922682285309, -0.31449222564697266, -0.29789218306541443, -0.2812921404838562, -0.2646920680999756, -0.24809202551841736, -0.23149198293685913, -0.2148919403553009, -0.19829188287258148, -0.18169184029102325, -0.16509178280830383, -0.1484917402267456, -0.13189169764518738, -0.11529164016246796, -0.09869159758090973, -0.0820915475487709, -0.06549149751663208, -0.048891447484493256, -0.03229140117764473, -0.015691354870796204, 0.0009086951613426208, 0.017508745193481445, 0.03410878777503967, 0.0507088378071785, 0.06730888783931732, 0.08390893787145615, 0.10050898790359497, 0.1171090304851532, 0.13370907306671143, 0.15030913054943085, 0.16690917313098907, 0.1835092306137085, 0.20010927319526672, 0.21670931577682495, 0.23330937325954437, 0.2499094158411026, 0.266509473323822, 0.28310951590538025, 0.2997095584869385, 0.3163096010684967, 0.33290964365005493, 0.34950968623161316, 0.3661097288131714, 0.382709801197052, 0.39930984377861023, 0.41590988636016846, 0.4325099289417267, 0.4491099715232849, 0.4657100439071655]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 0.0, 2.0, 4.0, 7.0, 10.0, 5.0, 9.0, 10.0, 16.0, 14.0, 24.0, 29.0, 38.0, 48.0, 84.0, 161.0, 275.0, 686.0, 1920.0, 6084.0, 22935.0, 113319.0, 535725.0, 297522.0, 51671.0, 12111.0, 3546.0, 1189.0, 507.0, 229.0, 109.0, 77.0, 47.0, 27.0, 26.0, 23.0, 18.0, 13.0, 8.0, 4.0, 8.0, 4.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.347900390625, -0.3378944396972656, -0.32788848876953125, -0.3178825378417969, -0.3078765869140625, -0.2978706359863281, -0.28786468505859375, -0.2778587341308594, -0.267852783203125, -0.2578468322753906, -0.24784088134765625, -0.23783493041992188, -0.2278289794921875, -0.21782302856445312, -0.20781707763671875, -0.19781112670898438, -0.18780517578125, -0.17779922485351562, -0.16779327392578125, -0.15778732299804688, -0.1477813720703125, -0.13777542114257812, -0.12776947021484375, -0.11776351928710938, -0.107757568359375, -0.09775161743164062, -0.08774566650390625, -0.07773971557617188, -0.0677337646484375, -0.057727813720703125, -0.04772186279296875, -0.037715911865234375, -0.0277099609375, -0.017704010009765625, -0.00769805908203125, 0.002307891845703125, 0.0123138427734375, 0.022319793701171875, 0.03232574462890625, 0.042331695556640625, 0.052337646484375, 0.062343597412109375, 0.07234954833984375, 0.08235549926757812, 0.0923614501953125, 0.10236740112304688, 0.11237335205078125, 0.12237930297851562, 0.13238525390625, 0.14239120483398438, 0.15239715576171875, 0.16240310668945312, 0.1724090576171875, 0.18241500854492188, 0.19242095947265625, 0.20242691040039062, 0.212432861328125, 0.22243881225585938, 0.23244476318359375, 0.24245071411132812, 0.2524566650390625, 0.2624626159667969, 0.27246856689453125, 0.2824745178222656, 0.29248046875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 5.0, 12.0, 21.0, 25.0, 31.0, 64.0, 100.0, 90.0, 86.0, 114.0, 115.0, 112.0, 75.0, 69.0, 35.0, 22.0, 16.0, 8.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0667724609375, -0.06245231628417969, -0.058132171630859375, -0.05381202697753906, -0.04949188232421875, -0.04517173767089844, -0.040851593017578125, -0.03653144836425781, -0.0322113037109375, -0.027891159057617188, -0.023571014404296875, -0.019250869750976562, -0.01493072509765625, -0.010610580444335938, -0.006290435791015625, -0.0019702911376953125, 0.002349853515625, 0.0066699981689453125, 0.010990142822265625, 0.015310287475585938, 0.01963043212890625, 0.023950576782226562, 0.028270721435546875, 0.03259086608886719, 0.0369110107421875, 0.04123115539550781, 0.045551300048828125, 0.04987144470214844, 0.05419158935546875, 0.05851173400878906, 0.06283187866210938, 0.06715202331542969, 0.07147216796875, 0.07579231262207031, 0.08011245727539062, 0.08443260192871094, 0.08875274658203125, 0.09307289123535156, 0.09739303588867188, 0.10171318054199219, 0.1060333251953125, 0.11035346984863281, 0.11467361450195312, 0.11899375915527344, 0.12331390380859375, 0.12763404846191406, 0.13195419311523438, 0.1362743377685547, 0.140594482421875, 0.1449146270751953, 0.14923477172851562, 0.15355491638183594, 0.15787506103515625, 0.16219520568847656, 0.16651535034179688, 0.1708354949951172, 0.1751556396484375, 0.1794757843017578, 0.18379592895507812, 0.18811607360839844, 0.19243621826171875, 0.19675636291503906, 0.20107650756835938, 0.2053966522216797, 0.209716796875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 12.0, 16.0, 28.0, 30.0, 40.0, 87.0, 149.0, 244.0, 400.0, 654.0, 1124.0, 2108.0, 4082.0, 8373.0, 17985.0, 40751.0, 96923.0, 240540.0, 335083.0, 172205.0, 69451.0, 30134.0, 13835.0, 6637.0, 3427.0, 1769.0, 975.0, 593.0, 328.0, 210.0, 111.0, 80.0, 51.0, 37.0, 23.0, 21.0, 8.0, 7.0, 11.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1668701171875, -0.16154098510742188, -0.15621185302734375, -0.15088272094726562, -0.1455535888671875, -0.14022445678710938, -0.13489532470703125, -0.12956619262695312, -0.124237060546875, -0.11890792846679688, -0.11357879638671875, -0.10824966430664062, -0.1029205322265625, -0.09759140014648438, -0.09226226806640625, -0.08693313598632812, -0.08160400390625, -0.07627487182617188, -0.07094573974609375, -0.06561660766601562, -0.0602874755859375, -0.054958343505859375, -0.04962921142578125, -0.044300079345703125, -0.038970947265625, -0.033641815185546875, -0.02831268310546875, -0.022983551025390625, -0.0176544189453125, -0.012325286865234375, -0.00699615478515625, -0.001667022705078125, 0.003662109375, 0.008991241455078125, 0.01432037353515625, 0.019649505615234375, 0.0249786376953125, 0.030307769775390625, 0.03563690185546875, 0.040966033935546875, 0.046295166015625, 0.051624298095703125, 0.05695343017578125, 0.062282562255859375, 0.0676116943359375, 0.07294082641601562, 0.07826995849609375, 0.08359909057617188, 0.08892822265625, 0.09425735473632812, 0.09958648681640625, 0.10491561889648438, 0.1102447509765625, 0.11557388305664062, 0.12090301513671875, 0.12623214721679688, 0.131561279296875, 0.13689041137695312, 0.14221954345703125, 0.14754867553710938, 0.1528778076171875, 0.15820693969726562, 0.16353607177734375, 0.16886520385742188, 0.1741943359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 6.0, 8.0, 7.0, 10.0, 13.0, 13.0, 19.0, 14.0, 19.0, 23.0, 14.0, 16.0, 26.0, 34.0, 23.0, 41.0, 38.0, 37.0, 35.0, 25.0, 48.0, 36.0, 50.0, 44.0, 46.0, 45.0, 36.0, 27.0, 30.0, 33.0, 35.0, 24.0, 18.0, 16.0, 16.0, 10.0, 13.0, 14.0, 17.0, 8.0, 9.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15869140625, -0.15394973754882812, -0.14920806884765625, -0.14446640014648438, -0.1397247314453125, -0.13498306274414062, -0.13024139404296875, -0.12549972534179688, -0.120758056640625, -0.11601638793945312, -0.11127471923828125, -0.10653305053710938, -0.1017913818359375, -0.09704971313476562, -0.09230804443359375, -0.08756637573242188, -0.08282470703125, -0.07808303833007812, -0.07334136962890625, -0.06859970092773438, -0.0638580322265625, -0.059116363525390625, -0.05437469482421875, -0.049633026123046875, -0.044891357421875, -0.040149688720703125, -0.03540802001953125, -0.030666351318359375, -0.0259246826171875, -0.021183013916015625, -0.01644134521484375, -0.011699676513671875, -0.0069580078125, -0.002216339111328125, 0.00252532958984375, 0.007266998291015625, 0.0120086669921875, 0.016750335693359375, 0.02149200439453125, 0.026233673095703125, 0.030975341796875, 0.035717010498046875, 0.04045867919921875, 0.045200347900390625, 0.0499420166015625, 0.054683685302734375, 0.05942535400390625, 0.06416702270507812, 0.06890869140625, 0.07365036010742188, 0.07839202880859375, 0.08313369750976562, 0.0878753662109375, 0.09261703491210938, 0.09735870361328125, 0.10210037231445312, 0.106842041015625, 0.11158370971679688, 0.11632537841796875, 0.12106704711914062, 0.1258087158203125, 0.13055038452148438, 0.13529205322265625, 0.14003372192382812, 0.144775390625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 15.0, 22.0, 49.0, 84.0, 127.0, 218.0, 476.0, 1142.0, 2620.0, 8249.0, 964541.0, 62980.0, 4743.0, 1729.0, 804.0, 325.0, 168.0, 113.0, 65.0, 30.0, 17.0, 9.0, 6.0, 6.0, 9.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6962890625, -0.67437744140625, -0.6524658203125, -0.63055419921875, -0.608642578125, -0.58673095703125, -0.5648193359375, -0.54290771484375, -0.52099609375, -0.49908447265625, -0.4771728515625, -0.45526123046875, -0.433349609375, -0.41143798828125, -0.3895263671875, -0.36761474609375, -0.345703125, -0.32379150390625, -0.3018798828125, -0.27996826171875, -0.258056640625, -0.23614501953125, -0.2142333984375, -0.19232177734375, -0.17041015625, -0.14849853515625, -0.1265869140625, -0.10467529296875, -0.082763671875, -0.06085205078125, -0.0389404296875, -0.01702880859375, 0.0048828125, 0.02679443359375, 0.0487060546875, 0.07061767578125, 0.092529296875, 0.11444091796875, 0.1363525390625, 0.15826416015625, 0.18017578125, 0.20208740234375, 0.2239990234375, 0.24591064453125, 0.267822265625, 0.28973388671875, 0.3116455078125, 0.33355712890625, 0.35546875, 0.37738037109375, 0.3992919921875, 0.42120361328125, 0.443115234375, 0.46502685546875, 0.4869384765625, 0.50885009765625, 0.53076171875, 0.55267333984375, 0.5745849609375, 0.59649658203125, 0.618408203125, 0.64031982421875, 0.6622314453125, 0.68414306640625, 0.7060546875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 6.0, 23.0, 48.0, 158.0, 223.0, 270.0, 159.0, 66.0, 21.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.141164779663086e-05, -3.010779619216919e-05, -2.880394458770752e-05, -2.750009298324585e-05, -2.619624137878418e-05, -2.489238977432251e-05, -2.358853816986084e-05, -2.228468656539917e-05, -2.09808349609375e-05, -1.967698335647583e-05, -1.837313175201416e-05, -1.706928014755249e-05, -1.576542854309082e-05, -1.446157693862915e-05, -1.315772533416748e-05, -1.185387372970581e-05, -1.055002212524414e-05, -9.24617052078247e-06, -7.9423189163208e-06, -6.638467311859131e-06, -5.334615707397461e-06, -4.030764102935791e-06, -2.726912498474121e-06, -1.4230608940124512e-06, -1.1920928955078125e-07, 1.1846423149108887e-06, 2.4884939193725586e-06, 3.7923455238342285e-06, 5.0961971282958984e-06, 6.400048732757568e-06, 7.703900337219238e-06, 9.007751941680908e-06, 1.0311603546142578e-05, 1.1615455150604248e-05, 1.2919306755065918e-05, 1.4223158359527588e-05, 1.5527009963989258e-05, 1.6830861568450928e-05, 1.8134713172912598e-05, 1.9438564777374268e-05, 2.0742416381835938e-05, 2.2046267986297607e-05, 2.3350119590759277e-05, 2.4653971195220947e-05, 2.5957822799682617e-05, 2.7261674404144287e-05, 2.8565526008605957e-05, 2.9869377613067627e-05, 3.11732292175293e-05, 3.247708082199097e-05, 3.378093242645264e-05, 3.508478403091431e-05, 3.6388635635375977e-05, 3.7692487239837646e-05, 3.8996338844299316e-05, 4.0300190448760986e-05, 4.1604042053222656e-05, 4.2907893657684326e-05, 4.4211745262145996e-05, 4.5515596866607666e-05, 4.6819448471069336e-05, 4.8123300075531006e-05, 4.9427151679992676e-05, 5.0731003284454346e-05, 5.2034854888916016e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 12.0, 10.0, 13.0, 35.0, 42.0, 54.0, 109.0, 198.0, 347.0, 668.0, 1178.0, 2129.0, 4978.0, 11096.0, 28528.0, 77375.0, 204696.0, 342071.0, 230270.0, 88857.0, 32587.0, 12485.0, 5443.0, 2498.0, 1294.0, 613.0, 411.0, 215.0, 94.0, 78.0, 52.0, 37.0, 22.0, 13.0, 13.0, 6.0, 7.0, 8.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06561279296875, -0.0635986328125, -0.06158447265625, -0.0595703125, -0.05755615234375, -0.0555419921875, -0.05352783203125, -0.051513671875, -0.04949951171875, -0.0474853515625, -0.04547119140625, -0.04345703125, -0.04144287109375, -0.0394287109375, -0.03741455078125, -0.035400390625, -0.03338623046875, -0.0313720703125, -0.02935791015625, -0.02734375, -0.02532958984375, -0.0233154296875, -0.02130126953125, -0.019287109375, -0.01727294921875, -0.0152587890625, -0.01324462890625, -0.01123046875, -0.00921630859375, -0.0072021484375, -0.00518798828125, -0.003173828125, -0.00115966796875, 0.0008544921875, 0.00286865234375, 0.0048828125, 0.00689697265625, 0.0089111328125, 0.01092529296875, 0.012939453125, 0.01495361328125, 0.0169677734375, 0.01898193359375, 0.02099609375, 0.02301025390625, 0.0250244140625, 0.02703857421875, 0.029052734375, 0.03106689453125, 0.0330810546875, 0.03509521484375, 0.037109375, 0.03912353515625, 0.0411376953125, 0.04315185546875, 0.045166015625, 0.04718017578125, 0.0491943359375, 0.05120849609375, 0.05322265625, 0.05523681640625, 0.0572509765625, 0.05926513671875, 0.061279296875, 0.06329345703125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 1.0, 5.0, 5.0, 2.0, 7.0, 5.0, 5.0, 9.0, 14.0, 18.0, 19.0, 19.0, 29.0, 26.0, 24.0, 29.0, 49.0, 44.0, 47.0, 48.0, 56.0, 57.0, 50.0, 49.0, 48.0, 49.0, 51.0, 35.0, 35.0, 24.0, 30.0, 18.0, 19.0, 18.0, 14.0, 10.0, 9.0, 8.0, 5.0, 3.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0], "bins": [-0.050811767578125, -0.049483299255371094, -0.04815483093261719, -0.04682636260986328, -0.045497894287109375, -0.04416942596435547, -0.04284095764160156, -0.041512489318847656, -0.04018402099609375, -0.038855552673339844, -0.03752708435058594, -0.03619861602783203, -0.034870147705078125, -0.03354167938232422, -0.03221321105957031, -0.030884742736816406, -0.0295562744140625, -0.028227806091308594, -0.026899337768554688, -0.02557086944580078, -0.024242401123046875, -0.02291393280029297, -0.021585464477539062, -0.020256996154785156, -0.01892852783203125, -0.017600059509277344, -0.016271591186523438, -0.014943122863769531, -0.013614654541015625, -0.012286186218261719, -0.010957717895507812, -0.009629249572753906, -0.00830078125, -0.006972312927246094, -0.0056438446044921875, -0.004315376281738281, -0.002986907958984375, -0.0016584396362304688, -0.0003299713134765625, 0.0009984970092773438, 0.00232696533203125, 0.0036554336547851562, 0.0049839019775390625, 0.006312370300292969, 0.007640838623046875, 0.008969306945800781, 0.010297775268554688, 0.011626243591308594, 0.0129547119140625, 0.014283180236816406, 0.015611648559570312, 0.01694011688232422, 0.018268585205078125, 0.01959705352783203, 0.020925521850585938, 0.022253990173339844, 0.02358245849609375, 0.024910926818847656, 0.026239395141601562, 0.02756786346435547, 0.028896331787109375, 0.03022480010986328, 0.03155326843261719, 0.032881736755371094, 0.034210205078125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 10.0, 24.0, 99.0, 328.0, 384.0, 113.0, 29.0, 14.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5728673934936523, -2.5132243633270264, -2.4535813331604004, -2.3939383029937744, -2.3342952728271484, -2.2746522426605225, -2.2150092124938965, -2.1553664207458496, -2.0957233905792236, -2.0360803604125977, -1.9764373302459717, -1.9167943000793457, -1.8571513891220093, -1.7975083589553833, -1.7378653287887573, -1.6782222986221313, -1.6185791492462158, -1.5589361190795898, -1.4992930889129639, -1.439650058746338, -1.3800071477890015, -1.3203641176223755, -1.2607210874557495, -1.2010780572891235, -1.141435146331787, -1.0817921161651611, -1.0221490859985352, -0.962506115436554, -0.902863085269928, -0.8432201147079468, -0.7835770845413208, -0.7239340543746948, -0.6642910242080688, -0.6046479940414429, -0.5450050234794617, -0.4853619933128357, -0.4257189631462097, -0.36607596278190613, -0.30643296241760254, -0.24678993225097656, -0.18714693188667297, -0.1275039166212082, -0.067860908806324, -0.00821790099143982, 0.05142511427402496, 0.11106812953948975, 0.17071112990379333, 0.2303541600704193, 0.2899971604347229, 0.3496401607990265, 0.40928319096565247, 0.46892619132995605, 0.528569221496582, 0.588212251663208, 0.6478552222251892, 0.7074982523918152, 0.7671412229537964, 0.8267842531204224, 0.8864272236824036, 0.9460702538490295, 1.0057132244110107, 1.0653562545776367, 1.1249992847442627, 1.1846423149108887, 1.2442853450775146]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 10.0, 19.0, 13.0, 29.0, 22.0, 20.0, 29.0, 34.0, 50.0, 48.0, 71.0, 69.0, 60.0, 57.0, 66.0, 61.0, 50.0, 50.0, 47.0, 46.0, 40.0, 39.0, 21.0, 9.0, 11.0, 3.0, 11.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.91217440366745, -0.8893617987632751, -0.8665491342544556, -0.8437365293502808, -0.8209238648414612, -0.7981112599372864, -0.7752985954284668, -0.752485990524292, -0.7296733856201172, -0.7068607807159424, -0.6840481162071228, -0.661235511302948, -0.6384228467941284, -0.6156102418899536, -0.5927976369857788, -0.5699849724769592, -0.5471723079681396, -0.5243597030639648, -0.5015470385551453, -0.47873443365097046, -0.4559217691421509, -0.4331091642379761, -0.4102965295314789, -0.3874838948249817, -0.3646712601184845, -0.3418586254119873, -0.3190459907054901, -0.2962333559989929, -0.2734207510948181, -0.25060808658599854, -0.22779548168182373, -0.20498284697532654, -0.18217027187347412, -0.15935763716697693, -0.13654500246047974, -0.11373238265514374, -0.09091974794864655, -0.06810711324214935, -0.045294493436813354, -0.022481858730316162, 0.0003307759761810303, 0.023143406957387924, 0.04595603793859482, 0.06876866519451141, 0.0915812999010086, 0.1143939346075058, 0.1372065544128418, 0.160019189119339, 0.18283182382583618, 0.20564445853233337, 0.22845709323883057, 0.25126969814300537, 0.27408236265182495, 0.29689496755599976, 0.31970760226249695, 0.34252023696899414, 0.36533287167549133, 0.3881455063819885, 0.4109581410884857, 0.4337707757949829, 0.4565833806991577, 0.4793960452079773, 0.5022086501121521, 0.5250213146209717, 0.5478339195251465]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 10.0, 19.0, 34.0, 66.0, 144.0, 278.0, 672.0, 2137.0, 10345.0, 115752.0, 3890433.0, 159870.0, 10746.0, 2122.0, 763.0, 380.0, 194.0, 111.0, 76.0, 46.0, 20.0, 22.0, 7.0, 12.0, 5.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30859375, -0.2969703674316406, -0.28534698486328125, -0.2737236022949219, -0.2621002197265625, -0.2504768371582031, -0.23885345458984375, -0.22723007202148438, -0.215606689453125, -0.20398330688476562, -0.19235992431640625, -0.18073654174804688, -0.1691131591796875, -0.15748977661132812, -0.14586639404296875, -0.13424301147460938, -0.12261962890625, -0.11099624633789062, -0.09937286376953125, -0.08774948120117188, -0.0761260986328125, -0.06450271606445312, -0.05287933349609375, -0.041255950927734375, -0.029632568359375, -0.018009185791015625, -0.00638580322265625, 0.005237579345703125, 0.0168609619140625, 0.028484344482421875, 0.04010772705078125, 0.051731109619140625, 0.0633544921875, 0.07497787475585938, 0.08660125732421875, 0.09822463989257812, 0.1098480224609375, 0.12147140502929688, 0.13309478759765625, 0.14471817016601562, 0.156341552734375, 0.16796493530273438, 0.17958831787109375, 0.19121170043945312, 0.2028350830078125, 0.21445846557617188, 0.22608184814453125, 0.23770523071289062, 0.24932861328125, 0.2609519958496094, 0.27257537841796875, 0.2841987609863281, 0.2958221435546875, 0.3074455261230469, 0.31906890869140625, 0.3306922912597656, 0.342315673828125, 0.3539390563964844, 0.36556243896484375, 0.3771858215332031, 0.3888092041015625, 0.4004325866699219, 0.41205596923828125, 0.4236793518066406, 0.435302734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 8.0, 11.0, 22.0, 41.0, 43.0, 67.0, 114.0, 124.0, 115.0, 120.0, 116.0, 71.0, 75.0, 37.0, 16.0, 13.0, 10.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11468505859375, -0.10913562774658203, -0.10358619689941406, -0.0980367660522461, -0.09248733520507812, -0.08693790435791016, -0.08138847351074219, -0.07583904266357422, -0.07028961181640625, -0.06474018096923828, -0.05919075012207031, -0.053641319274902344, -0.048091888427734375, -0.042542457580566406, -0.03699302673339844, -0.03144359588623047, -0.0258941650390625, -0.02034473419189453, -0.014795303344726562, -0.009245872497558594, -0.003696441650390625, 0.0018529891967773438, 0.0074024200439453125, 0.012951850891113281, 0.01850128173828125, 0.02405071258544922, 0.029600143432617188, 0.035149574279785156, 0.040699005126953125, 0.046248435974121094, 0.05179786682128906, 0.05734729766845703, 0.062896728515625, 0.06844615936279297, 0.07399559020996094, 0.0795450210571289, 0.08509445190429688, 0.09064388275146484, 0.09619331359863281, 0.10174274444580078, 0.10729217529296875, 0.11284160614013672, 0.11839103698730469, 0.12394046783447266, 0.12948989868164062, 0.1350393295288086, 0.14058876037597656, 0.14613819122314453, 0.1516876220703125, 0.15723705291748047, 0.16278648376464844, 0.1683359146118164, 0.17388534545898438, 0.17943477630615234, 0.1849842071533203, 0.19053363800048828, 0.19608306884765625, 0.20163249969482422, 0.2071819305419922, 0.21273136138916016, 0.21828079223632812, 0.2238302230834961, 0.22937965393066406, 0.23492908477783203, 0.240478515625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 12.0, 20.0, 22.0, 50.0, 67.0, 100.0, 198.0, 356.0, 899.0, 2700.0, 13930.0, 129404.0, 2532551.0, 1425951.0, 75223.0, 9279.0, 2069.0, 696.0, 340.0, 164.0, 91.0, 57.0, 41.0, 28.0, 17.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276611328125, -0.26911354064941406, -0.2616157531738281, -0.2541179656982422, -0.24662017822265625, -0.2391223907470703, -0.23162460327148438, -0.22412681579589844, -0.2166290283203125, -0.20913124084472656, -0.20163345336914062, -0.1941356658935547, -0.18663787841796875, -0.1791400909423828, -0.17164230346679688, -0.16414451599121094, -0.156646728515625, -0.14914894104003906, -0.14165115356445312, -0.1341533660888672, -0.12665557861328125, -0.11915779113769531, -0.11166000366210938, -0.10416221618652344, -0.0966644287109375, -0.08916664123535156, -0.08166885375976562, -0.07417106628417969, -0.06667327880859375, -0.05917549133300781, -0.051677703857421875, -0.04417991638183594, -0.03668212890625, -0.029184341430664062, -0.021686553955078125, -0.014188766479492188, -0.00669097900390625, 0.0008068084716796875, 0.008304595947265625, 0.015802383422851562, 0.0233001708984375, 0.030797958374023438, 0.038295745849609375, 0.04579353332519531, 0.05329132080078125, 0.06078910827636719, 0.06828689575195312, 0.07578468322753906, 0.083282470703125, 0.09078025817871094, 0.09827804565429688, 0.10577583312988281, 0.11327362060546875, 0.12077140808105469, 0.12826919555664062, 0.13576698303222656, 0.1432647705078125, 0.15076255798339844, 0.15826034545898438, 0.1657581329345703, 0.17325592041015625, 0.1807537078857422, 0.18825149536132812, 0.19574928283691406, 0.2032470703125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 11.0, 10.0, 25.0, 38.0, 66.0, 104.0, 125.0, 218.0, 364.0, 492.0, 703.0, 754.0, 418.0, 262.0, 191.0, 80.0, 90.0, 48.0, 28.0, 16.0, 15.0, 5.0, 8.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12017822265625, -0.11414241790771484, -0.10810661315917969, -0.10207080841064453, -0.09603500366210938, -0.08999919891357422, -0.08396339416503906, -0.0779275894165039, -0.07189178466796875, -0.0658559799194336, -0.05982017517089844, -0.05378437042236328, -0.047748565673828125, -0.04171276092529297, -0.03567695617675781, -0.029641151428222656, -0.0236053466796875, -0.017569541931152344, -0.011533737182617188, -0.005497932434082031, 0.000537872314453125, 0.006573677062988281, 0.012609481811523438, 0.018645286560058594, 0.02468109130859375, 0.030716896057128906, 0.03675270080566406, 0.04278850555419922, 0.048824310302734375, 0.05486011505126953, 0.06089591979980469, 0.06693172454833984, 0.072967529296875, 0.07900333404541016, 0.08503913879394531, 0.09107494354248047, 0.09711074829101562, 0.10314655303955078, 0.10918235778808594, 0.1152181625366211, 0.12125396728515625, 0.1272897720336914, 0.13332557678222656, 0.13936138153076172, 0.14539718627929688, 0.15143299102783203, 0.1574687957763672, 0.16350460052490234, 0.1695404052734375, 0.17557621002197266, 0.1816120147705078, 0.18764781951904297, 0.19368362426757812, 0.19971942901611328, 0.20575523376464844, 0.2117910385131836, 0.21782684326171875, 0.2238626480102539, 0.22989845275878906, 0.23593425750732422, 0.24197006225585938, 0.24800586700439453, 0.2540416717529297, 0.26007747650146484, 0.26611328125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 5.0, 17.0, 39.0, 39.0, 92.0, 144.0, 171.0, 172.0, 135.0, 82.0, 35.0, 21.0, 17.0, 10.0, 6.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3894377648830414, -0.36547428369522095, -0.3415107727050781, -0.3175472617149353, -0.29358378052711487, -0.26962029933929443, -0.2456567883491516, -0.22169329226016998, -0.19772979617118835, -0.17376630008220673, -0.1498028039932251, -0.12583930790424347, -0.10187581181526184, -0.07791231572628021, -0.053948819637298584, -0.029985323548316956, -0.006021827459335327, 0.0179416686296463, 0.04190516471862793, 0.06586866080760956, 0.08983215689659119, 0.11379565298557281, 0.13775914907455444, 0.16172264516353607, 0.1856861412525177, 0.20964963734149933, 0.23361313343048096, 0.2575766444206238, 0.2815401256084442, 0.30550360679626465, 0.32946711778640747, 0.3534306287765503, 0.37739408016204834, 0.40135759115219116, 0.4253210723400116, 0.44928455352783203, 0.47324806451797485, 0.4972115755081177, 0.5211750268936157, 0.5451385378837585, 0.5691020488739014, 0.5930655598640442, 0.617029070854187, 0.6409925222396851, 0.6649560332298279, 0.6889195442199707, 0.7128829956054688, 0.7368465065956116, 0.7608100175857544, 0.7847735285758972, 0.80873703956604, 0.8327004909515381, 0.8566640019416809, 0.8806275129318237, 0.9045909643173218, 0.9285544753074646, 0.9525179862976074, 0.9764814972877502, 1.000445008277893, 1.0244084596633911, 1.0483720302581787, 1.0723354816436768, 1.0962989330291748, 1.1202625036239624, 1.1442259550094604]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 8.0, 10.0, 10.0, 11.0, 17.0, 21.0, 28.0, 18.0, 37.0, 37.0, 38.0, 46.0, 40.0, 53.0, 38.0, 44.0, 44.0, 68.0, 52.0, 52.0, 46.0, 41.0, 47.0, 31.0, 23.0, 23.0, 27.0, 19.0, 19.0, 15.0, 14.0, 4.0, 6.0, 5.0, 3.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5208801627159119, -0.5050221085548401, -0.4891640245914459, -0.47330597043037415, -0.45744788646698, -0.4415898323059082, -0.4257317781448364, -0.40987372398376465, -0.3940156400203705, -0.3781575858592987, -0.36229950189590454, -0.34644144773483276, -0.330583393573761, -0.3147253096103668, -0.29886725544929504, -0.2830091714859009, -0.2671511173248291, -0.2512930631637573, -0.23543497920036316, -0.21957692503929138, -0.2037188559770584, -0.18786078691482544, -0.17200273275375366, -0.1561446636915207, -0.14028659462928772, -0.12442852556705475, -0.10857046395540237, -0.09271240234375, -0.07685433328151703, -0.06099626421928406, -0.04513820260763168, -0.02928014099597931, -0.013422071933746338, 0.002435993403196335, 0.018294058740139008, 0.03415212407708168, 0.05001018941402435, 0.06586825847625732, 0.0817263200879097, 0.09758438169956207, 0.11344245076179504, 0.12930051982402802, 0.145158588886261, 0.16101664304733276, 0.17687471210956573, 0.1927327811717987, 0.20859083533287048, 0.22444890439510345, 0.24030697345733643, 0.2561650276184082, 0.27202311158180237, 0.28788116574287415, 0.3037392497062683, 0.3195973038673401, 0.33545535802841187, 0.35131341218948364, 0.3671714961528778, 0.3830295503139496, 0.39888763427734375, 0.4147456884384155, 0.4306037425994873, 0.44646182656288147, 0.46231988072395325, 0.4781779646873474, 0.4940360188484192]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 14.0, 23.0, 30.0, 37.0, 65.0, 73.0, 111.0, 169.0, 275.0, 466.0, 850.0, 2295.0, 9547.0, 57759.0, 452692.0, 451941.0, 58037.0, 9586.0, 2366.0, 915.0, 474.0, 278.0, 152.0, 118.0, 73.0, 59.0, 30.0, 19.0, 16.0, 19.0, 10.0, 10.0, 3.0, 9.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.346923828125, -0.33453369140625, -0.3221435546875, -0.30975341796875, -0.29736328125, -0.28497314453125, -0.2725830078125, -0.26019287109375, -0.247802734375, -0.23541259765625, -0.2230224609375, -0.21063232421875, -0.1982421875, -0.18585205078125, -0.1734619140625, -0.16107177734375, -0.148681640625, -0.13629150390625, -0.1239013671875, -0.11151123046875, -0.09912109375, -0.08673095703125, -0.0743408203125, -0.06195068359375, -0.049560546875, -0.03717041015625, -0.0247802734375, -0.01239013671875, 0.0, 0.01239013671875, 0.0247802734375, 0.03717041015625, 0.049560546875, 0.06195068359375, 0.0743408203125, 0.08673095703125, 0.09912109375, 0.11151123046875, 0.1239013671875, 0.13629150390625, 0.148681640625, 0.16107177734375, 0.1734619140625, 0.18585205078125, 0.1982421875, 0.21063232421875, 0.2230224609375, 0.23541259765625, 0.247802734375, 0.26019287109375, 0.2725830078125, 0.28497314453125, 0.29736328125, 0.30975341796875, 0.3221435546875, 0.33453369140625, 0.346923828125, 0.35931396484375, 0.3717041015625, 0.38409423828125, 0.396484375, 0.40887451171875, 0.4212646484375, 0.43365478515625, 0.446044921875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 11.0, 22.0, 41.0, 77.0, 105.0, 134.0, 155.0, 164.0, 119.0, 81.0, 47.0, 32.0, 12.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14990234375, -0.14357757568359375, -0.1372528076171875, -0.13092803955078125, -0.124603271484375, -0.11827850341796875, -0.1119537353515625, -0.10562896728515625, -0.09930419921875, -0.09297943115234375, -0.0866546630859375, -0.08032989501953125, -0.074005126953125, -0.06768035888671875, -0.0613555908203125, -0.05503082275390625, -0.0487060546875, -0.04238128662109375, -0.0360565185546875, -0.02973175048828125, -0.023406982421875, -0.01708221435546875, -0.0107574462890625, -0.00443267822265625, 0.00189208984375, 0.00821685791015625, 0.0145416259765625, 0.02086639404296875, 0.027191162109375, 0.03351593017578125, 0.0398406982421875, 0.04616546630859375, 0.052490234375, 0.05881500244140625, 0.0651397705078125, 0.07146453857421875, 0.077789306640625, 0.08411407470703125, 0.0904388427734375, 0.09676361083984375, 0.10308837890625, 0.10941314697265625, 0.1157379150390625, 0.12206268310546875, 0.128387451171875, 0.13471221923828125, 0.1410369873046875, 0.14736175537109375, 0.1536865234375, 0.16001129150390625, 0.1663360595703125, 0.17266082763671875, 0.178985595703125, 0.18531036376953125, 0.1916351318359375, 0.19795989990234375, 0.20428466796875, 0.21060943603515625, 0.2169342041015625, 0.22325897216796875, 0.229583740234375, 0.23590850830078125, 0.2422332763671875, 0.24855804443359375, 0.2548828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 15.0, 14.0, 28.0, 33.0, 49.0, 64.0, 108.0, 171.0, 252.0, 408.0, 630.0, 1117.0, 2038.0, 3995.0, 8144.0, 17342.0, 40896.0, 104968.0, 263676.0, 334860.0, 161075.0, 60667.0, 24994.0, 11241.0, 5398.0, 2703.0, 1391.0, 857.0, 516.0, 303.0, 210.0, 131.0, 71.0, 55.0, 46.0, 24.0, 20.0, 15.0, 12.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1756591796875, -0.1706714630126953, -0.16568374633789062, -0.16069602966308594, -0.15570831298828125, -0.15072059631347656, -0.14573287963867188, -0.1407451629638672, -0.1357574462890625, -0.1307697296142578, -0.12578201293945312, -0.12079429626464844, -0.11580657958984375, -0.11081886291503906, -0.10583114624023438, -0.10084342956542969, -0.095855712890625, -0.09086799621582031, -0.08588027954101562, -0.08089256286621094, -0.07590484619140625, -0.07091712951660156, -0.06592941284179688, -0.06094169616699219, -0.0559539794921875, -0.05096626281738281, -0.045978546142578125, -0.04099082946777344, -0.03600311279296875, -0.031015396118164062, -0.026027679443359375, -0.021039962768554688, -0.01605224609375, -0.011064529418945312, -0.006076812744140625, -0.0010890960693359375, 0.00389862060546875, 0.008886337280273438, 0.013874053955078125, 0.018861770629882812, 0.0238494873046875, 0.028837203979492188, 0.033824920654296875, 0.03881263732910156, 0.04380035400390625, 0.04878807067871094, 0.053775787353515625, 0.05876350402832031, 0.063751220703125, 0.06873893737792969, 0.07372665405273438, 0.07871437072753906, 0.08370208740234375, 0.08868980407714844, 0.09367752075195312, 0.09866523742675781, 0.1036529541015625, 0.10864067077636719, 0.11362838745117188, 0.11861610412597656, 0.12360382080078125, 0.12859153747558594, 0.13357925415039062, 0.1385669708251953, 0.1435546875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 0.0, 5.0, 5.0, 6.0, 5.0, 13.0, 9.0, 13.0, 12.0, 18.0, 20.0, 21.0, 23.0, 22.0, 30.0, 30.0, 24.0, 33.0, 37.0, 45.0, 36.0, 38.0, 31.0, 51.0, 38.0, 36.0, 38.0, 40.0, 49.0, 29.0, 36.0, 22.0, 40.0, 16.0, 21.0, 24.0, 13.0, 12.0, 15.0, 10.0, 9.0, 10.0, 8.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.147216796875, -0.1420745849609375, -0.136932373046875, -0.1317901611328125, -0.12664794921875, -0.1215057373046875, -0.116363525390625, -0.1112213134765625, -0.1060791015625, -0.1009368896484375, -0.095794677734375, -0.0906524658203125, -0.08551025390625, -0.0803680419921875, -0.075225830078125, -0.0700836181640625, -0.06494140625, -0.0597991943359375, -0.054656982421875, -0.0495147705078125, -0.04437255859375, -0.0392303466796875, -0.034088134765625, -0.0289459228515625, -0.0238037109375, -0.0186614990234375, -0.013519287109375, -0.0083770751953125, -0.00323486328125, 0.0019073486328125, 0.007049560546875, 0.0121917724609375, 0.017333984375, 0.0224761962890625, 0.027618408203125, 0.0327606201171875, 0.03790283203125, 0.0430450439453125, 0.048187255859375, 0.0533294677734375, 0.0584716796875, 0.0636138916015625, 0.068756103515625, 0.0738983154296875, 0.07904052734375, 0.0841827392578125, 0.089324951171875, 0.0944671630859375, 0.099609375, 0.1047515869140625, 0.109893798828125, 0.1150360107421875, 0.12017822265625, 0.1253204345703125, 0.130462646484375, 0.1356048583984375, 0.1407470703125, 0.1458892822265625, 0.151031494140625, 0.1561737060546875, 0.16131591796875, 0.1664581298828125, 0.171600341796875, 0.1767425537109375, 0.181884765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 9.0, 9.0, 10.0, 21.0, 42.0, 60.0, 91.0, 151.0, 253.0, 501.0, 1219.0, 3460.0, 11793.0, 48545.0, 217999.0, 475040.0, 221562.0, 49991.0, 11943.0, 3409.0, 1274.0, 521.0, 258.0, 135.0, 86.0, 40.0, 34.0, 31.0, 25.0, 10.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.06951904296875, -0.0675044059753418, -0.0654897689819336, -0.06347513198852539, -0.06146049499511719, -0.059445858001708984, -0.05743122100830078, -0.05541658401489258, -0.053401947021484375, -0.05138731002807617, -0.04937267303466797, -0.047358036041259766, -0.04534339904785156, -0.04332876205444336, -0.041314125061035156, -0.03929948806762695, -0.03728485107421875, -0.03527021408081055, -0.033255577087402344, -0.03124094009399414, -0.029226303100585938, -0.027211666107177734, -0.02519702911376953, -0.023182392120361328, -0.021167755126953125, -0.019153118133544922, -0.01713848114013672, -0.015123844146728516, -0.013109207153320312, -0.01109457015991211, -0.009079933166503906, -0.007065296173095703, -0.0050506591796875, -0.003036022186279297, -0.0010213851928710938, 0.0009932518005371094, 0.0030078887939453125, 0.005022525787353516, 0.007037162780761719, 0.009051799774169922, 0.011066436767578125, 0.013081073760986328, 0.015095710754394531, 0.017110347747802734, 0.019124984741210938, 0.02113962173461914, 0.023154258728027344, 0.025168895721435547, 0.02718353271484375, 0.029198169708251953, 0.031212806701660156, 0.03322744369506836, 0.03524208068847656, 0.037256717681884766, 0.03927135467529297, 0.04128599166870117, 0.043300628662109375, 0.04531526565551758, 0.04732990264892578, 0.049344539642333984, 0.05135917663574219, 0.05337381362915039, 0.055388450622558594, 0.0574030876159668, 0.059417724609375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 4.0, 8.0, 12.0, 8.0, 10.0, 16.0, 31.0, 27.0, 34.0, 28.0, 70.0, 53.0, 57.0, 67.0, 55.0, 66.0, 52.0, 61.0, 60.0, 51.0, 35.0, 31.0, 26.0, 22.0, 23.0, 18.0, 22.0, 13.0, 9.0, 10.0, 4.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.463859558105469e-06, -8.210539817810059e-06, -7.957220077514648e-06, -7.703900337219238e-06, -7.450580596923828e-06, -7.197260856628418e-06, -6.943941116333008e-06, -6.690621376037598e-06, -6.4373016357421875e-06, -6.183981895446777e-06, -5.930662155151367e-06, -5.677342414855957e-06, -5.424022674560547e-06, -5.170702934265137e-06, -4.9173831939697266e-06, -4.664063453674316e-06, -4.410743713378906e-06, -4.157423973083496e-06, -3.904104232788086e-06, -3.6507844924926758e-06, -3.3974647521972656e-06, -3.1441450119018555e-06, -2.8908252716064453e-06, -2.637505531311035e-06, -2.384185791015625e-06, -2.130866050720215e-06, -1.8775463104248047e-06, -1.6242265701293945e-06, -1.3709068298339844e-06, -1.1175870895385742e-06, -8.642673492431641e-07, -6.109476089477539e-07, -3.5762786865234375e-07, -1.043081283569336e-07, 1.4901161193847656e-07, 4.023313522338867e-07, 6.556510925292969e-07, 9.08970832824707e-07, 1.1622905731201172e-06, 1.4156103134155273e-06, 1.6689300537109375e-06, 1.9222497940063477e-06, 2.175569534301758e-06, 2.428889274597168e-06, 2.682209014892578e-06, 2.9355287551879883e-06, 3.1888484954833984e-06, 3.4421682357788086e-06, 3.6954879760742188e-06, 3.948807716369629e-06, 4.202127456665039e-06, 4.455447196960449e-06, 4.708766937255859e-06, 4.9620866775512695e-06, 5.21540641784668e-06, 5.46872615814209e-06, 5.7220458984375e-06, 5.97536563873291e-06, 6.22868537902832e-06, 6.4820051193237305e-06, 6.735324859619141e-06, 6.988644599914551e-06, 7.241964340209961e-06, 7.495284080505371e-06, 7.748603820800781e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 3.0, 10.0, 9.0, 8.0, 18.0, 15.0, 33.0, 37.0, 57.0, 55.0, 105.0, 187.0, 270.0, 436.0, 653.0, 1155.0, 2049.0, 4074.0, 8296.0, 20251.0, 58584.0, 188514.0, 384340.0, 250133.0, 80937.0, 27050.0, 10516.0, 4857.0, 2464.0, 1318.0, 783.0, 448.0, 301.0, 178.0, 119.0, 81.0, 54.0, 44.0, 29.0, 17.0, 20.0, 5.0, 15.0, 9.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.05450439453125, -0.05288410186767578, -0.05126380920410156, -0.049643516540527344, -0.048023223876953125, -0.046402931213378906, -0.04478263854980469, -0.04316234588623047, -0.04154205322265625, -0.03992176055908203, -0.03830146789550781, -0.036681175231933594, -0.035060882568359375, -0.033440589904785156, -0.03182029724121094, -0.03020000457763672, -0.0285797119140625, -0.02695941925048828, -0.025339126586914062, -0.023718833923339844, -0.022098541259765625, -0.020478248596191406, -0.018857955932617188, -0.01723766326904297, -0.01561737060546875, -0.013997077941894531, -0.012376785278320312, -0.010756492614746094, -0.009136199951171875, -0.007515907287597656, -0.0058956146240234375, -0.004275321960449219, -0.002655029296875, -0.0010347366333007812, 0.0005855560302734375, 0.0022058486938476562, 0.003826141357421875, 0.005446434020996094, 0.0070667266845703125, 0.008687019348144531, 0.01030731201171875, 0.011927604675292969, 0.013547897338867188, 0.015168190002441406, 0.016788482666015625, 0.018408775329589844, 0.020029067993164062, 0.02164936065673828, 0.0232696533203125, 0.02488994598388672, 0.026510238647460938, 0.028130531311035156, 0.029750823974609375, 0.031371116638183594, 0.03299140930175781, 0.03461170196533203, 0.03623199462890625, 0.03785228729248047, 0.03947257995605469, 0.041092872619628906, 0.042713165283203125, 0.044333457946777344, 0.04595375061035156, 0.04757404327392578, 0.0491943359375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 0.0, 3.0, 6.0, 4.0, 4.0, 5.0, 11.0, 10.0, 11.0, 14.0, 24.0, 36.0, 23.0, 38.0, 65.0, 83.0, 90.0, 100.0, 91.0, 84.0, 68.0, 51.0, 41.0, 23.0, 30.0, 21.0, 11.0, 18.0, 9.0, 4.0, 7.0, 6.0, 0.0, 2.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05419921875, -0.05244016647338867, -0.050681114196777344, -0.048922061920166016, -0.04716300964355469, -0.04540395736694336, -0.04364490509033203, -0.0418858528137207, -0.040126800537109375, -0.03836774826049805, -0.03660869598388672, -0.03484964370727539, -0.03309059143066406, -0.031331539154052734, -0.029572486877441406, -0.027813434600830078, -0.02605438232421875, -0.024295330047607422, -0.022536277770996094, -0.020777225494384766, -0.019018173217773438, -0.01725912094116211, -0.015500068664550781, -0.013741016387939453, -0.011981964111328125, -0.010222911834716797, -0.008463859558105469, -0.006704807281494141, -0.0049457550048828125, -0.0031867027282714844, -0.0014276504516601562, 0.0003314018249511719, 0.0020904541015625, 0.003849506378173828, 0.005608558654785156, 0.007367610931396484, 0.009126663208007812, 0.01088571548461914, 0.012644767761230469, 0.014403820037841797, 0.016162872314453125, 0.017921924591064453, 0.01968097686767578, 0.02144002914428711, 0.023199081420898438, 0.024958133697509766, 0.026717185974121094, 0.028476238250732422, 0.03023529052734375, 0.03199434280395508, 0.033753395080566406, 0.035512447357177734, 0.03727149963378906, 0.03903055191040039, 0.04078960418701172, 0.04254865646362305, 0.044307708740234375, 0.0460667610168457, 0.04782581329345703, 0.04958486557006836, 0.05134391784667969, 0.053102970123291016, 0.054862022399902344, 0.05662107467651367, 0.058380126953125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 16.0, 146.0, 672.0, 162.0, 16.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.652754783630371, -5.549046516418457, -5.445338249206543, -5.341629981994629, -5.237921237945557, -5.134212970733643, -5.0305047035217285, -4.9267964363098145, -4.8230881690979, -4.719379901885986, -4.615671634674072, -4.511962890625, -4.408254623413086, -4.304546356201172, -4.200838088989258, -4.097129821777344, -3.9934210777282715, -3.8897128105163574, -3.7860043048858643, -3.68229603767395, -3.578587770462036, -3.474879264831543, -3.371170997619629, -3.267462730407715, -3.163754463195801, -3.0600461959838867, -2.9563376903533936, -2.8526294231414795, -2.7489211559295654, -2.6452126502990723, -2.541504383087158, -2.437796115875244, -2.334087610244751, -2.230379343032837, -2.1266708374023438, -2.0229625701904297, -1.919254183769226, -1.8155457973480225, -1.7118375301361084, -1.6081291437149048, -1.5044207572937012, -1.4007123708724976, -1.2970041036605835, -1.1932957172393799, -1.0895873308181763, -0.9858790040016174, -0.8821706771850586, -0.778462290763855, -0.6747540235519409, -0.5710456967353821, -0.46733731031417847, -0.36362898349761963, -0.2599206268787384, -0.15621227025985718, -0.05250394344329834, 0.05120444297790527, 0.1549127697944641, 0.25862112641334534, 0.36232948303222656, 0.4660378098487854, 0.5697461366653442, 0.6734545230865479, 0.7771628499031067, 0.8808712363243103, 0.9845795631408691]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 4.0, 2.0, 6.0, 5.0, 3.0, 13.0, 10.0, 8.0, 17.0, 22.0, 16.0, 34.0, 30.0, 38.0, 31.0, 43.0, 48.0, 41.0, 46.0, 43.0, 47.0, 61.0, 47.0, 44.0, 39.0, 33.0, 42.0, 29.0, 36.0, 38.0, 31.0, 16.0, 20.0, 18.0, 13.0, 10.0, 5.0, 6.0, 6.0, 5.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4682573080062866, -0.44985583424568176, -0.4314543604850769, -0.41305291652679443, -0.3946514427661896, -0.3762499690055847, -0.35784852504730225, -0.3394470512866974, -0.32104557752609253, -0.30264410376548767, -0.2842426300048828, -0.26584118604660034, -0.24743971228599548, -0.22903823852539062, -0.21063677966594696, -0.1922353208065033, -0.17383384704589844, -0.15543237328529358, -0.13703091442584991, -0.11862944811582565, -0.10022798180580139, -0.08182651549577713, -0.06342504918575287, -0.045023590326309204, -0.026622116565704346, -0.008220650255680084, 0.010180816054344177, 0.02858228236436844, 0.0469837486743927, 0.06538521498441696, 0.08378668129444122, 0.10218814015388489, 0.12058961391448975, 0.1389910876750946, 0.15739254653453827, 0.17579400539398193, 0.1941954791545868, 0.21259695291519165, 0.23099841177463531, 0.24939987063407898, 0.26780134439468384, 0.2862028181552887, 0.30460429191589355, 0.323005735874176, 0.3414072096347809, 0.35980868339538574, 0.3782101273536682, 0.39661160111427307, 0.41501307487487793, 0.4334145486354828, 0.45181602239608765, 0.4702174663543701, 0.488618940114975, 0.5070204138755798, 0.5254218578338623, 0.5438233613967896, 0.562224805355072, 0.5806262493133545, 0.5990277528762817, 0.6174291968345642, 0.6358306407928467, 0.6542321443557739, 0.6726335883140564, 0.6910350322723389, 0.7094365358352661]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 3.0, 4.0, 12.0, 8.0, 12.0, 14.0, 25.0, 30.0, 44.0, 91.0, 129.0, 219.0, 374.0, 670.0, 1240.0, 2997.0, 9294.0, 41061.0, 503421.0, 3459564.0, 145349.0, 19609.0, 5249.0, 2080.0, 1029.0, 599.0, 366.0, 225.0, 159.0, 106.0, 68.0, 53.0, 43.0, 38.0, 19.0, 19.0, 9.0, 8.0, 6.0, 9.0, 7.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1722412109375, -0.1645221710205078, -0.15680313110351562, -0.14908409118652344, -0.14136505126953125, -0.13364601135253906, -0.12592697143554688, -0.11820793151855469, -0.1104888916015625, -0.10276985168457031, -0.09505081176757812, -0.08733177185058594, -0.07961273193359375, -0.07189369201660156, -0.06417465209960938, -0.05645561218261719, -0.048736572265625, -0.04101753234863281, -0.033298492431640625, -0.025579452514648438, -0.01786041259765625, -0.010141372680664062, -0.002422332763671875, 0.0052967071533203125, 0.0130157470703125, 0.020734786987304688, 0.028453826904296875, 0.03617286682128906, 0.04389190673828125, 0.05161094665527344, 0.059329986572265625, 0.06704902648925781, 0.07476806640625, 0.08248710632324219, 0.09020614624023438, 0.09792518615722656, 0.10564422607421875, 0.11336326599121094, 0.12108230590820312, 0.1288013458251953, 0.1365203857421875, 0.1442394256591797, 0.15195846557617188, 0.15967750549316406, 0.16739654541015625, 0.17511558532714844, 0.18283462524414062, 0.1905536651611328, 0.198272705078125, 0.2059917449951172, 0.21371078491210938, 0.22142982482910156, 0.22914886474609375, 0.23686790466308594, 0.24458694458007812, 0.2523059844970703, 0.2600250244140625, 0.2677440643310547, 0.2754631042480469, 0.28318214416503906, 0.29090118408203125, 0.29862022399902344, 0.3063392639160156, 0.3140583038330078, 0.32177734375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 14.0, 22.0, 42.0, 67.0, 84.0, 112.0, 99.0, 157.0, 130.0, 89.0, 76.0, 52.0, 26.0, 21.0, 6.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11590576171875, -0.11019420623779297, -0.10448265075683594, -0.0987710952758789, -0.09305953979492188, -0.08734798431396484, -0.08163642883300781, -0.07592487335205078, -0.07021331787109375, -0.06450176239013672, -0.05879020690917969, -0.053078651428222656, -0.047367095947265625, -0.041655540466308594, -0.03594398498535156, -0.03023242950439453, -0.0245208740234375, -0.01880931854248047, -0.013097763061523438, -0.007386207580566406, -0.001674652099609375, 0.004036903381347656, 0.009748458862304688, 0.015460014343261719, 0.02117156982421875, 0.02688312530517578, 0.03259468078613281, 0.038306236267089844, 0.044017791748046875, 0.049729347229003906, 0.05544090270996094, 0.06115245819091797, 0.066864013671875, 0.07257556915283203, 0.07828712463378906, 0.0839986801147461, 0.08971023559570312, 0.09542179107666016, 0.10113334655761719, 0.10684490203857422, 0.11255645751953125, 0.11826801300048828, 0.12397956848144531, 0.12969112396240234, 0.13540267944335938, 0.1411142349243164, 0.14682579040527344, 0.15253734588623047, 0.1582489013671875, 0.16396045684814453, 0.16967201232910156, 0.1753835678100586, 0.18109512329101562, 0.18680667877197266, 0.1925182342529297, 0.19822978973388672, 0.20394134521484375, 0.20965290069580078, 0.2153644561767578, 0.22107601165771484, 0.22678756713867188, 0.2324991226196289, 0.23821067810058594, 0.24392223358154297, 0.2496337890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 10.0, 13.0, 11.0, 23.0, 29.0, 36.0, 56.0, 103.0, 136.0, 213.0, 403.0, 707.0, 1415.0, 3428.0, 10149.0, 41110.0, 277844.0, 2656807.0, 1062876.0, 107940.0, 20543.0, 5799.0, 2231.0, 1026.0, 523.0, 291.0, 191.0, 91.0, 75.0, 61.0, 29.0, 21.0, 22.0, 10.0, 16.0, 9.0, 5.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.1768798828125, -0.17164230346679688, -0.16640472412109375, -0.16116714477539062, -0.1559295654296875, -0.15069198608398438, -0.14545440673828125, -0.14021682739257812, -0.134979248046875, -0.12974166870117188, -0.12450408935546875, -0.11926651000976562, -0.1140289306640625, -0.10879135131835938, -0.10355377197265625, -0.09831619262695312, -0.09307861328125, -0.08784103393554688, -0.08260345458984375, -0.07736587524414062, -0.0721282958984375, -0.06689071655273438, -0.06165313720703125, -0.056415557861328125, -0.051177978515625, -0.045940399169921875, -0.04070281982421875, -0.035465240478515625, -0.0302276611328125, -0.024990081787109375, -0.01975250244140625, -0.014514923095703125, -0.00927734375, -0.004039764404296875, 0.00119781494140625, 0.006435394287109375, 0.0116729736328125, 0.016910552978515625, 0.02214813232421875, 0.027385711669921875, 0.032623291015625, 0.037860870361328125, 0.04309844970703125, 0.048336029052734375, 0.0535736083984375, 0.058811187744140625, 0.06404876708984375, 0.06928634643554688, 0.07452392578125, 0.07976150512695312, 0.08499908447265625, 0.09023666381835938, 0.0954742431640625, 0.10071182250976562, 0.10594940185546875, 0.11118698120117188, 0.116424560546875, 0.12166213989257812, 0.12689971923828125, 0.13213729858398438, 0.1373748779296875, 0.14261245727539062, 0.14785003662109375, 0.15308761596679688, 0.1583251953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 7.0, 6.0, 4.0, 8.0, 9.0, 19.0, 14.0, 24.0, 46.0, 36.0, 57.0, 71.0, 104.0, 136.0, 185.0, 249.0, 367.0, 501.0, 546.0, 451.0, 291.0, 255.0, 175.0, 112.0, 87.0, 80.0, 65.0, 40.0, 28.0, 24.0, 16.0, 14.0, 9.0, 4.0, 5.0, 7.0, 8.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.1241455078125, -0.12043094635009766, -0.11671638488769531, -0.11300182342529297, -0.10928726196289062, -0.10557270050048828, -0.10185813903808594, -0.0981435775756836, -0.09442901611328125, -0.0907144546508789, -0.08699989318847656, -0.08328533172607422, -0.07957077026367188, -0.07585620880126953, -0.07214164733886719, -0.06842708587646484, -0.0647125244140625, -0.060997962951660156, -0.05728340148925781, -0.05356884002685547, -0.049854278564453125, -0.04613971710205078, -0.04242515563964844, -0.038710594177246094, -0.03499603271484375, -0.031281471252441406, -0.027566909790039062, -0.02385234832763672, -0.020137786865234375, -0.01642322540283203, -0.012708663940429688, -0.008994102478027344, -0.005279541015625, -0.0015649795532226562, 0.0021495819091796875, 0.005864143371582031, 0.009578704833984375, 0.013293266296386719, 0.017007827758789062, 0.020722389221191406, 0.02443695068359375, 0.028151512145996094, 0.03186607360839844, 0.03558063507080078, 0.039295196533203125, 0.04300975799560547, 0.04672431945800781, 0.050438880920410156, 0.0541534423828125, 0.057868003845214844, 0.06158256530761719, 0.06529712677001953, 0.06901168823242188, 0.07272624969482422, 0.07644081115722656, 0.0801553726196289, 0.08386993408203125, 0.0875844955444336, 0.09129905700683594, 0.09501361846923828, 0.09872817993164062, 0.10244274139404297, 0.10615730285644531, 0.10987186431884766, 0.11358642578125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 8.0, 13.0, 19.0, 39.0, 60.0, 102.0, 179.0, 189.0, 161.0, 97.0, 58.0, 45.0, 14.0, 13.0, 7.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.3298853635787964, -1.3029388189315796, -1.2759922742843628, -1.249045729637146, -1.2220990657806396, -1.1951525211334229, -1.168205976486206, -1.1412594318389893, -1.1143128871917725, -1.0873663425445557, -1.0604197978973389, -1.033473253250122, -1.0065265893936157, -0.9795800447463989, -0.9526335000991821, -0.9256869554519653, -0.8987404108047485, -0.8717938661575317, -0.8448472619056702, -0.8179007172584534, -0.7909541726112366, -0.764007568359375, -0.7370610237121582, -0.7101144790649414, -0.6831678748130798, -0.656221330165863, -0.6292747259140015, -0.6023281812667847, -0.5753816366195679, -0.5484350919723511, -0.5214884877204895, -0.4945419430732727, -0.4675953686237335, -0.44064879417419434, -0.41370224952697754, -0.38675567507743835, -0.35980913043022156, -0.3328625559806824, -0.3059160113334656, -0.2789694368839264, -0.2520228624343872, -0.22507630288600922, -0.19812974333763123, -0.17118316888809204, -0.14423662424087524, -0.11729004979133606, -0.09034349024295807, -0.06339693069458008, -0.03645038604736328, -0.009503824636340141, 0.017442736774683, 0.04438930004835129, 0.07133585959672928, 0.09828242659568787, 0.12522898614406586, 0.15217554569244385, 0.17912210524082184, 0.20606866478919983, 0.23301522433757782, 0.2599617838859558, 0.286908358335495, 0.3138549327850342, 0.340801477432251, 0.3677480220794678, 0.39469459652900696]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 7.0, 6.0, 7.0, 11.0, 10.0, 14.0, 16.0, 20.0, 31.0, 18.0, 30.0, 33.0, 31.0, 38.0, 35.0, 42.0, 35.0, 41.0, 38.0, 42.0, 56.0, 41.0, 36.0, 50.0, 38.0, 29.0, 34.0, 33.0, 18.0, 24.0, 25.0, 26.0, 22.0, 15.0, 14.0, 3.0, 7.0, 4.0, 5.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.39985769987106323, -0.38670894503593445, -0.3735601603984833, -0.3604114055633545, -0.3472626209259033, -0.33411386609077454, -0.32096508145332336, -0.3078163266181946, -0.2946675419807434, -0.2815187871456146, -0.26837000250816345, -0.25522124767303467, -0.2420724630355835, -0.2289237082004547, -0.21577492356300354, -0.20262616872787476, -0.18947739899158478, -0.1763286292552948, -0.16317985951900482, -0.15003108978271484, -0.13688232004642487, -0.12373355776071548, -0.1105847880244255, -0.09743601828813553, -0.08428724855184555, -0.07113847881555557, -0.057989709079265594, -0.044840943068265915, -0.03169217333197594, -0.018543407320976257, -0.005394637584686279, 0.007754132151603699, 0.020902901887893677, 0.034051671624183655, 0.04720044136047363, 0.06034920737147331, 0.07349798083305359, 0.08664674311876297, 0.09979551285505295, 0.11294428259134293, 0.1260930597782135, 0.13924182951450348, 0.15239059925079346, 0.16553936898708344, 0.1786881387233734, 0.1918368935585022, 0.20498567819595337, 0.21813443303108215, 0.23128320276737213, 0.2444319725036621, 0.2575807273387909, 0.27072951197624207, 0.28387826681137085, 0.297027051448822, 0.3101758062839508, 0.323324590921402, 0.33647334575653076, 0.34962210059165955, 0.3627708852291107, 0.3759196400642395, 0.3890684247016907, 0.40221717953681946, 0.41536596417427063, 0.4285147190093994, 0.4416635036468506]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 2.0, 3.0, 3.0, 8.0, 15.0, 8.0, 21.0, 25.0, 22.0, 39.0, 60.0, 68.0, 86.0, 140.0, 215.0, 301.0, 489.0, 957.0, 2338.0, 6858.0, 26887.0, 137692.0, 539309.0, 266893.0, 48256.0, 11401.0, 3487.0, 1295.0, 567.0, 343.0, 204.0, 153.0, 106.0, 80.0, 43.0, 42.0, 30.0, 29.0, 19.0, 12.0, 10.0, 9.0, 3.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.271484375, -0.2631797790527344, -0.25487518310546875, -0.24657058715820312, -0.2382659912109375, -0.22996139526367188, -0.22165679931640625, -0.21335220336914062, -0.205047607421875, -0.19674301147460938, -0.18843841552734375, -0.18013381958007812, -0.1718292236328125, -0.16352462768554688, -0.15522003173828125, -0.14691543579101562, -0.13861083984375, -0.13030624389648438, -0.12200164794921875, -0.11369705200195312, -0.1053924560546875, -0.09708786010742188, -0.08878326416015625, -0.08047866821289062, -0.072174072265625, -0.06386947631835938, -0.05556488037109375, -0.047260284423828125, -0.0389556884765625, -0.030651092529296875, -0.02234649658203125, -0.014041900634765625, -0.0057373046875, 0.002567291259765625, 0.01087188720703125, 0.019176483154296875, 0.0274810791015625, 0.035785675048828125, 0.04409027099609375, 0.052394866943359375, 0.060699462890625, 0.06900405883789062, 0.07730865478515625, 0.08561325073242188, 0.0939178466796875, 0.10222244262695312, 0.11052703857421875, 0.11883163452148438, 0.12713623046875, 0.13544082641601562, 0.14374542236328125, 0.15205001831054688, 0.1603546142578125, 0.16865921020507812, 0.17696380615234375, 0.18526840209960938, 0.193572998046875, 0.20187759399414062, 0.21018218994140625, 0.21848678588867188, 0.2267913818359375, 0.23509597778320312, 0.24340057373046875, 0.2517051696777344, 0.260009765625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 11.0, 14.0, 23.0, 48.0, 94.0, 104.0, 141.0, 144.0, 117.0, 117.0, 89.0, 44.0, 34.0, 20.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11505126953125, -0.10944652557373047, -0.10384178161621094, -0.0982370376586914, -0.09263229370117188, -0.08702754974365234, -0.08142280578613281, -0.07581806182861328, -0.07021331787109375, -0.06460857391357422, -0.05900382995605469, -0.053399085998535156, -0.047794342041015625, -0.042189598083496094, -0.03658485412597656, -0.03098011016845703, -0.0253753662109375, -0.01977062225341797, -0.014165878295898438, -0.008561134338378906, -0.002956390380859375, 0.0026483535766601562, 0.008253097534179688, 0.013857841491699219, 0.01946258544921875, 0.02506732940673828, 0.030672073364257812, 0.036276817321777344, 0.041881561279296875, 0.047486305236816406, 0.05309104919433594, 0.05869579315185547, 0.064300537109375, 0.06990528106689453, 0.07551002502441406, 0.0811147689819336, 0.08671951293945312, 0.09232425689697266, 0.09792900085449219, 0.10353374481201172, 0.10913848876953125, 0.11474323272705078, 0.12034797668457031, 0.12595272064208984, 0.13155746459960938, 0.1371622085571289, 0.14276695251464844, 0.14837169647216797, 0.1539764404296875, 0.15958118438720703, 0.16518592834472656, 0.1707906723022461, 0.17639541625976562, 0.18200016021728516, 0.1876049041748047, 0.19320964813232422, 0.19881439208984375, 0.20441913604736328, 0.2100238800048828, 0.21562862396240234, 0.22123336791992188, 0.2268381118774414, 0.23244285583496094, 0.23804759979248047, 0.24365234375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 9.0, 7.0, 15.0, 17.0, 27.0, 40.0, 40.0, 56.0, 106.0, 192.0, 375.0, 926.0, 2325.0, 6304.0, 19081.0, 62489.0, 230621.0, 457769.0, 190917.0, 51672.0, 16431.0, 5457.0, 2043.0, 808.0, 347.0, 175.0, 95.0, 55.0, 27.0, 26.0, 19.0, 20.0, 8.0, 13.0, 9.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.16431427001953125, -0.1578521728515625, -0.15139007568359375, -0.144927978515625, -0.13846588134765625, -0.1320037841796875, -0.12554168701171875, -0.11907958984375, -0.11261749267578125, -0.1061553955078125, -0.09969329833984375, -0.093231201171875, -0.08676910400390625, -0.0803070068359375, -0.07384490966796875, -0.0673828125, -0.06092071533203125, -0.0544586181640625, -0.04799652099609375, -0.041534423828125, -0.03507232666015625, -0.0286102294921875, -0.02214813232421875, -0.01568603515625, -0.00922393798828125, -0.0027618408203125, 0.00370025634765625, 0.010162353515625, 0.01662445068359375, 0.0230865478515625, 0.02954864501953125, 0.0360107421875, 0.04247283935546875, 0.0489349365234375, 0.05539703369140625, 0.061859130859375, 0.06832122802734375, 0.0747833251953125, 0.08124542236328125, 0.08770751953125, 0.09416961669921875, 0.1006317138671875, 0.10709381103515625, 0.113555908203125, 0.12001800537109375, 0.1264801025390625, 0.13294219970703125, 0.139404296875, 0.14586639404296875, 0.1523284912109375, 0.15879058837890625, 0.165252685546875, 0.17171478271484375, 0.1781768798828125, 0.18463897705078125, 0.19110107421875, 0.19756317138671875, 0.2040252685546875, 0.21048736572265625, 0.216949462890625, 0.22341156005859375, 0.2298736572265625, 0.23633575439453125, 0.2427978515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 1.0, 8.0, 9.0, 8.0, 6.0, 15.0, 15.0, 16.0, 16.0, 18.0, 29.0, 18.0, 28.0, 37.0, 31.0, 36.0, 41.0, 49.0, 33.0, 42.0, 52.0, 37.0, 47.0, 44.0, 39.0, 37.0, 33.0, 42.0, 23.0, 31.0, 31.0, 30.0, 17.0, 18.0, 18.0, 14.0, 8.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.2109375, -0.20531463623046875, -0.1996917724609375, -0.19406890869140625, -0.188446044921875, -0.18282318115234375, -0.1772003173828125, -0.17157745361328125, -0.16595458984375, -0.16033172607421875, -0.1547088623046875, -0.14908599853515625, -0.143463134765625, -0.13784027099609375, -0.1322174072265625, -0.12659454345703125, -0.1209716796875, -0.11534881591796875, -0.1097259521484375, -0.10410308837890625, -0.098480224609375, -0.09285736083984375, -0.0872344970703125, -0.08161163330078125, -0.07598876953125, -0.07036590576171875, -0.0647430419921875, -0.05912017822265625, -0.053497314453125, -0.04787445068359375, -0.0422515869140625, -0.03662872314453125, -0.031005859375, -0.02538299560546875, -0.0197601318359375, -0.01413726806640625, -0.008514404296875, -0.00289154052734375, 0.0027313232421875, 0.00835418701171875, 0.01397705078125, 0.01959991455078125, 0.0252227783203125, 0.03084564208984375, 0.036468505859375, 0.04209136962890625, 0.0477142333984375, 0.05333709716796875, 0.0589599609375, 0.06458282470703125, 0.0702056884765625, 0.07582855224609375, 0.081451416015625, 0.08707427978515625, 0.0926971435546875, 0.09832000732421875, 0.10394287109375, 0.10956573486328125, 0.1151885986328125, 0.12081146240234375, 0.126434326171875, 0.13205718994140625, 0.1376800537109375, 0.14330291748046875, 0.14892578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 3.0, 8.0, 14.0, 12.0, 23.0, 35.0, 66.0, 125.0, 242.0, 494.0, 1055.0, 2453.0, 6032.0, 17405.0, 59251.0, 196702.0, 378921.0, 260920.0, 86176.0, 24750.0, 8194.0, 3159.0, 1255.0, 590.0, 288.0, 150.0, 93.0, 50.0, 29.0, 13.0, 8.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.038818359375, -0.03736162185668945, -0.035904884338378906, -0.03444814682006836, -0.03299140930175781, -0.031534671783447266, -0.03007793426513672, -0.028621196746826172, -0.027164459228515625, -0.025707721710205078, -0.02425098419189453, -0.022794246673583984, -0.021337509155273438, -0.01988077163696289, -0.018424034118652344, -0.016967296600341797, -0.01551055908203125, -0.014053821563720703, -0.012597084045410156, -0.01114034652709961, -0.009683609008789062, -0.008226871490478516, -0.006770133972167969, -0.005313396453857422, -0.003856658935546875, -0.002399921417236328, -0.0009431838989257812, 0.0005135536193847656, 0.0019702911376953125, 0.0034270286560058594, 0.004883766174316406, 0.006340503692626953, 0.0077972412109375, 0.009253978729248047, 0.010710716247558594, 0.01216745376586914, 0.013624191284179688, 0.015080928802490234, 0.01653766632080078, 0.017994403839111328, 0.019451141357421875, 0.020907878875732422, 0.02236461639404297, 0.023821353912353516, 0.025278091430664062, 0.02673482894897461, 0.028191566467285156, 0.029648303985595703, 0.03110504150390625, 0.0325617790222168, 0.034018516540527344, 0.03547525405883789, 0.03693199157714844, 0.038388729095458984, 0.03984546661376953, 0.04130220413208008, 0.042758941650390625, 0.04421567916870117, 0.04567241668701172, 0.047129154205322266, 0.04858589172363281, 0.05004262924194336, 0.051499366760253906, 0.05295610427856445, 0.054412841796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 7.0, 7.0, 5.0, 8.0, 10.0, 20.0, 25.0, 30.0, 58.0, 56.0, 93.0, 67.0, 106.0, 83.0, 83.0, 76.0, 53.0, 47.0, 46.0, 33.0, 25.0, 17.0, 12.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2040138244628906e-05, -1.171603798866272e-05, -1.1391937732696533e-05, -1.1067837476730347e-05, -1.074373722076416e-05, -1.0419636964797974e-05, -1.0095536708831787e-05, -9.7714364528656e-06, -9.447336196899414e-06, -9.123235940933228e-06, -8.799135684967041e-06, -8.475035429000854e-06, -8.150935173034668e-06, -7.826834917068481e-06, -7.502734661102295e-06, -7.178634405136108e-06, -6.854534149169922e-06, -6.530433893203735e-06, -6.206333637237549e-06, -5.882233381271362e-06, -5.558133125305176e-06, -5.234032869338989e-06, -4.909932613372803e-06, -4.585832357406616e-06, -4.26173210144043e-06, -3.937631845474243e-06, -3.6135315895080566e-06, -3.28943133354187e-06, -2.9653310775756836e-06, -2.641230821609497e-06, -2.3171305656433105e-06, -1.993030309677124e-06, -1.6689300537109375e-06, -1.344829797744751e-06, -1.0207295417785645e-06, -6.966292858123779e-07, -3.725290298461914e-07, -4.842877388000488e-08, 2.7567148208618164e-07, 5.997717380523682e-07, 9.238719940185547e-07, 1.2479722499847412e-06, 1.5720725059509277e-06, 1.8961727619171143e-06, 2.2202730178833008e-06, 2.5443732738494873e-06, 2.868473529815674e-06, 3.1925737857818604e-06, 3.516674041748047e-06, 3.840774297714233e-06, 4.16487455368042e-06, 4.4889748096466064e-06, 4.813075065612793e-06, 5.1371753215789795e-06, 5.461275577545166e-06, 5.7853758335113525e-06, 6.109476089477539e-06, 6.433576345443726e-06, 6.757676601409912e-06, 7.081776857376099e-06, 7.405877113342285e-06, 7.729977369308472e-06, 8.054077625274658e-06, 8.378177881240845e-06, 8.702278137207031e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 11.0, 21.0, 30.0, 71.0, 101.0, 176.0, 406.0, 781.0, 1867.0, 4126.0, 10696.0, 31586.0, 99124.0, 260553.0, 348425.0, 192094.0, 64450.0, 20951.0, 7479.0, 3018.0, 1343.0, 585.0, 301.0, 140.0, 85.0, 58.0, 25.0, 13.0, 9.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.04779052734375, -0.046509742736816406, -0.04522895812988281, -0.04394817352294922, -0.042667388916015625, -0.04138660430908203, -0.04010581970214844, -0.038825035095214844, -0.03754425048828125, -0.036263465881347656, -0.03498268127441406, -0.03370189666748047, -0.032421112060546875, -0.03114032745361328, -0.029859542846679688, -0.028578758239746094, -0.0272979736328125, -0.026017189025878906, -0.024736404418945312, -0.02345561981201172, -0.022174835205078125, -0.02089405059814453, -0.019613265991210938, -0.018332481384277344, -0.01705169677734375, -0.015770912170410156, -0.014490127563476562, -0.013209342956542969, -0.011928558349609375, -0.010647773742675781, -0.009366989135742188, -0.008086204528808594, -0.006805419921875, -0.005524635314941406, -0.0042438507080078125, -0.0029630661010742188, -0.001682281494140625, -0.00040149688720703125, 0.0008792877197265625, 0.0021600723266601562, 0.00344085693359375, 0.004721641540527344, 0.0060024261474609375, 0.007283210754394531, 0.008563995361328125, 0.009844779968261719, 0.011125564575195312, 0.012406349182128906, 0.0136871337890625, 0.014967918395996094, 0.016248703002929688, 0.01752948760986328, 0.018810272216796875, 0.02009105682373047, 0.021371841430664062, 0.022652626037597656, 0.02393341064453125, 0.025214195251464844, 0.026494979858398438, 0.02777576446533203, 0.029056549072265625, 0.03033733367919922, 0.03161811828613281, 0.032898902893066406, 0.0341796875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 15.0, 8.0, 20.0, 35.0, 40.0, 43.0, 63.0, 80.0, 71.0, 103.0, 98.0, 78.0, 73.0, 65.0, 47.0, 36.0, 36.0, 24.0, 21.0, 9.0, 8.0, 10.0, 4.0, 4.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038299560546875, -0.03694438934326172, -0.03558921813964844, -0.034234046936035156, -0.032878875732421875, -0.031523704528808594, -0.030168533325195312, -0.02881336212158203, -0.02745819091796875, -0.02610301971435547, -0.024747848510742188, -0.023392677307128906, -0.022037506103515625, -0.020682334899902344, -0.019327163696289062, -0.01797199249267578, -0.0166168212890625, -0.015261650085449219, -0.013906478881835938, -0.012551307678222656, -0.011196136474609375, -0.009840965270996094, -0.008485794067382812, -0.007130622863769531, -0.00577545166015625, -0.004420280456542969, -0.0030651092529296875, -0.0017099380493164062, -0.000354766845703125, 0.0010004043579101562, 0.0023555755615234375, 0.0037107467651367188, 0.00506591796875, 0.006421089172363281, 0.0077762603759765625, 0.009131431579589844, 0.010486602783203125, 0.011841773986816406, 0.013196945190429688, 0.014552116394042969, 0.01590728759765625, 0.01726245880126953, 0.018617630004882812, 0.019972801208496094, 0.021327972412109375, 0.022683143615722656, 0.024038314819335938, 0.02539348602294922, 0.0267486572265625, 0.02810382843017578, 0.029458999633789062, 0.030814170837402344, 0.032169342041015625, 0.033524513244628906, 0.03487968444824219, 0.03623485565185547, 0.03759002685546875, 0.03894519805908203, 0.04030036926269531, 0.041655540466308594, 0.043010711669921875, 0.044365882873535156, 0.04572105407714844, 0.04707622528076172, 0.048431396484375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 11.0, 19.0, 16.0, 37.0, 73.0, 118.0, 159.0, 177.0, 121.0, 87.0, 68.0, 42.0, 27.0, 15.0, 12.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5792344212532043, -0.5582047700881958, -0.5371750593185425, -0.5161453485488892, -0.4951156973838806, -0.4740860164165497, -0.45305633544921875, -0.4320266544818878, -0.4109969735145569, -0.38996729254722595, -0.368937611579895, -0.3479079306125641, -0.32687824964523315, -0.3058485686779022, -0.2848188877105713, -0.26378920674324036, -0.24275952577590942, -0.2217298448085785, -0.20070016384124756, -0.17967048287391663, -0.1586408019065857, -0.13761112093925476, -0.11658143997192383, -0.0955517590045929, -0.07452207803726196, -0.05349239706993103, -0.0324627161026001, -0.011433035135269165, 0.009596645832061768, 0.0306263267993927, 0.05165600776672363, 0.07268568873405457, 0.0937153697013855, 0.11474505066871643, 0.13577473163604736, 0.1568044126033783, 0.17783409357070923, 0.19886377453804016, 0.2198934555053711, 0.24092313647270203, 0.26195281744003296, 0.2829824984073639, 0.3040121793746948, 0.32504186034202576, 0.3460715413093567, 0.3671012222766876, 0.38813090324401855, 0.4091605842113495, 0.4301902651786804, 0.45121994614601135, 0.4722496271133423, 0.4932793080806732, 0.5143089890480042, 0.5353386402130127, 0.556368350982666, 0.5773980617523193, 0.5984277129173279, 0.6194573640823364, 0.6404870748519897, 0.6615167856216431, 0.6825464367866516, 0.7035760879516602, 0.7246057987213135, 0.7456355094909668, 0.7666651606559753]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 8.0, 9.0, 9.0, 12.0, 22.0, 21.0, 29.0, 40.0, 37.0, 43.0, 68.0, 46.0, 58.0, 56.0, 62.0, 53.0, 50.0, 46.0, 45.0, 52.0, 42.0, 34.0, 26.0, 24.0, 23.0, 20.0, 14.0, 17.0, 13.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4980294704437256, -0.47613757848739624, -0.4542456865310669, -0.43235379457473755, -0.4104619026184082, -0.38857001066207886, -0.3666781187057495, -0.34478622674942017, -0.3228943347930908, -0.3010024428367615, -0.27911055088043213, -0.2572186589241028, -0.23532676696777344, -0.2134348750114441, -0.19154298305511475, -0.1696510910987854, -0.14775919914245605, -0.1258673071861267, -0.10397541522979736, -0.08208352327346802, -0.06019163131713867, -0.038299739360809326, -0.01640784740447998, 0.005484044551849365, 0.02737593650817871, 0.04926782846450806, 0.0711597204208374, 0.09305161237716675, 0.1149435043334961, 0.13683539628982544, 0.15872728824615479, 0.18061918020248413, 0.2025110125541687, 0.22440290451049805, 0.2462947964668274, 0.26818668842315674, 0.2900785803794861, 0.31197047233581543, 0.3338623642921448, 0.3557542562484741, 0.37764614820480347, 0.3995380401611328, 0.42142993211746216, 0.4433218240737915, 0.46521371603012085, 0.4871056079864502, 0.5089974999427795, 0.5308893918991089, 0.5527812838554382, 0.5746731758117676, 0.5965650677680969, 0.6184569597244263, 0.6403488516807556, 0.662240743637085, 0.6841326355934143, 0.7060245275497437, 0.727916419506073, 0.7498083114624023, 0.7717002034187317, 0.793592095375061, 0.8154839873313904, 0.8373758792877197, 0.8592677712440491, 0.8811596632003784, 0.9030515551567078]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 6.0, 8.0, 16.0, 27.0, 33.0, 54.0, 98.0, 176.0, 303.0, 563.0, 1188.0, 2764.0, 10152.0, 56046.0, 2085720.0, 1970130.0, 52773.0, 8871.0, 2603.0, 1164.0, 570.0, 364.0, 205.0, 126.0, 82.0, 59.0, 35.0, 33.0, 27.0, 13.0, 13.0, 15.0, 8.0, 8.0, 3.0, 2.0, 3.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.1765270233154297, -0.16811752319335938, -0.15970802307128906, -0.15129852294921875, -0.14288902282714844, -0.13447952270507812, -0.1260700225830078, -0.1176605224609375, -0.10925102233886719, -0.10084152221679688, -0.09243202209472656, -0.08402252197265625, -0.07561302185058594, -0.06720352172851562, -0.05879402160644531, -0.050384521484375, -0.04197502136230469, -0.033565521240234375, -0.025156021118164062, -0.01674652099609375, -0.008337020874023438, 7.2479248046875e-05, 0.008481979370117188, 0.0168914794921875, 0.025300979614257812, 0.033710479736328125, 0.04211997985839844, 0.05052947998046875, 0.05893898010253906, 0.06734848022460938, 0.07575798034667969, 0.08416748046875, 0.09257698059082031, 0.10098648071289062, 0.10939598083496094, 0.11780548095703125, 0.12621498107910156, 0.13462448120117188, 0.1430339813232422, 0.1514434814453125, 0.1598529815673828, 0.16826248168945312, 0.17667198181152344, 0.18508148193359375, 0.19349098205566406, 0.20190048217773438, 0.2103099822998047, 0.218719482421875, 0.2271289825439453, 0.23553848266601562, 0.24394798278808594, 0.25235748291015625, 0.26076698303222656, 0.2691764831542969, 0.2775859832763672, 0.2859954833984375, 0.2944049835205078, 0.3028144836425781, 0.31122398376464844, 0.31963348388671875, 0.32804298400878906, 0.3364524841308594, 0.3448619842529297, 0.353271484375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 7.0, 14.0, 19.0, 43.0, 56.0, 102.0, 104.0, 150.0, 125.0, 123.0, 100.0, 71.0, 42.0, 26.0, 11.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13720703125, -0.13126754760742188, -0.12532806396484375, -0.11938858032226562, -0.1134490966796875, -0.10750961303710938, -0.10157012939453125, -0.09563064575195312, -0.089691162109375, -0.08375167846679688, -0.07781219482421875, -0.07187271118164062, -0.0659332275390625, -0.059993743896484375, -0.05405426025390625, -0.048114776611328125, -0.04217529296875, -0.036235809326171875, -0.03029632568359375, -0.024356842041015625, -0.0184173583984375, -0.012477874755859375, -0.00653839111328125, -0.000598907470703125, 0.005340576171875, 0.011280059814453125, 0.01721954345703125, 0.023159027099609375, 0.0290985107421875, 0.035037994384765625, 0.04097747802734375, 0.046916961669921875, 0.0528564453125, 0.058795928955078125, 0.06473541259765625, 0.07067489624023438, 0.0766143798828125, 0.08255386352539062, 0.08849334716796875, 0.09443283081054688, 0.100372314453125, 0.10631179809570312, 0.11225128173828125, 0.11819076538085938, 0.1241302490234375, 0.13006973266601562, 0.13600921630859375, 0.14194869995117188, 0.14788818359375, 0.15382766723632812, 0.15976715087890625, 0.16570663452148438, 0.1716461181640625, 0.17758560180664062, 0.18352508544921875, 0.18946456909179688, 0.195404052734375, 0.20134353637695312, 0.20728302001953125, 0.21322250366210938, 0.2191619873046875, 0.22510147094726562, 0.23104095458984375, 0.23698043823242188, 0.242919921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 19.0, 21.0, 29.0, 49.0, 70.0, 155.0, 333.0, 738.0, 2267.0, 11453.0, 138181.0, 3463409.0, 545368.0, 26175.0, 4063.0, 1092.0, 401.0, 210.0, 85.0, 60.0, 36.0, 15.0, 13.0, 8.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.316162109375, -0.30799102783203125, -0.2998199462890625, -0.29164886474609375, -0.283477783203125, -0.27530670166015625, -0.2671356201171875, -0.25896453857421875, -0.25079345703125, -0.24262237548828125, -0.2344512939453125, -0.22628021240234375, -0.218109130859375, -0.20993804931640625, -0.2017669677734375, -0.19359588623046875, -0.1854248046875, -0.17725372314453125, -0.1690826416015625, -0.16091156005859375, -0.152740478515625, -0.14456939697265625, -0.1363983154296875, -0.12822723388671875, -0.12005615234375, -0.11188507080078125, -0.1037139892578125, -0.09554290771484375, -0.087371826171875, -0.07920074462890625, -0.0710296630859375, -0.06285858154296875, -0.0546875, -0.04651641845703125, -0.0383453369140625, -0.03017425537109375, -0.022003173828125, -0.01383209228515625, -0.0056610107421875, 0.00251007080078125, 0.01068115234375, 0.01885223388671875, 0.0270233154296875, 0.03519439697265625, 0.043365478515625, 0.05153656005859375, 0.0597076416015625, 0.06787872314453125, 0.0760498046875, 0.08422088623046875, 0.0923919677734375, 0.10056304931640625, 0.108734130859375, 0.11690521240234375, 0.1250762939453125, 0.13324737548828125, 0.14141845703125, 0.14958953857421875, 0.1577606201171875, 0.16593170166015625, 0.174102783203125, 0.18227386474609375, 0.1904449462890625, 0.19861602783203125, 0.206787109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 7.0, 11.0, 18.0, 30.0, 38.0, 71.0, 88.0, 170.0, 273.0, 461.0, 753.0, 835.0, 521.0, 262.0, 182.0, 125.0, 81.0, 45.0, 25.0, 19.0, 13.0, 12.0, 5.0, 4.0, 6.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1322021484375, -0.12714195251464844, -0.12208175659179688, -0.11702156066894531, -0.11196136474609375, -0.10690116882324219, -0.10184097290039062, -0.09678077697753906, -0.0917205810546875, -0.08666038513183594, -0.08160018920898438, -0.07653999328613281, -0.07147979736328125, -0.06641960144042969, -0.061359405517578125, -0.05629920959472656, -0.051239013671875, -0.04617881774902344, -0.041118621826171875, -0.03605842590332031, -0.03099822998046875, -0.025938034057617188, -0.020877838134765625, -0.015817642211914062, -0.0107574462890625, -0.0056972503662109375, -0.000637054443359375, 0.0044231414794921875, 0.00948333740234375, 0.014543533325195312, 0.019603729248046875, 0.024663925170898438, 0.02972412109375, 0.03478431701660156, 0.039844512939453125, 0.04490470886230469, 0.04996490478515625, 0.05502510070800781, 0.060085296630859375, 0.06514549255371094, 0.0702056884765625, 0.07526588439941406, 0.08032608032226562, 0.08538627624511719, 0.09044647216796875, 0.09550666809082031, 0.10056686401367188, 0.10562705993652344, 0.110687255859375, 0.11574745178222656, 0.12080764770507812, 0.1258678436279297, 0.13092803955078125, 0.1359882354736328, 0.14104843139648438, 0.14610862731933594, 0.1511688232421875, 0.15622901916503906, 0.16128921508789062, 0.1663494110107422, 0.17140960693359375, 0.1764698028564453, 0.18152999877929688, 0.18659019470214844, 0.191650390625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 11.0, 19.0, 29.0, 85.0, 146.0, 186.0, 224.0, 134.0, 89.0, 37.0, 19.0, 8.0, 9.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1359779834747314, -1.1076794862747192, -1.079380989074707, -1.0510824918746948, -1.0227839946746826, -0.9944854974746704, -0.9661870002746582, -0.937888503074646, -0.9095900058746338, -0.8812915086746216, -0.8529930114746094, -0.8246945142745972, -0.796396017074585, -0.7680975198745728, -0.7397990226745605, -0.7115005254745483, -0.6832020282745361, -0.6549035310745239, -0.6266050338745117, -0.5983065366744995, -0.5700080394744873, -0.5417095422744751, -0.5134110450744629, -0.4851125478744507, -0.4568140506744385, -0.42851555347442627, -0.40021705627441406, -0.37191855907440186, -0.34362006187438965, -0.31532156467437744, -0.28702306747436523, -0.258724570274353, -0.23042607307434082, -0.2021275758743286, -0.1738290786743164, -0.1455305814743042, -0.11723208427429199, -0.08893358707427979, -0.06063508987426758, -0.03233659267425537, -0.004038095474243164, 0.024260401725769043, 0.05255889892578125, 0.08085739612579346, 0.10915589332580566, 0.13745439052581787, 0.16575288772583008, 0.19405138492584229, 0.2223498821258545, 0.2506483793258667, 0.2789468765258789, 0.3072453737258911, 0.3355438709259033, 0.3638423681259155, 0.39214086532592773, 0.42043936252593994, 0.44873785972595215, 0.47703635692596436, 0.5053348541259766, 0.5336333513259888, 0.561931848526001, 0.5902303457260132, 0.6185288429260254, 0.6468273401260376, 0.6751258373260498]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 8.0, 10.0, 12.0, 14.0, 9.0, 20.0, 18.0, 27.0, 27.0, 26.0, 29.0, 39.0, 39.0, 53.0, 46.0, 51.0, 62.0, 48.0, 39.0, 31.0, 59.0, 50.0, 48.0, 35.0, 40.0, 30.0, 25.0, 17.0, 20.0, 19.0, 13.0, 16.0, 7.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.4959157109260559, -0.4824906587600708, -0.4690656065940857, -0.4556405544281006, -0.4422155022621155, -0.42879045009613037, -0.4153653681278229, -0.40194031596183777, -0.38851526379585266, -0.37509021162986755, -0.36166515946388245, -0.34824010729789734, -0.33481502532958984, -0.32138997316360474, -0.30796492099761963, -0.2945398688316345, -0.2811148166656494, -0.2676897644996643, -0.2542647123336792, -0.2408396452665329, -0.2274145931005478, -0.21398954093456268, -0.20056447386741638, -0.18713942170143127, -0.17371436953544617, -0.16028931736946106, -0.14686426520347595, -0.13343919813632965, -0.12001414597034454, -0.10658909380435944, -0.09316403418779373, -0.07973897457122803, -0.06631392240524292, -0.052888866513967514, -0.03946381062269211, -0.026038754731416702, -0.012613698840141296, 0.000811353325843811, 0.014236412942409515, 0.02766147255897522, 0.04108652472496033, 0.05451158061623573, 0.06793663650751114, 0.08136169612407684, 0.09478674829006195, 0.10821180045604706, 0.12163686007261276, 0.13506191968917847, 0.14848697185516357, 0.16191202402114868, 0.1753370761871338, 0.1887621432542801, 0.2021871954202652, 0.2156122475862503, 0.2290373146533966, 0.2424623668193817, 0.2558874189853668, 0.26931247115135193, 0.28273752331733704, 0.29616257548332214, 0.30958765745162964, 0.32301270961761475, 0.33643776178359985, 0.34986281394958496, 0.36328786611557007]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 5.0, 14.0, 9.0, 17.0, 27.0, 26.0, 38.0, 41.0, 76.0, 113.0, 127.0, 148.0, 248.0, 345.0, 625.0, 1103.0, 2367.0, 6495.0, 22692.0, 100414.0, 420503.0, 377553.0, 85086.0, 19724.0, 5825.0, 2137.0, 968.0, 614.0, 370.0, 228.0, 161.0, 110.0, 87.0, 55.0, 52.0, 30.0, 25.0, 17.0, 22.0, 18.0, 6.0, 5.0, 7.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.2958984375, -0.2871818542480469, -0.27846527099609375, -0.2697486877441406, -0.2610321044921875, -0.2523155212402344, -0.24359893798828125, -0.23488235473632812, -0.226165771484375, -0.21744918823242188, -0.20873260498046875, -0.20001602172851562, -0.1912994384765625, -0.18258285522460938, -0.17386627197265625, -0.16514968872070312, -0.15643310546875, -0.14771652221679688, -0.13899993896484375, -0.13028335571289062, -0.1215667724609375, -0.11285018920898438, -0.10413360595703125, -0.09541702270507812, -0.086700439453125, -0.07798385620117188, -0.06926727294921875, -0.060550689697265625, -0.0518341064453125, -0.043117523193359375, -0.03440093994140625, -0.025684356689453125, -0.0169677734375, -0.008251190185546875, 0.00046539306640625, 0.009181976318359375, 0.0178985595703125, 0.026615142822265625, 0.03533172607421875, 0.044048309326171875, 0.052764892578125, 0.061481475830078125, 0.07019805908203125, 0.07891464233398438, 0.0876312255859375, 0.09634780883789062, 0.10506439208984375, 0.11378097534179688, 0.12249755859375, 0.13121414184570312, 0.13993072509765625, 0.14864730834960938, 0.1573638916015625, 0.16608047485351562, 0.17479705810546875, 0.18351364135742188, 0.192230224609375, 0.20094680786132812, 0.20966339111328125, 0.21837997436523438, 0.2270965576171875, 0.23581314086914062, 0.24452972412109375, 0.2532463073730469, 0.261962890625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 18.0, 19.0, 36.0, 82.0, 97.0, 135.0, 144.0, 160.0, 109.0, 83.0, 63.0, 33.0, 9.0, 10.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15869140625, -0.15275192260742188, -0.14681243896484375, -0.14087295532226562, -0.1349334716796875, -0.12899398803710938, -0.12305450439453125, -0.11711502075195312, -0.111175537109375, -0.10523605346679688, -0.09929656982421875, -0.09335708618164062, -0.0874176025390625, -0.08147811889648438, -0.07553863525390625, -0.06959915161132812, -0.06365966796875, -0.057720184326171875, -0.05178070068359375, -0.045841217041015625, -0.0399017333984375, -0.033962249755859375, -0.02802276611328125, -0.022083282470703125, -0.016143798828125, -0.010204315185546875, -0.00426483154296875, 0.001674652099609375, 0.0076141357421875, 0.013553619384765625, 0.01949310302734375, 0.025432586669921875, 0.0313720703125, 0.037311553955078125, 0.04325103759765625, 0.049190521240234375, 0.0551300048828125, 0.061069488525390625, 0.06700897216796875, 0.07294845581054688, 0.078887939453125, 0.08482742309570312, 0.09076690673828125, 0.09670639038085938, 0.1026458740234375, 0.10858535766601562, 0.11452484130859375, 0.12046432495117188, 0.12640380859375, 0.13234329223632812, 0.13828277587890625, 0.14422225952148438, 0.1501617431640625, 0.15610122680664062, 0.16204071044921875, 0.16798019409179688, 0.173919677734375, 0.17985916137695312, 0.18579864501953125, 0.19173812866210938, 0.1976776123046875, 0.20361709594726562, 0.20955657958984375, 0.21549606323242188, 0.221435546875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 7.0, 4.0, 10.0, 18.0, 16.0, 31.0, 24.0, 59.0, 87.0, 93.0, 154.0, 239.0, 443.0, 728.0, 1393.0, 2636.0, 5546.0, 12770.0, 31800.0, 90175.0, 249590.0, 366940.0, 181767.0, 62690.0, 22762.0, 9504.0, 4279.0, 2103.0, 1045.0, 587.0, 376.0, 220.0, 131.0, 104.0, 58.0, 42.0, 38.0, 15.0, 18.0, 12.0, 13.0, 11.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1806640625, -0.1754016876220703, -0.17013931274414062, -0.16487693786621094, -0.15961456298828125, -0.15435218811035156, -0.14908981323242188, -0.1438274383544922, -0.1385650634765625, -0.1333026885986328, -0.12804031372070312, -0.12277793884277344, -0.11751556396484375, -0.11225318908691406, -0.10699081420898438, -0.10172843933105469, -0.096466064453125, -0.09120368957519531, -0.08594131469726562, -0.08067893981933594, -0.07541656494140625, -0.07015419006347656, -0.06489181518554688, -0.05962944030761719, -0.0543670654296875, -0.04910469055175781, -0.043842315673828125, -0.03857994079589844, -0.03331756591796875, -0.028055191040039062, -0.022792816162109375, -0.017530441284179688, -0.01226806640625, -0.0070056915283203125, -0.001743316650390625, 0.0035190582275390625, 0.00878143310546875, 0.014043807983398438, 0.019306182861328125, 0.024568557739257812, 0.0298309326171875, 0.03509330749511719, 0.040355682373046875, 0.04561805725097656, 0.05088043212890625, 0.05614280700683594, 0.061405181884765625, 0.06666755676269531, 0.071929931640625, 0.07719230651855469, 0.08245468139648438, 0.08771705627441406, 0.09297943115234375, 0.09824180603027344, 0.10350418090820312, 0.10876655578613281, 0.1140289306640625, 0.11929130554199219, 0.12455368041992188, 0.12981605529785156, 0.13507843017578125, 0.14034080505371094, 0.14560317993164062, 0.1508655548095703, 0.1561279296875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 10.0, 5.0, 7.0, 12.0, 12.0, 15.0, 13.0, 21.0, 20.0, 31.0, 26.0, 43.0, 33.0, 39.0, 39.0, 37.0, 38.0, 45.0, 44.0, 42.0, 45.0, 55.0, 54.0, 30.0, 39.0, 31.0, 34.0, 33.0, 25.0, 25.0, 14.0, 17.0, 14.0, 12.0, 9.0, 7.0, 3.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.1763916015625, -0.1707744598388672, -0.16515731811523438, -0.15954017639160156, -0.15392303466796875, -0.14830589294433594, -0.14268875122070312, -0.1370716094970703, -0.1314544677734375, -0.1258373260498047, -0.12022018432617188, -0.11460304260253906, -0.10898590087890625, -0.10336875915527344, -0.09775161743164062, -0.09213447570800781, -0.086517333984375, -0.08090019226074219, -0.07528305053710938, -0.06966590881347656, -0.06404876708984375, -0.05843162536621094, -0.052814483642578125, -0.04719734191894531, -0.0415802001953125, -0.03596305847167969, -0.030345916748046875, -0.024728775024414062, -0.01911163330078125, -0.013494491577148438, -0.007877349853515625, -0.0022602081298828125, 0.00335693359375, 0.008974075317382812, 0.014591217041015625, 0.020208358764648438, 0.02582550048828125, 0.03144264221191406, 0.037059783935546875, 0.04267692565917969, 0.0482940673828125, 0.05391120910644531, 0.059528350830078125, 0.06514549255371094, 0.07076263427734375, 0.07637977600097656, 0.08199691772460938, 0.08761405944824219, 0.093231201171875, 0.09884834289550781, 0.10446548461914062, 0.11008262634277344, 0.11569976806640625, 0.12131690979003906, 0.12693405151367188, 0.1325511932373047, 0.1381683349609375, 0.1437854766845703, 0.14940261840820312, 0.15501976013183594, 0.16063690185546875, 0.16625404357910156, 0.17187118530273438, 0.1774883270263672, 0.18310546875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 9.0, 21.0, 42.0, 57.0, 107.0, 139.0, 402.0, 958.0, 2773.0, 9974.0, 49496.0, 314016.0, 529960.0, 113948.0, 19419.0, 4654.0, 1448.0, 552.0, 247.0, 137.0, 70.0, 37.0, 30.0, 12.0, 14.0, 7.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0902099609375, -0.08712291717529297, -0.08403587341308594, -0.0809488296508789, -0.07786178588867188, -0.07477474212646484, -0.07168769836425781, -0.06860065460205078, -0.06551361083984375, -0.06242656707763672, -0.05933952331542969, -0.056252479553222656, -0.053165435791015625, -0.050078392028808594, -0.04699134826660156, -0.04390430450439453, -0.0408172607421875, -0.03773021697998047, -0.03464317321777344, -0.031556129455566406, -0.028469085693359375, -0.025382041931152344, -0.022294998168945312, -0.01920795440673828, -0.01612091064453125, -0.013033866882324219, -0.009946823120117188, -0.006859779357910156, -0.003772735595703125, -0.0006856918334960938, 0.0024013519287109375, 0.005488395690917969, 0.008575439453125, 0.011662483215332031, 0.014749526977539062, 0.017836570739746094, 0.020923614501953125, 0.024010658264160156, 0.027097702026367188, 0.03018474578857422, 0.03327178955078125, 0.03635883331298828, 0.03944587707519531, 0.042532920837402344, 0.045619964599609375, 0.048707008361816406, 0.05179405212402344, 0.05488109588623047, 0.0579681396484375, 0.06105518341064453, 0.06414222717285156, 0.0672292709350586, 0.07031631469726562, 0.07340335845947266, 0.07649040222167969, 0.07957744598388672, 0.08266448974609375, 0.08575153350830078, 0.08883857727050781, 0.09192562103271484, 0.09501266479492188, 0.0980997085571289, 0.10118675231933594, 0.10427379608154297, 0.10736083984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 10.0, 6.0, 13.0, 17.0, 15.0, 24.0, 22.0, 26.0, 44.0, 59.0, 28.0, 75.0, 60.0, 74.0, 71.0, 64.0, 42.0, 68.0, 54.0, 37.0, 37.0, 26.0, 27.0, 15.0, 20.0, 13.0, 10.0, 11.0, 9.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.52346420288086e-06, -8.234754204750061e-06, -7.946044206619263e-06, -7.657334208488464e-06, -7.368624210357666e-06, -7.079914212226868e-06, -6.791204214096069e-06, -6.502494215965271e-06, -6.213784217834473e-06, -5.925074219703674e-06, -5.636364221572876e-06, -5.347654223442078e-06, -5.058944225311279e-06, -4.770234227180481e-06, -4.481524229049683e-06, -4.192814230918884e-06, -3.904104232788086e-06, -3.6153942346572876e-06, -3.3266842365264893e-06, -3.037974238395691e-06, -2.7492642402648926e-06, -2.4605542421340942e-06, -2.171844244003296e-06, -1.8831342458724976e-06, -1.5944242477416992e-06, -1.3057142496109009e-06, -1.0170042514801025e-06, -7.282942533493042e-07, -4.3958425521850586e-07, -1.5087425708770752e-07, 1.3783574104309082e-07, 4.2654573917388916e-07, 7.152557373046875e-07, 1.0039657354354858e-06, 1.2926757335662842e-06, 1.5813857316970825e-06, 1.8700957298278809e-06, 2.158805727958679e-06, 2.4475157260894775e-06, 2.736225724220276e-06, 3.0249357223510742e-06, 3.3136457204818726e-06, 3.602355718612671e-06, 3.891065716743469e-06, 4.179775714874268e-06, 4.468485713005066e-06, 4.757195711135864e-06, 5.045905709266663e-06, 5.334615707397461e-06, 5.623325705528259e-06, 5.912035703659058e-06, 6.200745701789856e-06, 6.489455699920654e-06, 6.778165698051453e-06, 7.066875696182251e-06, 7.355585694313049e-06, 7.644295692443848e-06, 7.933005690574646e-06, 8.221715688705444e-06, 8.510425686836243e-06, 8.799135684967041e-06, 9.08784568309784e-06, 9.376555681228638e-06, 9.665265679359436e-06, 9.953975677490234e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 12.0, 12.0, 24.0, 37.0, 57.0, 101.0, 146.0, 238.0, 436.0, 772.0, 1510.0, 3118.0, 7409.0, 19379.0, 59459.0, 201470.0, 411958.0, 234540.0, 70231.0, 22193.0, 8253.0, 3486.0, 1657.0, 850.0, 474.0, 275.0, 151.0, 102.0, 67.0, 52.0, 30.0, 12.0, 16.0, 6.0, 5.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051116943359375, -0.04919290542602539, -0.04726886749267578, -0.04534482955932617, -0.04342079162597656, -0.04149675369262695, -0.039572715759277344, -0.037648677825927734, -0.035724639892578125, -0.033800601959228516, -0.031876564025878906, -0.029952526092529297, -0.028028488159179688, -0.026104450225830078, -0.02418041229248047, -0.02225637435913086, -0.02033233642578125, -0.01840829849243164, -0.01648426055908203, -0.014560222625732422, -0.012636184692382812, -0.010712146759033203, -0.008788108825683594, -0.006864070892333984, -0.004940032958984375, -0.0030159950256347656, -0.0010919570922851562, 0.0008320808410644531, 0.0027561187744140625, 0.004680156707763672, 0.006604194641113281, 0.00852823257446289, 0.0104522705078125, 0.01237630844116211, 0.014300346374511719, 0.016224384307861328, 0.018148422241210938, 0.020072460174560547, 0.021996498107910156, 0.023920536041259766, 0.025844573974609375, 0.027768611907958984, 0.029692649841308594, 0.0316166877746582, 0.03354072570800781, 0.03546476364135742, 0.03738880157470703, 0.03931283950805664, 0.04123687744140625, 0.04316091537475586, 0.04508495330810547, 0.04700899124145508, 0.04893302917480469, 0.0508570671081543, 0.052781105041503906, 0.054705142974853516, 0.056629180908203125, 0.058553218841552734, 0.060477256774902344, 0.06240129470825195, 0.06432533264160156, 0.06624937057495117, 0.06817340850830078, 0.07009744644165039, 0.072021484375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 10.0, 6.0, 8.0, 16.0, 22.0, 21.0, 20.0, 37.0, 36.0, 44.0, 58.0, 76.0, 107.0, 78.0, 97.0, 69.0, 61.0, 62.0, 51.0, 33.0, 24.0, 20.0, 12.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07745361328125, -0.07544183731079102, -0.07343006134033203, -0.07141828536987305, -0.06940650939941406, -0.06739473342895508, -0.0653829574584961, -0.06337118148803711, -0.061359405517578125, -0.05934762954711914, -0.057335853576660156, -0.05532407760620117, -0.05331230163574219, -0.0513005256652832, -0.04928874969482422, -0.047276973724365234, -0.04526519775390625, -0.043253421783447266, -0.04124164581298828, -0.0392298698425293, -0.03721809387207031, -0.03520631790161133, -0.033194541931152344, -0.03118276596069336, -0.029170989990234375, -0.02715921401977539, -0.025147438049316406, -0.023135662078857422, -0.021123886108398438, -0.019112110137939453, -0.01710033416748047, -0.015088558197021484, -0.0130767822265625, -0.011065006256103516, -0.009053230285644531, -0.007041454315185547, -0.0050296783447265625, -0.003017902374267578, -0.0010061264038085938, 0.0010056495666503906, 0.003017425537109375, 0.005029201507568359, 0.007040977478027344, 0.009052753448486328, 0.011064529418945312, 0.013076305389404297, 0.015088081359863281, 0.017099857330322266, 0.01911163330078125, 0.021123409271240234, 0.02313518524169922, 0.025146961212158203, 0.027158737182617188, 0.029170513153076172, 0.031182289123535156, 0.03319406509399414, 0.035205841064453125, 0.03721761703491211, 0.039229393005371094, 0.04124116897583008, 0.04325294494628906, 0.04526472091674805, 0.04727649688720703, 0.049288272857666016, 0.051300048828125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 10.0, 26.0, 58.0, 124.0, 197.0, 231.0, 154.0, 83.0, 45.0, 28.0, 15.0, 7.0, 5.0, 5.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2926026582717896, -1.2587108612060547, -1.2248190641403198, -1.190927267074585, -1.15703547000885, -1.1231436729431152, -1.0892518758773804, -1.0553600788116455, -1.021468162536621, -0.9875763654708862, -0.9536845684051514, -0.9197927713394165, -0.8859009742736816, -0.8520091772079468, -0.8181173205375671, -0.7842255234718323, -0.7503337860107422, -0.7164419889450073, -0.6825501918792725, -0.6486583948135376, -0.6147665977478027, -0.5808748006820679, -0.5469829440116882, -0.5130911469459534, -0.4791993498802185, -0.44530755281448364, -0.4114157557487488, -0.37752392888069153, -0.34363213181495667, -0.3097403347492218, -0.27584850788116455, -0.2419567108154297, -0.20806503295898438, -0.1741732358932495, -0.14028142392635345, -0.106389619410038, -0.07249781489372253, -0.03860601782798767, -0.004714205861091614, 0.029177606105804443, 0.0630694031715393, 0.09696120768785477, 0.13085301220417023, 0.16474482417106628, 0.19863662123680115, 0.232528418302536, 0.26642024517059326, 0.3003120422363281, 0.334203839302063, 0.36809563636779785, 0.4019874334335327, 0.43587926030158997, 0.46977105736732483, 0.5036628246307373, 0.5375546813011169, 0.5714464783668518, 0.6053382754325867, 0.6392300724983215, 0.6731218695640564, 0.7070136666297913, 0.7409055233001709, 0.7747973203659058, 0.8086891174316406, 0.8425809144973755, 0.8764727115631104]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 2.0, 11.0, 12.0, 14.0, 17.0, 28.0, 27.0, 22.0, 29.0, 23.0, 41.0, 59.0, 49.0, 62.0, 52.0, 64.0, 51.0, 64.0, 52.0, 58.0, 44.0, 36.0, 37.0, 33.0, 21.0, 11.0, 25.0, 10.0, 11.0, 10.0, 5.0, 3.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6633507013320923, -0.6390447616577148, -0.6147388815879822, -0.5904330015182495, -0.5661270618438721, -0.5418211221694946, -0.517515242099762, -0.4932093322277069, -0.46890342235565186, -0.4445975124835968, -0.42029160261154175, -0.3959856927394867, -0.37167978286743164, -0.3473738729953766, -0.32306796312332153, -0.2987620532512665, -0.2744561433792114, -0.25015023350715637, -0.22584432363510132, -0.20153841376304626, -0.1772325038909912, -0.15292659401893616, -0.1286206841468811, -0.10431477427482605, -0.080008864402771, -0.05570295453071594, -0.03139704465866089, -0.007091134786605835, 0.01721477508544922, 0.04152068495750427, 0.06582659482955933, 0.09013250470161438, 0.11443835496902466, 0.1387442648410797, 0.16305017471313477, 0.18735608458518982, 0.21166199445724487, 0.23596790432929993, 0.260273814201355, 0.28457972407341003, 0.3088856339454651, 0.33319154381752014, 0.3574974536895752, 0.38180336356163025, 0.4061092734336853, 0.43041518330574036, 0.4547210931777954, 0.47902700304985046, 0.5033329129219055, 0.5276387929916382, 0.5519447326660156, 0.5762506723403931, 0.6005565524101257, 0.6248624324798584, 0.6491683721542358, 0.6734743118286133, 0.697780191898346, 0.7220860719680786, 0.746392011642456, 0.7706979513168335, 0.7950038313865662, 0.8193097114562988, 0.8436156511306763, 0.8679215908050537, 0.8922274708747864]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 1.0, 7.0, 11.0, 8.0, 12.0, 28.0, 26.0, 28.0, 70.0, 96.0, 130.0, 196.0, 363.0, 683.0, 1520.0, 4137.0, 11784.0, 45542.0, 694093.0, 3246615.0, 157474.0, 21362.0, 5633.0, 1917.0, 906.0, 538.0, 313.0, 205.0, 149.0, 109.0, 80.0, 52.0, 43.0, 36.0, 22.0, 21.0, 11.0, 16.0, 8.0, 9.0, 12.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.1978759765625, -0.19112014770507812, -0.18436431884765625, -0.17760848999023438, -0.1708526611328125, -0.16409683227539062, -0.15734100341796875, -0.15058517456054688, -0.143829345703125, -0.13707351684570312, -0.13031768798828125, -0.12356185913085938, -0.1168060302734375, -0.11005020141601562, -0.10329437255859375, -0.09653854370117188, -0.08978271484375, -0.08302688598632812, -0.07627105712890625, -0.06951522827148438, -0.0627593994140625, -0.056003570556640625, -0.04924774169921875, -0.042491912841796875, -0.035736083984375, -0.028980255126953125, -0.02222442626953125, -0.015468597412109375, -0.0087127685546875, -0.001956939697265625, 0.00479888916015625, 0.011554718017578125, 0.018310546875, 0.025066375732421875, 0.03182220458984375, 0.038578033447265625, 0.0453338623046875, 0.052089691162109375, 0.05884552001953125, 0.06560134887695312, 0.072357177734375, 0.07911300659179688, 0.08586883544921875, 0.09262466430664062, 0.0993804931640625, 0.10613632202148438, 0.11289215087890625, 0.11964797973632812, 0.12640380859375, 0.13315963745117188, 0.13991546630859375, 0.14667129516601562, 0.1534271240234375, 0.16018295288085938, 0.16693878173828125, 0.17369461059570312, 0.180450439453125, 0.18720626831054688, 0.19396209716796875, 0.20071792602539062, 0.2074737548828125, 0.21422958374023438, 0.22098541259765625, 0.22774124145507812, 0.2344970703125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 6.0, 9.0, 7.0, 12.0, 36.0, 64.0, 82.0, 127.0, 145.0, 127.0, 140.0, 108.0, 71.0, 35.0, 19.0, 13.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.188232421875, -0.18074798583984375, -0.1732635498046875, -0.16577911376953125, -0.158294677734375, -0.15081024169921875, -0.1433258056640625, -0.13584136962890625, -0.12835693359375, -0.12087249755859375, -0.1133880615234375, -0.10590362548828125, -0.098419189453125, -0.09093475341796875, -0.0834503173828125, -0.07596588134765625, -0.0684814453125, -0.06099700927734375, -0.0535125732421875, -0.04602813720703125, -0.038543701171875, -0.03105926513671875, -0.0235748291015625, -0.01609039306640625, -0.00860595703125, -0.00112152099609375, 0.0063629150390625, 0.01384735107421875, 0.021331787109375, 0.02881622314453125, 0.0363006591796875, 0.04378509521484375, 0.05126953125, 0.05875396728515625, 0.0662384033203125, 0.07372283935546875, 0.081207275390625, 0.08869171142578125, 0.0961761474609375, 0.10366058349609375, 0.11114501953125, 0.11862945556640625, 0.1261138916015625, 0.13359832763671875, 0.141082763671875, 0.14856719970703125, 0.1560516357421875, 0.16353607177734375, 0.1710205078125, 0.17850494384765625, 0.1859893798828125, 0.19347381591796875, 0.200958251953125, 0.20844268798828125, 0.2159271240234375, 0.22341156005859375, 0.23089599609375, 0.23838043212890625, 0.2458648681640625, 0.25334930419921875, 0.260833740234375, 0.26831817626953125, 0.2758026123046875, 0.28328704833984375, 0.290771484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 4.0, 6.0, 11.0, 16.0, 23.0, 20.0, 38.0, 51.0, 76.0, 119.0, 235.0, 360.0, 693.0, 1751.0, 5415.0, 24599.0, 187488.0, 3093365.0, 800930.0, 62779.0, 11020.0, 2935.0, 1075.0, 513.0, 296.0, 154.0, 111.0, 68.0, 48.0, 19.0, 21.0, 14.0, 12.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0], "bins": [-0.271484375, -0.2649822235107422, -0.2584800720214844, -0.25197792053222656, -0.24547576904296875, -0.23897361755371094, -0.23247146606445312, -0.2259693145751953, -0.2194671630859375, -0.2129650115966797, -0.20646286010742188, -0.19996070861816406, -0.19345855712890625, -0.18695640563964844, -0.18045425415039062, -0.1739521026611328, -0.167449951171875, -0.1609477996826172, -0.15444564819335938, -0.14794349670410156, -0.14144134521484375, -0.13493919372558594, -0.12843704223632812, -0.12193489074707031, -0.1154327392578125, -0.10893058776855469, -0.10242843627929688, -0.09592628479003906, -0.08942413330078125, -0.08292198181152344, -0.07641983032226562, -0.06991767883300781, -0.06341552734375, -0.05691337585449219, -0.050411224365234375, -0.04390907287597656, -0.03740692138671875, -0.030904769897460938, -0.024402618408203125, -0.017900466918945312, -0.0113983154296875, -0.0048961639404296875, 0.001605987548828125, 0.008108139038085938, 0.01461029052734375, 0.021112442016601562, 0.027614593505859375, 0.03411674499511719, 0.040618896484375, 0.04712104797363281, 0.053623199462890625, 0.06012535095214844, 0.06662750244140625, 0.07312965393066406, 0.07963180541992188, 0.08613395690917969, 0.0926361083984375, 0.09913825988769531, 0.10564041137695312, 0.11214256286621094, 0.11864471435546875, 0.12514686584472656, 0.13164901733398438, 0.1381511688232422, 0.1446533203125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 8.0, 5.0, 9.0, 11.0, 24.0, 37.0, 51.0, 91.0, 109.0, 230.0, 426.0, 968.0, 1015.0, 448.0, 202.0, 167.0, 91.0, 67.0, 38.0, 22.0, 17.0, 17.0, 8.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14501953125, -0.13811111450195312, -0.13120269775390625, -0.12429428100585938, -0.1173858642578125, -0.11047744750976562, -0.10356903076171875, -0.09666061401367188, -0.089752197265625, -0.08284378051757812, -0.07593536376953125, -0.06902694702148438, -0.0621185302734375, -0.055210113525390625, -0.04830169677734375, -0.041393280029296875, -0.03448486328125, -0.027576446533203125, -0.02066802978515625, -0.013759613037109375, -0.0068511962890625, 5.7220458984375e-05, 0.00696563720703125, 0.013874053955078125, 0.020782470703125, 0.027690887451171875, 0.03459930419921875, 0.041507720947265625, 0.0484161376953125, 0.055324554443359375, 0.06223297119140625, 0.06914138793945312, 0.0760498046875, 0.08295822143554688, 0.08986663818359375, 0.09677505493164062, 0.1036834716796875, 0.11059188842773438, 0.11750030517578125, 0.12440872192382812, 0.131317138671875, 0.13822555541992188, 0.14513397216796875, 0.15204238891601562, 0.1589508056640625, 0.16585922241210938, 0.17276763916015625, 0.17967605590820312, 0.18658447265625, 0.19349288940429688, 0.20040130615234375, 0.20730972290039062, 0.2142181396484375, 0.22112655639648438, 0.22803497314453125, 0.23494338989257812, 0.241851806640625, 0.24876022338867188, 0.25566864013671875, 0.2625770568847656, 0.2694854736328125, 0.2763938903808594, 0.28330230712890625, 0.2902107238769531, 0.297119140625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 12.0, 16.0, 47.0, 72.0, 116.0, 134.0, 178.0, 155.0, 103.0, 62.0, 36.0, 20.0, 16.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6531191468238831, -0.6299659609794617, -0.6068128347396851, -0.5836596488952637, -0.5605065226554871, -0.5373533368110657, -0.5142002105712891, -0.4910470247268677, -0.4678938686847687, -0.4447407126426697, -0.4215875566005707, -0.3984344005584717, -0.3752812147140503, -0.3521280884742737, -0.3289749026298523, -0.3058217465877533, -0.2826685905456543, -0.2595154345035553, -0.2363622784614563, -0.2132091075181961, -0.1900559514760971, -0.1669027954339981, -0.14374962449073792, -0.12059646844863892, -0.09744331240653992, -0.07429015636444092, -0.05113699287176132, -0.027983829379081726, -0.004830673336982727, 0.018322482705116272, 0.041475653648376465, 0.06462880969047546, 0.08778196573257446, 0.11093512177467346, 0.13408827781677246, 0.15724144876003265, 0.18039460480213165, 0.20354776084423065, 0.22670093178749084, 0.24985408782958984, 0.27300724387168884, 0.29616039991378784, 0.31931355595588684, 0.34246671199798584, 0.3656198978424072, 0.38877302408218384, 0.4119262099266052, 0.4350793659687042, 0.4582325220108032, 0.4813856780529022, 0.5045388340950012, 0.5276920199394226, 0.5508451461791992, 0.5739983320236206, 0.597151517868042, 0.6203046441078186, 0.6434577703475952, 0.6666109561920166, 0.6897640824317932, 0.7129172682762146, 0.7360703945159912, 0.7592235803604126, 0.782376766204834, 0.8055298924446106, 0.828683078289032]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 6.0, 5.0, 16.0, 12.0, 20.0, 21.0, 24.0, 31.0, 39.0, 40.0, 48.0, 42.0, 56.0, 57.0, 57.0, 60.0, 66.0, 63.0, 47.0, 49.0, 39.0, 36.0, 35.0, 31.0, 20.0, 20.0, 15.0, 11.0, 8.0, 10.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6468883752822876, -0.6286016702651978, -0.6103149652481079, -0.5920282602310181, -0.5737414956092834, -0.5554547905921936, -0.5371680855751038, -0.5188813805580139, -0.5005946755409241, -0.48230797052383423, -0.464021235704422, -0.44573453068733215, -0.4274478256702423, -0.4091610908508301, -0.39087438583374023, -0.3725876808166504, -0.35430094599723816, -0.3360142409801483, -0.3177275061607361, -0.29944080114364624, -0.2811540961265564, -0.26286739110946655, -0.24458065629005432, -0.22629395127296448, -0.20800723135471344, -0.1897205114364624, -0.17143380641937256, -0.15314708650112152, -0.13486036658287048, -0.11657366156578064, -0.0982869416475296, -0.08000023663043976, -0.06171351671218872, -0.04342680424451828, -0.02514008805155754, -0.006853371858596802, 0.011433340609073639, 0.02972005307674408, 0.04800677299499512, 0.06629347801208496, 0.084580197930336, 0.10286691039800644, 0.12115362286567688, 0.13944034278392792, 0.15772706270217896, 0.1760137677192688, 0.19430048763751984, 0.21258719265460968, 0.23087391257286072, 0.24916063249111176, 0.2674473524093628, 0.28573405742645264, 0.3040207624435425, 0.3223074674606323, 0.34059420228004456, 0.3588809072971344, 0.37716764211654663, 0.3954543471336365, 0.4137410819530487, 0.43202778697013855, 0.4503144919872284, 0.4686012268066406, 0.48688793182373047, 0.5051746368408203, 0.5234613418579102]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 9.0, 17.0, 24.0, 25.0, 43.0, 55.0, 83.0, 151.0, 199.0, 328.0, 638.0, 1235.0, 3470.0, 13488.0, 84182.0, 558238.0, 330973.0, 42535.0, 8204.0, 2378.0, 995.0, 490.0, 299.0, 184.0, 95.0, 71.0, 50.0, 33.0, 28.0, 13.0, 7.0, 9.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.338623046875, -0.3279838562011719, -0.31734466552734375, -0.3067054748535156, -0.2960662841796875, -0.2854270935058594, -0.27478790283203125, -0.2641487121582031, -0.253509521484375, -0.24287033081054688, -0.23223114013671875, -0.22159194946289062, -0.2109527587890625, -0.20031356811523438, -0.18967437744140625, -0.17903518676757812, -0.16839599609375, -0.15775680541992188, -0.14711761474609375, -0.13647842407226562, -0.1258392333984375, -0.11520004272460938, -0.10456085205078125, -0.09392166137695312, -0.083282470703125, -0.07264328002929688, -0.06200408935546875, -0.051364898681640625, -0.0407257080078125, -0.030086517333984375, -0.01944732666015625, -0.008808135986328125, 0.0018310546875, 0.012470245361328125, 0.02310943603515625, 0.033748626708984375, 0.0443878173828125, 0.055027008056640625, 0.06566619873046875, 0.07630538940429688, 0.086944580078125, 0.09758377075195312, 0.10822296142578125, 0.11886215209960938, 0.1295013427734375, 0.14014053344726562, 0.15077972412109375, 0.16141891479492188, 0.17205810546875, 0.18269729614257812, 0.19333648681640625, 0.20397567749023438, 0.2146148681640625, 0.22525405883789062, 0.23589324951171875, 0.24653244018554688, 0.257171630859375, 0.2678108215332031, 0.27845001220703125, 0.2890892028808594, 0.2997283935546875, 0.3103675842285156, 0.32100677490234375, 0.3316459655761719, 0.34228515625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 12.0, 15.0, 33.0, 50.0, 78.0, 122.0, 154.0, 164.0, 124.0, 113.0, 79.0, 31.0, 15.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1966552734375, -0.1894245147705078, -0.18219375610351562, -0.17496299743652344, -0.16773223876953125, -0.16050148010253906, -0.15327072143554688, -0.1460399627685547, -0.1388092041015625, -0.1315784454345703, -0.12434768676757812, -0.11711692810058594, -0.10988616943359375, -0.10265541076660156, -0.09542465209960938, -0.08819389343261719, -0.080963134765625, -0.07373237609863281, -0.06650161743164062, -0.05927085876464844, -0.05204010009765625, -0.04480934143066406, -0.037578582763671875, -0.030347824096679688, -0.0231170654296875, -0.015886306762695312, -0.008655548095703125, -0.0014247894287109375, 0.00580596923828125, 0.013036727905273438, 0.020267486572265625, 0.027498245239257812, 0.03472900390625, 0.04195976257324219, 0.049190521240234375, 0.05642127990722656, 0.06365203857421875, 0.07088279724121094, 0.07811355590820312, 0.08534431457519531, 0.0925750732421875, 0.09980583190917969, 0.10703659057617188, 0.11426734924316406, 0.12149810791015625, 0.12872886657714844, 0.13595962524414062, 0.1431903839111328, 0.150421142578125, 0.1576519012451172, 0.16488265991210938, 0.17211341857910156, 0.17934417724609375, 0.18657493591308594, 0.19380569458007812, 0.2010364532470703, 0.2082672119140625, 0.2154979705810547, 0.22272872924804688, 0.22995948791503906, 0.23719024658203125, 0.24442100524902344, 0.2516517639160156, 0.2588825225830078, 0.26611328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 6.0, 3.0, 7.0, 10.0, 12.0, 15.0, 29.0, 47.0, 52.0, 99.0, 147.0, 268.0, 520.0, 1200.0, 3090.0, 8843.0, 32217.0, 151182.0, 536503.0, 244894.0, 49537.0, 12765.0, 4098.0, 1500.0, 710.0, 341.0, 172.0, 93.0, 62.0, 41.0, 23.0, 17.0, 24.0, 5.0, 8.0, 6.0, 7.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24072265625, -0.23286819458007812, -0.22501373291015625, -0.21715927124023438, -0.2093048095703125, -0.20145034790039062, -0.19359588623046875, -0.18574142456054688, -0.177886962890625, -0.17003250122070312, -0.16217803955078125, -0.15432357788085938, -0.1464691162109375, -0.13861465454101562, -0.13076019287109375, -0.12290573120117188, -0.11505126953125, -0.10719680786132812, -0.09934234619140625, -0.09148788452148438, -0.0836334228515625, -0.07577896118164062, -0.06792449951171875, -0.060070037841796875, -0.052215576171875, -0.044361114501953125, -0.03650665283203125, -0.028652191162109375, -0.0207977294921875, -0.012943267822265625, -0.00508880615234375, 0.002765655517578125, 0.0106201171875, 0.018474578857421875, 0.02632904052734375, 0.034183502197265625, 0.0420379638671875, 0.049892425537109375, 0.05774688720703125, 0.06560134887695312, 0.073455810546875, 0.08131027221679688, 0.08916473388671875, 0.09701919555664062, 0.1048736572265625, 0.11272811889648438, 0.12058258056640625, 0.12843704223632812, 0.13629150390625, 0.14414596557617188, 0.15200042724609375, 0.15985488891601562, 0.1677093505859375, 0.17556381225585938, 0.18341827392578125, 0.19127273559570312, 0.199127197265625, 0.20698165893554688, 0.21483612060546875, 0.22269058227539062, 0.2305450439453125, 0.23839950561523438, 0.24625396728515625, 0.2541084289550781, 0.261962890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 5.0, 8.0, 17.0, 11.0, 18.0, 19.0, 21.0, 23.0, 37.0, 35.0, 43.0, 48.0, 53.0, 56.0, 53.0, 55.0, 67.0, 59.0, 42.0, 57.0, 48.0, 33.0, 28.0, 35.0, 17.0, 22.0, 21.0, 12.0, 10.0, 13.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.2678680419921875, -0.259613037109375, -0.2513580322265625, -0.24310302734375, -0.2348480224609375, -0.226593017578125, -0.2183380126953125, -0.2100830078125, -0.2018280029296875, -0.193572998046875, -0.1853179931640625, -0.17706298828125, -0.1688079833984375, -0.160552978515625, -0.1522979736328125, -0.14404296875, -0.1357879638671875, -0.127532958984375, -0.1192779541015625, -0.11102294921875, -0.1027679443359375, -0.094512939453125, -0.0862579345703125, -0.0780029296875, -0.0697479248046875, -0.061492919921875, -0.0532379150390625, -0.04498291015625, -0.0367279052734375, -0.028472900390625, -0.0202178955078125, -0.011962890625, -0.0037078857421875, 0.004547119140625, 0.0128021240234375, 0.02105712890625, 0.0293121337890625, 0.037567138671875, 0.0458221435546875, 0.0540771484375, 0.0623321533203125, 0.070587158203125, 0.0788421630859375, 0.08709716796875, 0.0953521728515625, 0.103607177734375, 0.1118621826171875, 0.1201171875, 0.1283721923828125, 0.136627197265625, 0.1448822021484375, 0.15313720703125, 0.1613922119140625, 0.169647216796875, 0.1779022216796875, 0.1861572265625, 0.1944122314453125, 0.202667236328125, 0.2109222412109375, 0.21917724609375, 0.2274322509765625, 0.235687255859375, 0.2439422607421875, 0.252197265625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 10.0, 16.0, 24.0, 22.0, 31.0, 44.0, 51.0, 109.0, 125.0, 212.0, 343.0, 531.0, 1045.0, 1768.0, 3407.0, 6460.0, 13557.0, 29219.0, 72330.0, 212467.0, 395842.0, 192368.0, 65686.0, 26875.0, 12502.0, 6149.0, 3116.0, 1711.0, 955.0, 579.0, 374.0, 215.0, 129.0, 96.0, 63.0, 30.0, 32.0, 16.0, 9.0, 11.0, 7.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.057830810546875, -0.05604887008666992, -0.054266929626464844, -0.052484989166259766, -0.05070304870605469, -0.04892110824584961, -0.04713916778564453, -0.04535722732543945, -0.043575286865234375, -0.0417933464050293, -0.04001140594482422, -0.03822946548461914, -0.03644752502441406, -0.034665584564208984, -0.032883644104003906, -0.031101703643798828, -0.02931976318359375, -0.027537822723388672, -0.025755882263183594, -0.023973941802978516, -0.022192001342773438, -0.02041006088256836, -0.01862812042236328, -0.016846179962158203, -0.015064239501953125, -0.013282299041748047, -0.011500358581542969, -0.00971841812133789, -0.007936477661132812, -0.006154537200927734, -0.004372596740722656, -0.002590656280517578, -0.0008087158203125, 0.0009732246398925781, 0.0027551651000976562, 0.004537105560302734, 0.0063190460205078125, 0.00810098648071289, 0.009882926940917969, 0.011664867401123047, 0.013446807861328125, 0.015228748321533203, 0.01701068878173828, 0.01879262924194336, 0.020574569702148438, 0.022356510162353516, 0.024138450622558594, 0.025920391082763672, 0.02770233154296875, 0.029484272003173828, 0.031266212463378906, 0.033048152923583984, 0.03483009338378906, 0.03661203384399414, 0.03839397430419922, 0.0401759147644043, 0.041957855224609375, 0.04373979568481445, 0.04552173614501953, 0.04730367660522461, 0.04908561706542969, 0.050867557525634766, 0.052649497985839844, 0.05443143844604492, 0.05621337890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 13.0, 9.0, 12.0, 8.0, 26.0, 37.0, 41.0, 63.0, 82.0, 109.0, 149.0, 130.0, 97.0, 66.0, 47.0, 32.0, 25.0, 10.0, 15.0, 9.0, 9.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8358230590820312e-05, -1.7793849110603333e-05, -1.7229467630386353e-05, -1.6665086150169373e-05, -1.6100704669952393e-05, -1.5536323189735413e-05, -1.4971941709518433e-05, -1.4407560229301453e-05, -1.3843178749084473e-05, -1.3278797268867493e-05, -1.2714415788650513e-05, -1.2150034308433533e-05, -1.1585652828216553e-05, -1.1021271347999573e-05, -1.0456889867782593e-05, -9.892508387565613e-06, -9.328126907348633e-06, -8.763745427131653e-06, -8.199363946914673e-06, -7.634982466697693e-06, -7.070600986480713e-06, -6.506219506263733e-06, -5.941838026046753e-06, -5.377456545829773e-06, -4.813075065612793e-06, -4.248693585395813e-06, -3.684312105178833e-06, -3.119930624961853e-06, -2.555549144744873e-06, -1.991167664527893e-06, -1.426786184310913e-06, -8.624047040939331e-07, -2.980232238769531e-07, 2.6635825634002686e-07, 8.307397365570068e-07, 1.3951212167739868e-06, 1.959502696990967e-06, 2.5238841772079468e-06, 3.0882656574249268e-06, 3.6526471376419067e-06, 4.217028617858887e-06, 4.781410098075867e-06, 5.345791578292847e-06, 5.910173058509827e-06, 6.474554538726807e-06, 7.038936018943787e-06, 7.603317499160767e-06, 8.167698979377747e-06, 8.732080459594727e-06, 9.296461939811707e-06, 9.860843420028687e-06, 1.0425224900245667e-05, 1.0989606380462646e-05, 1.1553987860679626e-05, 1.2118369340896606e-05, 1.2682750821113586e-05, 1.3247132301330566e-05, 1.3811513781547546e-05, 1.4375895261764526e-05, 1.4940276741981506e-05, 1.5504658222198486e-05, 1.6069039702415466e-05, 1.6633421182632446e-05, 1.7197802662849426e-05, 1.7762184143066406e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 8.0, 7.0, 9.0, 18.0, 28.0, 34.0, 49.0, 74.0, 110.0, 176.0, 260.0, 448.0, 777.0, 1336.0, 2523.0, 5092.0, 11275.0, 28795.0, 95868.0, 397085.0, 368892.0, 87237.0, 27006.0, 10755.0, 5004.0, 2414.0, 1332.0, 696.0, 437.0, 281.0, 170.0, 105.0, 67.0, 61.0, 32.0, 23.0, 22.0, 12.0, 8.0, 10.0, 2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.07135009765625, -0.0690460205078125, -0.066741943359375, -0.0644378662109375, -0.0621337890625, -0.0598297119140625, -0.057525634765625, -0.0552215576171875, -0.05291748046875, -0.0506134033203125, -0.048309326171875, -0.0460052490234375, -0.043701171875, -0.0413970947265625, -0.039093017578125, -0.0367889404296875, -0.03448486328125, -0.0321807861328125, -0.029876708984375, -0.0275726318359375, -0.0252685546875, -0.0229644775390625, -0.020660400390625, -0.0183563232421875, -0.01605224609375, -0.0137481689453125, -0.011444091796875, -0.0091400146484375, -0.0068359375, -0.0045318603515625, -0.002227783203125, 7.62939453125e-05, 0.00238037109375, 0.0046844482421875, 0.006988525390625, 0.0092926025390625, 0.0115966796875, 0.0139007568359375, 0.016204833984375, 0.0185089111328125, 0.02081298828125, 0.0231170654296875, 0.025421142578125, 0.0277252197265625, 0.030029296875, 0.0323333740234375, 0.034637451171875, 0.0369415283203125, 0.03924560546875, 0.0415496826171875, 0.043853759765625, 0.0461578369140625, 0.0484619140625, 0.0507659912109375, 0.053070068359375, 0.0553741455078125, 0.05767822265625, 0.0599822998046875, 0.062286376953125, 0.0645904541015625, 0.06689453125, 0.0691986083984375, 0.071502685546875, 0.0738067626953125, 0.07611083984375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 6.0, 4.0, 7.0, 6.0, 9.0, 10.0, 12.0, 15.0, 19.0, 16.0, 25.0, 39.0, 51.0, 56.0, 81.0, 105.0, 100.0, 81.0, 68.0, 66.0, 48.0, 30.0, 30.0, 23.0, 16.0, 20.0, 8.0, 14.0, 4.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08428955078125, -0.08176708221435547, -0.07924461364746094, -0.0767221450805664, -0.07419967651367188, -0.07167720794677734, -0.06915473937988281, -0.06663227081298828, -0.06410980224609375, -0.06158733367919922, -0.05906486511230469, -0.056542396545410156, -0.054019927978515625, -0.051497459411621094, -0.04897499084472656, -0.04645252227783203, -0.0439300537109375, -0.04140758514404297, -0.03888511657714844, -0.036362648010253906, -0.033840179443359375, -0.031317710876464844, -0.028795242309570312, -0.02627277374267578, -0.02375030517578125, -0.02122783660888672, -0.018705368041992188, -0.016182899475097656, -0.013660430908203125, -0.011137962341308594, -0.008615493774414062, -0.006093025207519531, -0.003570556640625, -0.0010480880737304688, 0.0014743804931640625, 0.003996849060058594, 0.006519317626953125, 0.009041786193847656, 0.011564254760742188, 0.014086723327636719, 0.01660919189453125, 0.01913166046142578, 0.021654129028320312, 0.024176597595214844, 0.026699066162109375, 0.029221534729003906, 0.03174400329589844, 0.03426647186279297, 0.0367889404296875, 0.03931140899658203, 0.04183387756347656, 0.044356346130371094, 0.046878814697265625, 0.049401283264160156, 0.05192375183105469, 0.05444622039794922, 0.05696868896484375, 0.05949115753173828, 0.06201362609863281, 0.06453609466552734, 0.06705856323242188, 0.0695810317993164, 0.07210350036621094, 0.07462596893310547, 0.0771484375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 10.0, 35.0, 164.0, 386.0, 278.0, 83.0, 32.0, 12.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.375499963760376, -1.309369444847107, -1.243238925933838, -1.1771085262298584, -1.1109780073165894, -1.0448474884033203, -0.978717029094696, -0.9125865697860718, -0.8464560508728027, -0.7803255319595337, -0.7141950726509094, -0.6480646133422852, -0.5819340944290161, -0.5158035755157471, -0.4496731162071228, -0.38354262709617615, -0.3174121379852295, -0.25128164887428284, -0.18515115976333618, -0.11902067065238953, -0.05289018154144287, 0.013240307569503784, 0.07937079668045044, 0.1455012857913971, 0.21163177490234375, 0.2777622640132904, 0.34389275312423706, 0.4100232422351837, 0.47615373134613037, 0.5422842502593994, 0.6084147095680237, 0.674545168876648, 0.7406759262084961, 0.8068064451217651, 0.8729369044303894, 0.9390673637390137, 1.0051978826522827, 1.0713284015655518, 1.1374588012695312, 1.2035893201828003, 1.2697198390960693, 1.3358503580093384, 1.4019808769226074, 1.468111276626587, 1.534241795539856, 1.600372314453125, 1.6665027141571045, 1.7326332330703735, 1.7987637519836426, 1.8648942708969116, 1.9310247898101807, 1.9971551895141602, 2.0632858276367188, 2.1294162273406982, 2.1955466270446777, 2.2616772651672363, 2.327807664871216, 2.3939380645751953, 2.460068702697754, 2.5261991024017334, 2.592329502105713, 2.6584601402282715, 2.724590539932251, 2.7907211780548096, 2.856851577758789]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 6.0, 8.0, 6.0, 15.0, 10.0, 15.0, 14.0, 15.0, 22.0, 28.0, 27.0, 33.0, 29.0, 29.0, 33.0, 26.0, 32.0, 39.0, 38.0, 46.0, 35.0, 39.0, 48.0, 36.0, 47.0, 35.0, 32.0, 29.0, 26.0, 24.0, 26.0, 20.0, 23.0, 26.0, 14.0, 17.0, 14.0, 7.0, 6.0, 6.0, 11.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7356966733932495, -0.7147986888885498, -0.6939006447792053, -0.6730026006698608, -0.6521046161651611, -0.6312066316604614, -0.6103085875511169, -0.5894105434417725, -0.5685125589370728, -0.547614574432373, -0.5267165303230286, -0.5058184862136841, -0.4849205017089844, -0.4640224874019623, -0.4431244730949402, -0.4222264587879181, -0.401328444480896, -0.3804304301738739, -0.3595324158668518, -0.3386344015598297, -0.3177363872528076, -0.2968383729457855, -0.2759403586387634, -0.25504234433174133, -0.23414433002471924, -0.21324631571769714, -0.19234830141067505, -0.17145028710365295, -0.15055227279663086, -0.12965425848960876, -0.10875624418258667, -0.08785822987556458, -0.0669601559638977, -0.04606214165687561, -0.025164127349853516, -0.004266113042831421, 0.016631901264190674, 0.03752991557121277, 0.05842792987823486, 0.07932594418525696, 0.10022395849227905, 0.12112197279930115, 0.14201998710632324, 0.16291800141334534, 0.18381601572036743, 0.20471403002738953, 0.22561204433441162, 0.24651005864143372, 0.2674080729484558, 0.2883060872554779, 0.3092041015625, 0.3301021158695221, 0.3510001301765442, 0.3718981444835663, 0.3927961587905884, 0.4136941730976105, 0.43459218740463257, 0.45549020171165466, 0.47638821601867676, 0.49728623032569885, 0.518184244632721, 0.5390822887420654, 0.5599802732467651, 0.5808782577514648, 0.6017763018608093]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 6.0, 11.0, 7.0, 26.0, 29.0, 32.0, 58.0, 89.0, 161.0, 299.0, 499.0, 1153.0, 2963.0, 8365.0, 35434.0, 372711.0, 3510763.0, 225945.0, 24901.0, 6116.0, 2148.0, 973.0, 581.0, 301.0, 219.0, 135.0, 99.0, 68.0, 47.0, 36.0, 30.0, 26.0, 11.0, 12.0, 4.0, 6.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18896484375, -0.1815338134765625, -0.174102783203125, -0.1666717529296875, -0.15924072265625, -0.1518096923828125, -0.144378662109375, -0.1369476318359375, -0.1295166015625, -0.1220855712890625, -0.114654541015625, -0.1072235107421875, -0.09979248046875, -0.0923614501953125, -0.084930419921875, -0.0774993896484375, -0.070068359375, -0.0626373291015625, -0.055206298828125, -0.0477752685546875, -0.04034423828125, -0.0329132080078125, -0.025482177734375, -0.0180511474609375, -0.0106201171875, -0.0031890869140625, 0.004241943359375, 0.0116729736328125, 0.01910400390625, 0.0265350341796875, 0.033966064453125, 0.0413970947265625, 0.048828125, 0.0562591552734375, 0.063690185546875, 0.0711212158203125, 0.07855224609375, 0.0859832763671875, 0.093414306640625, 0.1008453369140625, 0.1082763671875, 0.1157073974609375, 0.123138427734375, 0.1305694580078125, 0.13800048828125, 0.1454315185546875, 0.152862548828125, 0.1602935791015625, 0.167724609375, 0.1751556396484375, 0.182586669921875, 0.1900177001953125, 0.19744873046875, 0.2048797607421875, 0.212310791015625, 0.2197418212890625, 0.2271728515625, 0.2346038818359375, 0.242034912109375, 0.2494659423828125, 0.25689697265625, 0.2643280029296875, 0.271759033203125, 0.2791900634765625, 0.28662109375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 8.0, 11.0, 26.0, 58.0, 68.0, 96.0, 138.0, 132.0, 141.0, 102.0, 92.0, 61.0, 32.0, 21.0, 10.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2021484375, -0.19429397583007812, -0.18643951416015625, -0.17858505249023438, -0.1707305908203125, -0.16287612915039062, -0.15502166748046875, -0.14716720581054688, -0.139312744140625, -0.13145828247070312, -0.12360382080078125, -0.11574935913085938, -0.1078948974609375, -0.10004043579101562, -0.09218597412109375, -0.08433151245117188, -0.07647705078125, -0.06862258911132812, -0.06076812744140625, -0.052913665771484375, -0.0450592041015625, -0.037204742431640625, -0.02935028076171875, -0.021495819091796875, -0.013641357421875, -0.005786895751953125, 0.00206756591796875, 0.009922027587890625, 0.0177764892578125, 0.025630950927734375, 0.03348541259765625, 0.041339874267578125, 0.0491943359375, 0.057048797607421875, 0.06490325927734375, 0.07275772094726562, 0.0806121826171875, 0.08846664428710938, 0.09632110595703125, 0.10417556762695312, 0.112030029296875, 0.11988449096679688, 0.12773895263671875, 0.13559341430664062, 0.1434478759765625, 0.15130233764648438, 0.15915679931640625, 0.16701126098632812, 0.17486572265625, 0.18272018432617188, 0.19057464599609375, 0.19842910766601562, 0.2062835693359375, 0.21413803100585938, 0.22199249267578125, 0.22984695434570312, 0.237701416015625, 0.24555587768554688, 0.25341033935546875, 0.2612648010253906, 0.2691192626953125, 0.2769737243652344, 0.28482818603515625, 0.2926826477050781, 0.300537109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 8.0, 2.0, 8.0, 11.0, 15.0, 24.0, 37.0, 72.0, 81.0, 144.0, 190.0, 325.0, 442.0, 808.0, 1592.0, 3388.0, 9660.0, 32993.0, 157646.0, 1443072.0, 2252471.0, 226835.0, 44109.0, 11945.0, 4152.0, 1820.0, 882.0, 568.0, 317.0, 224.0, 148.0, 98.0, 61.0, 38.0, 26.0, 36.0, 15.0, 3.0, 7.0, 6.0, 4.0, 7.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.155517578125, -0.15035057067871094, -0.14518356323242188, -0.1400165557861328, -0.13484954833984375, -0.1296825408935547, -0.12451553344726562, -0.11934852600097656, -0.1141815185546875, -0.10901451110839844, -0.10384750366210938, -0.09868049621582031, -0.09351348876953125, -0.08834648132324219, -0.08317947387695312, -0.07801246643066406, -0.072845458984375, -0.06767845153808594, -0.06251144409179688, -0.05734443664550781, -0.05217742919921875, -0.04701042175292969, -0.041843414306640625, -0.03667640686035156, -0.0315093994140625, -0.026342391967773438, -0.021175384521484375, -0.016008377075195312, -0.01084136962890625, -0.0056743621826171875, -0.000507354736328125, 0.0046596527099609375, 0.00982666015625, 0.014993667602539062, 0.020160675048828125, 0.025327682495117188, 0.03049468994140625, 0.03566169738769531, 0.040828704833984375, 0.04599571228027344, 0.0511627197265625, 0.05632972717285156, 0.061496734619140625, 0.06666374206542969, 0.07183074951171875, 0.07699775695800781, 0.08216476440429688, 0.08733177185058594, 0.092498779296875, 0.09766578674316406, 0.10283279418945312, 0.10799980163574219, 0.11316680908203125, 0.11833381652832031, 0.12350082397460938, 0.12866783142089844, 0.1338348388671875, 0.13900184631347656, 0.14416885375976562, 0.1493358612060547, 0.15450286865234375, 0.1596698760986328, 0.16483688354492188, 0.17000389099121094, 0.1751708984375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 7.0, 13.0, 14.0, 18.0, 27.0, 51.0, 50.0, 71.0, 120.0, 175.0, 284.0, 591.0, 927.0, 698.0, 325.0, 206.0, 142.0, 86.0, 65.0, 61.0, 49.0, 28.0, 14.0, 17.0, 10.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1363525390625, -0.1303253173828125, -0.124298095703125, -0.1182708740234375, -0.11224365234375, -0.1062164306640625, -0.100189208984375, -0.0941619873046875, -0.088134765625, -0.0821075439453125, -0.076080322265625, -0.0700531005859375, -0.06402587890625, -0.0579986572265625, -0.051971435546875, -0.0459442138671875, -0.0399169921875, -0.0338897705078125, -0.027862548828125, -0.0218353271484375, -0.01580810546875, -0.0097808837890625, -0.003753662109375, 0.0022735595703125, 0.00830078125, 0.0143280029296875, 0.020355224609375, 0.0263824462890625, 0.03240966796875, 0.0384368896484375, 0.044464111328125, 0.0504913330078125, 0.0565185546875, 0.0625457763671875, 0.068572998046875, 0.0746002197265625, 0.08062744140625, 0.0866546630859375, 0.092681884765625, 0.0987091064453125, 0.104736328125, 0.1107635498046875, 0.116790771484375, 0.1228179931640625, 0.12884521484375, 0.1348724365234375, 0.140899658203125, 0.1469268798828125, 0.1529541015625, 0.1589813232421875, 0.165008544921875, 0.1710357666015625, 0.17706298828125, 0.1830902099609375, 0.189117431640625, 0.1951446533203125, 0.201171875, 0.2071990966796875, 0.213226318359375, 0.2192535400390625, 0.22528076171875, 0.2313079833984375, 0.237335205078125, 0.2433624267578125, 0.2493896484375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 15.0, 18.0, 41.0, 76.0, 113.0, 146.0, 145.0, 149.0, 102.0, 66.0, 46.0, 28.0, 25.0, 9.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0051913261413574, -0.9789215326309204, -0.9526517391204834, -0.9263820052146912, -0.9001122117042542, -0.8738424181938171, -0.8475726842880249, -0.8213028907775879, -0.7950330972671509, -0.7687633037567139, -0.7424935102462769, -0.7162237763404846, -0.6899539828300476, -0.6636841893196106, -0.6374144554138184, -0.6111446619033813, -0.5848748683929443, -0.5586050748825073, -0.5323352813720703, -0.5060655474662781, -0.47979575395584106, -0.45352596044540405, -0.42725619673728943, -0.4009864330291748, -0.3747166395187378, -0.3484468460083008, -0.32217708230018616, -0.29590731859207153, -0.2696375250816345, -0.2433677464723587, -0.21709796786308289, -0.19082818925380707, -0.16455847024917603, -0.1382886916399002, -0.11201891303062439, -0.08574913442134857, -0.059479355812072754, -0.033209577202796936, -0.006939798593521118, 0.0193299800157547, 0.04559975862503052, 0.07186953723430634, 0.09813931584358215, 0.12440909445285797, 0.1506788730621338, 0.1769486516714096, 0.20321843028068542, 0.22948820888996124, 0.25575798749923706, 0.2820277810096741, 0.3082975447177887, 0.3345673084259033, 0.36083710193634033, 0.38710689544677734, 0.41337665915489197, 0.4396464228630066, 0.4659162163734436, 0.4921860098838806, 0.5184557437896729, 0.5447255373001099, 0.5709953308105469, 0.5972651243209839, 0.6235349178314209, 0.6498046517372131, 0.6760744452476501]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 5.0, 9.0, 13.0, 11.0, 11.0, 13.0, 16.0, 17.0, 18.0, 25.0, 28.0, 24.0, 24.0, 41.0, 42.0, 41.0, 37.0, 40.0, 47.0, 45.0, 41.0, 30.0, 40.0, 50.0, 36.0, 30.0, 34.0, 23.0, 36.0, 23.0, 20.0, 19.0, 15.0, 14.0, 14.0, 11.0, 7.0, 7.0, 12.0, 5.0, 7.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0], "bins": [-0.49532490968704224, -0.48124873638153076, -0.4671725332736969, -0.4530963599681854, -0.43902018666267395, -0.4249439835548401, -0.4108678102493286, -0.39679163694381714, -0.3827154338359833, -0.3686392605304718, -0.35456305742263794, -0.34048688411712646, -0.326410710811615, -0.31233450770378113, -0.29825833439826965, -0.2841821312904358, -0.2701059579849243, -0.25602978467941284, -0.24195359647274017, -0.2278774082660675, -0.21380122005939484, -0.19972503185272217, -0.1856488585472107, -0.17157267034053802, -0.15749651193618774, -0.14342032372951508, -0.1293441504240036, -0.11526796221733093, -0.10119177401065826, -0.08711559325456619, -0.07303941249847412, -0.05896322429180145, -0.044887036085128784, -0.030810851603746414, -0.016734668985009193, -0.0026584863662719727, 0.011417698115110397, 0.025493882596492767, 0.03957006335258484, 0.05364625155925751, 0.06772243231534958, 0.08179861307144165, 0.09587480127811432, 0.10995098203420639, 0.12402716279029846, 0.13810335099697113, 0.1521795392036438, 0.16625571250915527, 0.18033190071582794, 0.1944080889225006, 0.20848426222801208, 0.22256045043468475, 0.23663663864135742, 0.2507128119468689, 0.26478898525238037, 0.27886518836021423, 0.2929413616657257, 0.3070175349712372, 0.32109373807907104, 0.3351699113845825, 0.349246084690094, 0.36332228779792786, 0.37739846110343933, 0.3914746642112732, 0.40555083751678467]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 8.0, 8.0, 11.0, 10.0, 17.0, 24.0, 38.0, 60.0, 75.0, 92.0, 168.0, 244.0, 478.0, 764.0, 1572.0, 3903.0, 13174.0, 61282.0, 346520.0, 488182.0, 102553.0, 19566.0, 5417.0, 1992.0, 940.0, 527.0, 357.0, 177.0, 127.0, 89.0, 58.0, 36.0, 25.0, 23.0, 15.0, 9.0, 8.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328369140625, -0.3184623718261719, -0.30855560302734375, -0.2986488342285156, -0.2887420654296875, -0.2788352966308594, -0.26892852783203125, -0.2590217590332031, -0.249114990234375, -0.23920822143554688, -0.22930145263671875, -0.21939468383789062, -0.2094879150390625, -0.19958114624023438, -0.18967437744140625, -0.17976760864257812, -0.16986083984375, -0.15995407104492188, -0.15004730224609375, -0.14014053344726562, -0.1302337646484375, -0.12032699584960938, -0.11042022705078125, -0.10051345825195312, -0.090606689453125, -0.08069992065429688, -0.07079315185546875, -0.060886383056640625, -0.0509796142578125, -0.041072845458984375, -0.03116607666015625, -0.021259307861328125, -0.0113525390625, -0.001445770263671875, 0.00846099853515625, 0.018367767333984375, 0.0282745361328125, 0.038181304931640625, 0.04808807373046875, 0.057994842529296875, 0.067901611328125, 0.07780838012695312, 0.08771514892578125, 0.09762191772460938, 0.1075286865234375, 0.11743545532226562, 0.12734222412109375, 0.13724899291992188, 0.14715576171875, 0.15706253051757812, 0.16696929931640625, 0.17687606811523438, 0.1867828369140625, 0.19668960571289062, 0.20659637451171875, 0.21650314331054688, 0.226409912109375, 0.23631668090820312, 0.24622344970703125, 0.2561302185058594, 0.2660369873046875, 0.2759437561035156, 0.28585052490234375, 0.2957572937011719, 0.3056640625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 15.0, 19.0, 46.0, 60.0, 101.0, 130.0, 142.0, 120.0, 134.0, 79.0, 61.0, 41.0, 26.0, 12.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.185546875, -0.1783905029296875, -0.171234130859375, -0.1640777587890625, -0.15692138671875, -0.1497650146484375, -0.142608642578125, -0.1354522705078125, -0.1282958984375, -0.1211395263671875, -0.113983154296875, -0.1068267822265625, -0.09967041015625, -0.0925140380859375, -0.085357666015625, -0.0782012939453125, -0.071044921875, -0.0638885498046875, -0.056732177734375, -0.0495758056640625, -0.04241943359375, -0.0352630615234375, -0.028106689453125, -0.0209503173828125, -0.0137939453125, -0.0066375732421875, 0.000518798828125, 0.0076751708984375, 0.01483154296875, 0.0219879150390625, 0.029144287109375, 0.0363006591796875, 0.04345703125, 0.0506134033203125, 0.057769775390625, 0.0649261474609375, 0.07208251953125, 0.0792388916015625, 0.086395263671875, 0.0935516357421875, 0.1007080078125, 0.1078643798828125, 0.115020751953125, 0.1221771240234375, 0.12933349609375, 0.1364898681640625, 0.143646240234375, 0.1508026123046875, 0.157958984375, 0.1651153564453125, 0.172271728515625, 0.1794281005859375, 0.18658447265625, 0.1937408447265625, 0.200897216796875, 0.2080535888671875, 0.2152099609375, 0.2223663330078125, 0.229522705078125, 0.2366790771484375, 0.24383544921875, 0.2509918212890625, 0.258148193359375, 0.2653045654296875, 0.2724609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 5.0, 5.0, 6.0, 11.0, 7.0, 8.0, 17.0, 25.0, 34.0, 51.0, 75.0, 174.0, 376.0, 966.0, 2579.0, 8615.0, 33682.0, 164789.0, 519039.0, 249555.0, 50801.0, 11990.0, 3492.0, 1268.0, 465.0, 247.0, 99.0, 50.0, 33.0, 25.0, 15.0, 11.0, 11.0, 6.0, 8.0, 7.0, 2.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2384033203125, -0.22945213317871094, -0.22050094604492188, -0.2115497589111328, -0.20259857177734375, -0.1936473846435547, -0.18469619750976562, -0.17574501037597656, -0.1667938232421875, -0.15784263610839844, -0.14889144897460938, -0.1399402618408203, -0.13098907470703125, -0.12203788757324219, -0.11308670043945312, -0.10413551330566406, -0.095184326171875, -0.08623313903808594, -0.07728195190429688, -0.06833076477050781, -0.05937957763671875, -0.05042839050292969, -0.041477203369140625, -0.03252601623535156, -0.0235748291015625, -0.014623641967773438, -0.005672454833984375, 0.0032787322998046875, 0.01222991943359375, 0.021181106567382812, 0.030132293701171875, 0.03908348083496094, 0.04803466796875, 0.05698585510253906, 0.06593704223632812, 0.07488822937011719, 0.08383941650390625, 0.09279060363769531, 0.10174179077148438, 0.11069297790527344, 0.1196441650390625, 0.12859535217285156, 0.13754653930664062, 0.1464977264404297, 0.15544891357421875, 0.1644001007080078, 0.17335128784179688, 0.18230247497558594, 0.191253662109375, 0.20020484924316406, 0.20915603637695312, 0.2181072235107422, 0.22705841064453125, 0.2360095977783203, 0.24496078491210938, 0.25391197204589844, 0.2628631591796875, 0.27181434631347656, 0.2807655334472656, 0.2897167205810547, 0.29866790771484375, 0.3076190948486328, 0.3165702819824219, 0.32552146911621094, 0.33447265625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 6.0, 4.0, 13.0, 12.0, 6.0, 12.0, 17.0, 22.0, 34.0, 39.0, 35.0, 33.0, 35.0, 32.0, 59.0, 45.0, 54.0, 45.0, 48.0, 37.0, 39.0, 53.0, 47.0, 41.0, 37.0, 24.0, 30.0, 22.0, 26.0, 12.0, 10.0, 15.0, 11.0, 4.0, 2.0, 7.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.288330078125, -0.2805805206298828, -0.2728309631347656, -0.26508140563964844, -0.25733184814453125, -0.24958229064941406, -0.24183273315429688, -0.2340831756591797, -0.2263336181640625, -0.2185840606689453, -0.21083450317382812, -0.20308494567871094, -0.19533538818359375, -0.18758583068847656, -0.17983627319335938, -0.1720867156982422, -0.164337158203125, -0.1565876007080078, -0.14883804321289062, -0.14108848571777344, -0.13333892822265625, -0.12558937072753906, -0.11783981323242188, -0.11009025573730469, -0.1023406982421875, -0.09459114074707031, -0.08684158325195312, -0.07909202575683594, -0.07134246826171875, -0.06359291076660156, -0.055843353271484375, -0.04809379577636719, -0.04034423828125, -0.03259468078613281, -0.024845123291015625, -0.017095565795898438, -0.00934600830078125, -0.0015964508056640625, 0.006153106689453125, 0.013902664184570312, 0.0216522216796875, 0.029401779174804688, 0.037151336669921875, 0.04490089416503906, 0.05265045166015625, 0.06040000915527344, 0.06814956665039062, 0.07589912414550781, 0.083648681640625, 0.09139823913574219, 0.09914779663085938, 0.10689735412597656, 0.11464691162109375, 0.12239646911621094, 0.13014602661132812, 0.1378955841064453, 0.1456451416015625, 0.1533946990966797, 0.16114425659179688, 0.16889381408691406, 0.17664337158203125, 0.18439292907714844, 0.19214248657226562, 0.1998920440673828, 0.2076416015625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 3.0, 9.0, 5.0, 18.0, 27.0, 29.0, 50.0, 78.0, 124.0, 188.0, 275.0, 424.0, 740.0, 1156.0, 1960.0, 3512.0, 6413.0, 12476.0, 26744.0, 59786.0, 139022.0, 267311.0, 271396.0, 141267.0, 60621.0, 26972.0, 12904.0, 6479.0, 3495.0, 1990.0, 1129.0, 697.0, 443.0, 246.0, 177.0, 135.0, 80.0, 70.0, 30.0, 30.0, 16.0, 16.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.047454833984375, -0.045972347259521484, -0.04448986053466797, -0.04300737380981445, -0.04152488708496094, -0.04004240036010742, -0.038559913635253906, -0.03707742691040039, -0.035594940185546875, -0.03411245346069336, -0.032629966735839844, -0.031147480010986328, -0.029664993286132812, -0.028182506561279297, -0.02670001983642578, -0.025217533111572266, -0.02373504638671875, -0.022252559661865234, -0.02077007293701172, -0.019287586212158203, -0.017805099487304688, -0.016322612762451172, -0.014840126037597656, -0.01335763931274414, -0.011875152587890625, -0.01039266586303711, -0.008910179138183594, -0.007427692413330078, -0.0059452056884765625, -0.004462718963623047, -0.0029802322387695312, -0.0014977455139160156, -1.52587890625e-05, 0.0014672279357910156, 0.0029497146606445312, 0.004432201385498047, 0.0059146881103515625, 0.007397174835205078, 0.008879661560058594, 0.01036214828491211, 0.011844635009765625, 0.01332712173461914, 0.014809608459472656, 0.016292095184326172, 0.017774581909179688, 0.019257068634033203, 0.02073955535888672, 0.022222042083740234, 0.02370452880859375, 0.025187015533447266, 0.02666950225830078, 0.028151988983154297, 0.029634475708007812, 0.031116962432861328, 0.032599449157714844, 0.03408193588256836, 0.035564422607421875, 0.03704690933227539, 0.038529396057128906, 0.04001188278198242, 0.04149436950683594, 0.04297685623168945, 0.04445934295654297, 0.045941829681396484, 0.04742431640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 7.0, 2.0, 3.0, 9.0, 8.0, 7.0, 9.0, 13.0, 13.0, 16.0, 22.0, 28.0, 32.0, 34.0, 51.0, 54.0, 56.0, 83.0, 67.0, 63.0, 62.0, 43.0, 45.0, 52.0, 43.0, 30.0, 36.0, 17.0, 18.0, 21.0, 11.0, 15.0, 5.0, 5.0, 9.0, 4.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.043081283569336e-05, -1.0123476386070251e-05, -9.816139936447144e-06, -9.508803486824036e-06, -9.201467037200928e-06, -8.89413058757782e-06, -8.586794137954712e-06, -8.279457688331604e-06, -7.972121238708496e-06, -7.664784789085388e-06, -7.35744833946228e-06, -7.050111889839172e-06, -6.7427754402160645e-06, -6.4354389905929565e-06, -6.128102540969849e-06, -5.820766091346741e-06, -5.513429641723633e-06, -5.206093192100525e-06, -4.898756742477417e-06, -4.591420292854309e-06, -4.284083843231201e-06, -3.976747393608093e-06, -3.6694109439849854e-06, -3.3620744943618774e-06, -3.0547380447387695e-06, -2.7474015951156616e-06, -2.4400651454925537e-06, -2.132728695869446e-06, -1.8253922462463379e-06, -1.51805579662323e-06, -1.210719347000122e-06, -9.033828973770142e-07, -5.960464477539062e-07, -2.8870999813079834e-07, 1.862645149230957e-08, 3.259629011154175e-07, 6.332993507385254e-07, 9.406358003616333e-07, 1.2479722499847412e-06, 1.5553086996078491e-06, 1.862645149230957e-06, 2.169981598854065e-06, 2.477318048477173e-06, 2.7846544981002808e-06, 3.0919909477233887e-06, 3.3993273973464966e-06, 3.7066638469696045e-06, 4.014000296592712e-06, 4.32133674621582e-06, 4.628673195838928e-06, 4.936009645462036e-06, 5.243346095085144e-06, 5.550682544708252e-06, 5.85801899433136e-06, 6.165355443954468e-06, 6.472691893577576e-06, 6.780028343200684e-06, 7.0873647928237915e-06, 7.394701242446899e-06, 7.702037692070007e-06, 8.009374141693115e-06, 8.316710591316223e-06, 8.624047040939331e-06, 8.931383490562439e-06, 9.238719940185547e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 7.0, 16.0, 27.0, 44.0, 53.0, 90.0, 115.0, 192.0, 316.0, 519.0, 950.0, 1668.0, 3278.0, 7230.0, 18289.0, 56901.0, 190999.0, 394226.0, 252486.0, 78978.0, 24408.0, 9103.0, 3928.0, 1999.0, 1110.0, 624.0, 373.0, 213.0, 143.0, 89.0, 53.0, 42.0, 25.0, 19.0, 18.0, 5.0, 7.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0672607421875, -0.0652608871459961, -0.06326103210449219, -0.06126117706298828, -0.059261322021484375, -0.05726146697998047, -0.05526161193847656, -0.053261756896972656, -0.05126190185546875, -0.049262046813964844, -0.04726219177246094, -0.04526233673095703, -0.043262481689453125, -0.04126262664794922, -0.03926277160644531, -0.037262916564941406, -0.0352630615234375, -0.033263206481933594, -0.03126335144042969, -0.02926349639892578, -0.027263641357421875, -0.02526378631591797, -0.023263931274414062, -0.021264076232910156, -0.01926422119140625, -0.017264366149902344, -0.015264511108398438, -0.013264656066894531, -0.011264801025390625, -0.009264945983886719, -0.0072650909423828125, -0.005265235900878906, -0.003265380859375, -0.0012655258178710938, 0.0007343292236328125, 0.0027341842651367188, 0.004734039306640625, 0.006733894348144531, 0.008733749389648438, 0.010733604431152344, 0.01273345947265625, 0.014733314514160156, 0.016733169555664062, 0.01873302459716797, 0.020732879638671875, 0.02273273468017578, 0.024732589721679688, 0.026732444763183594, 0.0287322998046875, 0.030732154846191406, 0.03273200988769531, 0.03473186492919922, 0.036731719970703125, 0.03873157501220703, 0.04073143005371094, 0.042731285095214844, 0.04473114013671875, 0.046730995178222656, 0.04873085021972656, 0.05073070526123047, 0.052730560302734375, 0.05473041534423828, 0.05673027038574219, 0.058730125427246094, 0.06072998046875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 7.0, 6.0, 8.0, 11.0, 10.0, 12.0, 16.0, 29.0, 34.0, 50.0, 67.0, 79.0, 87.0, 71.0, 88.0, 75.0, 86.0, 62.0, 52.0, 45.0, 30.0, 26.0, 13.0, 12.0, 4.0, 3.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07366943359375, -0.07130050659179688, -0.06893157958984375, -0.06656265258789062, -0.0641937255859375, -0.061824798583984375, -0.05945587158203125, -0.057086944580078125, -0.054718017578125, -0.052349090576171875, -0.04998016357421875, -0.047611236572265625, -0.0452423095703125, -0.042873382568359375, -0.04050445556640625, -0.038135528564453125, -0.0357666015625, -0.033397674560546875, -0.03102874755859375, -0.028659820556640625, -0.0262908935546875, -0.023921966552734375, -0.02155303955078125, -0.019184112548828125, -0.016815185546875, -0.014446258544921875, -0.01207733154296875, -0.009708404541015625, -0.0073394775390625, -0.004970550537109375, -0.00260162353515625, -0.000232696533203125, 0.00213623046875, 0.004505157470703125, 0.00687408447265625, 0.009243011474609375, 0.0116119384765625, 0.013980865478515625, 0.01634979248046875, 0.018718719482421875, 0.021087646484375, 0.023456573486328125, 0.02582550048828125, 0.028194427490234375, 0.0305633544921875, 0.032932281494140625, 0.03530120849609375, 0.037670135498046875, 0.0400390625, 0.042407989501953125, 0.04477691650390625, 0.047145843505859375, 0.0495147705078125, 0.051883697509765625, 0.05425262451171875, 0.056621551513671875, 0.058990478515625, 0.061359405517578125, 0.06372833251953125, 0.06609725952148438, 0.0684661865234375, 0.07083511352539062, 0.07320404052734375, 0.07557296752929688, 0.07794189453125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 4.0, 5.0, 12.0, 34.0, 41.0, 54.0, 70.0, 102.0, 130.0, 145.0, 120.0, 81.0, 69.0, 48.0, 32.0, 22.0, 14.0, 4.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26213550567626953, -0.2405075877904892, -0.21887965500354767, -0.19725173711776733, -0.1756238043308258, -0.15399588644504547, -0.13236796855926514, -0.11074003577232361, -0.08911211788654327, -0.06748419255018234, -0.04585627093911171, -0.024228349328041077, -0.0026004239916801453, 0.019027501344680786, 0.04065541923046112, 0.06228335201740265, 0.08391126990318298, 0.10553919523954391, 0.12716712057590485, 0.14879503846168518, 0.1704229712486267, 0.19205088913440704, 0.21367880702018738, 0.2353067398071289, 0.25693464279174805, 0.2785625755786896, 0.3001904785633087, 0.32181841135025024, 0.3434463441371918, 0.3650742769241333, 0.38670217990875244, 0.40833011269569397, 0.4299580454826355, 0.451585978269577, 0.47321388125419617, 0.4948418140411377, 0.5164697170257568, 0.5380976796150208, 0.5597255825996399, 0.5813535451889038, 0.602981448173523, 0.6246093511581421, 0.646237313747406, 0.6678652167320251, 0.6894931197166443, 0.7111210823059082, 0.7327489852905273, 0.7543768882751465, 0.7760047912597656, 0.7976326942443848, 0.8192606568336487, 0.8408885598182678, 0.862516462802887, 0.8841444253921509, 0.90577232837677, 0.9274002313613892, 0.9490281939506531, 0.9706560969352722, 0.9922840595245361, 1.0139119625091553, 1.0355398654937744, 1.0571677684783936, 1.0787956714630127, 1.1004236936569214, 1.1220515966415405]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 7.0, 8.0, 10.0, 13.0, 15.0, 13.0, 18.0, 24.0, 19.0, 27.0, 27.0, 31.0, 29.0, 28.0, 38.0, 25.0, 46.0, 30.0, 48.0, 35.0, 36.0, 51.0, 35.0, 36.0, 43.0, 34.0, 27.0, 35.0, 27.0, 26.0, 27.0, 18.0, 19.0, 22.0, 10.0, 10.0, 10.0, 8.0, 11.0, 7.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5198078155517578, -0.503398060798645, -0.4869883060455322, -0.47057855129241943, -0.45416879653930664, -0.43775904178619385, -0.42134925723075867, -0.4049395024776459, -0.3885297477245331, -0.3721199929714203, -0.3557102382183075, -0.3393004834651947, -0.3228906989097595, -0.30648094415664673, -0.29007118940353394, -0.27366143465042114, -0.25725167989730835, -0.24084192514419556, -0.22443217039108276, -0.20802240073680878, -0.19161264598369598, -0.1752028912305832, -0.1587931215763092, -0.1423833668231964, -0.12597361207008362, -0.10956385731697083, -0.09315409511327744, -0.07674433290958405, -0.06033457815647125, -0.04392482340335846, -0.02751506119966507, -0.01110529899597168, 0.005304455757141113, 0.021714214235544205, 0.038123972713947296, 0.05453373119235039, 0.07094348967075348, 0.08735324442386627, 0.10376300662755966, 0.12017276883125305, 0.13658252358436584, 0.15299227833747864, 0.16940203309059143, 0.18581180274486542, 0.2022215574979782, 0.218631312251091, 0.235041081905365, 0.2514508366584778, 0.2678605914115906, 0.28427034616470337, 0.30068010091781616, 0.31708985567092896, 0.33349961042404175, 0.34990936517715454, 0.3663191497325897, 0.3827289044857025, 0.3991386592388153, 0.4155484139919281, 0.4319581687450409, 0.4483679234981537, 0.46477770805358887, 0.48118746280670166, 0.49759721755981445, 0.5140069723129272, 0.53041672706604]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 5.0, 4.0, 11.0, 8.0, 7.0, 22.0, 27.0, 39.0, 54.0, 82.0, 127.0, 195.0, 318.0, 603.0, 1058.0, 2305.0, 5204.0, 14362.0, 52542.0, 593763.0, 3237529.0, 239003.0, 31776.0, 8555.0, 3051.0, 1427.0, 774.0, 442.0, 308.0, 170.0, 132.0, 85.0, 72.0, 49.0, 35.0, 38.0, 26.0, 18.0, 11.0, 10.0, 6.0, 6.0, 7.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.16357421875, -0.1575946807861328, -0.15161514282226562, -0.14563560485839844, -0.13965606689453125, -0.13367652893066406, -0.12769699096679688, -0.12171745300292969, -0.1157379150390625, -0.10975837707519531, -0.10377883911132812, -0.09779930114746094, -0.09181976318359375, -0.08584022521972656, -0.07986068725585938, -0.07388114929199219, -0.067901611328125, -0.06192207336425781, -0.055942535400390625, -0.04996299743652344, -0.04398345947265625, -0.03800392150878906, -0.032024383544921875, -0.026044845581054688, -0.0200653076171875, -0.014085769653320312, -0.008106231689453125, -0.0021266937255859375, 0.00385284423828125, 0.009832382202148438, 0.015811920166015625, 0.021791458129882812, 0.02777099609375, 0.03375053405761719, 0.039730072021484375, 0.04570960998535156, 0.05168914794921875, 0.05766868591308594, 0.06364822387695312, 0.06962776184082031, 0.0756072998046875, 0.08158683776855469, 0.08756637573242188, 0.09354591369628906, 0.09952545166015625, 0.10550498962402344, 0.11148452758789062, 0.11746406555175781, 0.123443603515625, 0.1294231414794922, 0.13540267944335938, 0.14138221740722656, 0.14736175537109375, 0.15334129333496094, 0.15932083129882812, 0.1653003692626953, 0.1712799072265625, 0.1772594451904297, 0.18323898315429688, 0.18921852111816406, 0.19519805908203125, 0.20117759704589844, 0.20715713500976562, 0.2131366729736328, 0.2191162109375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 13.0, 22.0, 44.0, 74.0, 77.0, 109.0, 129.0, 140.0, 134.0, 92.0, 63.0, 46.0, 30.0, 10.0, 9.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177001953125, -0.16934585571289062, -0.16168975830078125, -0.15403366088867188, -0.1463775634765625, -0.13872146606445312, -0.13106536865234375, -0.12340927124023438, -0.115753173828125, -0.10809707641601562, -0.10044097900390625, -0.09278488159179688, -0.0851287841796875, -0.07747268676757812, -0.06981658935546875, -0.062160491943359375, -0.05450439453125, -0.046848297119140625, -0.03919219970703125, -0.031536102294921875, -0.0238800048828125, -0.016223907470703125, -0.00856781005859375, -0.000911712646484375, 0.006744384765625, 0.014400482177734375, 0.02205657958984375, 0.029712677001953125, 0.0373687744140625, 0.045024871826171875, 0.05268096923828125, 0.060337066650390625, 0.0679931640625, 0.07564926147460938, 0.08330535888671875, 0.09096145629882812, 0.0986175537109375, 0.10627365112304688, 0.11392974853515625, 0.12158584594726562, 0.129241943359375, 0.13689804077148438, 0.14455413818359375, 0.15221023559570312, 0.1598663330078125, 0.16752243041992188, 0.17517852783203125, 0.18283462524414062, 0.19049072265625, 0.19814682006835938, 0.20580291748046875, 0.21345901489257812, 0.2211151123046875, 0.22877120971679688, 0.23642730712890625, 0.24408340454101562, 0.251739501953125, 0.2593955993652344, 0.26705169677734375, 0.2747077941894531, 0.2823638916015625, 0.2900199890136719, 0.29767608642578125, 0.3053321838378906, 0.31298828125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 2.0, 5.0, 8.0, 5.0, 8.0, 14.0, 25.0, 15.0, 27.0, 35.0, 35.0, 72.0, 95.0, 142.0, 324.0, 703.0, 2745.0, 19088.0, 431239.0, 3636442.0, 93188.0, 7471.0, 1470.0, 457.0, 221.0, 118.0, 80.0, 63.0, 39.0, 34.0, 28.0, 18.0, 18.0, 19.0, 10.0, 4.0, 5.0, 5.0, 6.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305419921875, -0.29422760009765625, -0.2830352783203125, -0.27184295654296875, -0.260650634765625, -0.24945831298828125, -0.2382659912109375, -0.22707366943359375, -0.21588134765625, -0.20468902587890625, -0.1934967041015625, -0.18230438232421875, -0.171112060546875, -0.15991973876953125, -0.1487274169921875, -0.13753509521484375, -0.1263427734375, -0.11515045166015625, -0.1039581298828125, -0.09276580810546875, -0.081573486328125, -0.07038116455078125, -0.0591888427734375, -0.04799652099609375, -0.03680419921875, -0.02561187744140625, -0.0144195556640625, -0.00322723388671875, 0.007965087890625, 0.01915740966796875, 0.0303497314453125, 0.04154205322265625, 0.052734375, 0.06392669677734375, 0.0751190185546875, 0.08631134033203125, 0.097503662109375, 0.10869598388671875, 0.1198883056640625, 0.13108062744140625, 0.14227294921875, 0.15346527099609375, 0.1646575927734375, 0.17584991455078125, 0.187042236328125, 0.19823455810546875, 0.2094268798828125, 0.22061920166015625, 0.2318115234375, 0.24300384521484375, 0.2541961669921875, 0.26538848876953125, 0.276580810546875, 0.28777313232421875, 0.2989654541015625, 0.31015777587890625, 0.32135009765625, 0.33254241943359375, 0.3437347412109375, 0.35492706298828125, 0.366119384765625, 0.37731170654296875, 0.3885040283203125, 0.39969635009765625, 0.410888671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 19.0, 32.0, 50.0, 100.0, 192.0, 526.0, 1598.0, 941.0, 291.0, 143.0, 73.0, 45.0, 27.0, 14.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1527099609375, -0.1435680389404297, -0.13442611694335938, -0.12528419494628906, -0.11614227294921875, -0.10700035095214844, -0.09785842895507812, -0.08871650695800781, -0.0795745849609375, -0.07043266296386719, -0.061290740966796875, -0.05214881896972656, -0.04300689697265625, -0.03386497497558594, -0.024723052978515625, -0.015581130981445312, -0.006439208984375, 0.0027027130126953125, 0.011844635009765625, 0.020986557006835938, 0.03012847900390625, 0.03927040100097656, 0.048412322998046875, 0.05755424499511719, 0.0666961669921875, 0.07583808898925781, 0.08498001098632812, 0.09412193298339844, 0.10326385498046875, 0.11240577697753906, 0.12154769897460938, 0.1306896209716797, 0.13983154296875, 0.1489734649658203, 0.15811538696289062, 0.16725730895996094, 0.17639923095703125, 0.18554115295410156, 0.19468307495117188, 0.2038249969482422, 0.2129669189453125, 0.2221088409423828, 0.23125076293945312, 0.24039268493652344, 0.24953460693359375, 0.25867652893066406, 0.2678184509277344, 0.2769603729248047, 0.286102294921875, 0.2952442169189453, 0.3043861389160156, 0.31352806091308594, 0.32266998291015625, 0.33181190490722656, 0.3409538269042969, 0.3500957489013672, 0.3592376708984375, 0.3683795928955078, 0.3775215148925781, 0.38666343688964844, 0.39580535888671875, 0.40494728088378906, 0.4140892028808594, 0.4232311248779297, 0.432373046875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 2.0, 11.0, 15.0, 26.0, 35.0, 54.0, 78.0, 123.0, 134.0, 136.0, 100.0, 91.0, 69.0, 35.0, 30.0, 19.0, 12.0, 11.0, 7.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8046882152557373, -0.7853681445121765, -0.7660480737686157, -0.7467280030250549, -0.7274079322814941, -0.7080878615379333, -0.6887677907943726, -0.669447660446167, -0.650127649307251, -0.6308075785636902, -0.6114875078201294, -0.5921674370765686, -0.5728473663330078, -0.553527295589447, -0.5342072248458862, -0.5148870944976807, -0.4955670237541199, -0.4762469530105591, -0.4569268822669983, -0.4376068115234375, -0.4182867407798767, -0.3989666700363159, -0.37964656949043274, -0.36032649874687195, -0.34100642800331116, -0.32168635725975037, -0.3023662865161896, -0.2830462157726288, -0.2637261152267456, -0.244406059384346, -0.22508597373962402, -0.20576590299606323, -0.18644580245018005, -0.16712573170661926, -0.14780566096305847, -0.1284855753183365, -0.1091655045747757, -0.0898454338312149, -0.07052535563707352, -0.05120527744293213, -0.03188520669937134, -0.012565132230520248, 0.006754942238330841, 0.02607501670718193, 0.04539509117603302, 0.06471516191959381, 0.0840352401137352, 0.10335531830787659, 0.12267538905143738, 0.14199545979499817, 0.16131553053855896, 0.18063561618328094, 0.19995568692684174, 0.21927575767040253, 0.2385958433151245, 0.2579159140586853, 0.2772359848022461, 0.2965560555458069, 0.3158761262893677, 0.33519619703292847, 0.35451626777648926, 0.37383633852005005, 0.3931564390659332, 0.412476509809494, 0.4317965805530548]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 7.0, 2.0, 6.0, 5.0, 5.0, 8.0, 11.0, 15.0, 9.0, 16.0, 25.0, 21.0, 31.0, 39.0, 32.0, 33.0, 25.0, 30.0, 39.0, 37.0, 44.0, 37.0, 48.0, 28.0, 37.0, 29.0, 39.0, 38.0, 45.0, 29.0, 37.0, 30.0, 28.0, 18.0, 27.0, 18.0, 14.0, 13.0, 16.0, 6.0, 8.0, 4.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.3997815251350403, -0.3874533772468567, -0.3751252293586731, -0.3627970814704895, -0.3504689037799835, -0.3381407558917999, -0.32581260800361633, -0.31348446011543274, -0.30115631222724915, -0.28882816433906555, -0.27650001645088196, -0.264171838760376, -0.2518436908721924, -0.2395155429840088, -0.2271873950958252, -0.2148592472076416, -0.20253108441829681, -0.19020293653011322, -0.17787477374076843, -0.16554662585258484, -0.15321847796440125, -0.14089033007621765, -0.12856216728687286, -0.11623401939868927, -0.10390586405992508, -0.09157770872116089, -0.0792495608329773, -0.0669214054942131, -0.05459325388073921, -0.04226510226726532, -0.02993694692850113, -0.017608799040317535, -0.005280643701553345, 0.007047508843243122, 0.01937566138803959, 0.03170381486415863, 0.04403196647763252, 0.056360118091106415, 0.0686882734298706, 0.0810164213180542, 0.09334457665681839, 0.10567273199558258, 0.11800087988376617, 0.13032904267311096, 0.14265719056129456, 0.15498533844947815, 0.16731348633766174, 0.17964163422584534, 0.19196979701519012, 0.20429794490337372, 0.2166261076927185, 0.2289542555809021, 0.2412824034690857, 0.2536105513572693, 0.2659386992454529, 0.2782668471336365, 0.29059502482414246, 0.30292317271232605, 0.31525132060050964, 0.3275794982910156, 0.3399076461791992, 0.3522357940673828, 0.3645639419555664, 0.37689208984375, 0.3892202377319336]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 10.0, 13.0, 28.0, 33.0, 43.0, 67.0, 130.0, 196.0, 309.0, 529.0, 1037.0, 2252.0, 6017.0, 22142.0, 117723.0, 580458.0, 259483.0, 41815.0, 9934.0, 3240.0, 1448.0, 666.0, 342.0, 222.0, 138.0, 90.0, 48.0, 35.0, 23.0, 13.0, 15.0, 9.0, 12.0, 7.0, 2.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.322998046875, -0.31134033203125, -0.2996826171875, -0.28802490234375, -0.2763671875, -0.26470947265625, -0.2530517578125, -0.24139404296875, -0.229736328125, -0.21807861328125, -0.2064208984375, -0.19476318359375, -0.18310546875, -0.17144775390625, -0.1597900390625, -0.14813232421875, -0.136474609375, -0.12481689453125, -0.1131591796875, -0.10150146484375, -0.08984375, -0.07818603515625, -0.0665283203125, -0.05487060546875, -0.043212890625, -0.03155517578125, -0.0198974609375, -0.00823974609375, 0.00341796875, 0.01507568359375, 0.0267333984375, 0.03839111328125, 0.050048828125, 0.06170654296875, 0.0733642578125, 0.08502197265625, 0.0966796875, 0.10833740234375, 0.1199951171875, 0.13165283203125, 0.143310546875, 0.15496826171875, 0.1666259765625, 0.17828369140625, 0.18994140625, 0.20159912109375, 0.2132568359375, 0.22491455078125, 0.236572265625, 0.24822998046875, 0.2598876953125, 0.27154541015625, 0.283203125, 0.29486083984375, 0.3065185546875, 0.31817626953125, 0.329833984375, 0.34149169921875, 0.3531494140625, 0.36480712890625, 0.37646484375, 0.38812255859375, 0.3997802734375, 0.41143798828125, 0.423095703125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 11.0, 23.0, 36.0, 49.0, 80.0, 99.0, 143.0, 131.0, 118.0, 97.0, 77.0, 65.0, 34.0, 20.0, 9.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1907958984375, -0.1833057403564453, -0.17581558227539062, -0.16832542419433594, -0.16083526611328125, -0.15334510803222656, -0.14585494995117188, -0.1383647918701172, -0.1308746337890625, -0.12338447570800781, -0.11589431762695312, -0.10840415954589844, -0.10091400146484375, -0.09342384338378906, -0.08593368530273438, -0.07844352722167969, -0.070953369140625, -0.06346321105957031, -0.055973052978515625, -0.04848289489746094, -0.04099273681640625, -0.03350257873535156, -0.026012420654296875, -0.018522262573242188, -0.0110321044921875, -0.0035419464111328125, 0.003948211669921875, 0.011438369750976562, 0.01892852783203125, 0.026418685913085938, 0.033908843994140625, 0.04139900207519531, 0.04888916015625, 0.05637931823730469, 0.06386947631835938, 0.07135963439941406, 0.07884979248046875, 0.08633995056152344, 0.09383010864257812, 0.10132026672363281, 0.1088104248046875, 0.11630058288574219, 0.12379074096679688, 0.13128089904785156, 0.13877105712890625, 0.14626121520996094, 0.15375137329101562, 0.1612415313720703, 0.168731689453125, 0.1762218475341797, 0.18371200561523438, 0.19120216369628906, 0.19869232177734375, 0.20618247985839844, 0.21367263793945312, 0.2211627960205078, 0.2286529541015625, 0.2361431121826172, 0.24363327026367188, 0.25112342834472656, 0.25861358642578125, 0.26610374450683594, 0.2735939025878906, 0.2810840606689453, 0.28857421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 11.0, 8.0, 13.0, 12.0, 27.0, 50.0, 65.0, 126.0, 192.0, 365.0, 693.0, 1463.0, 3352.0, 8924.0, 27394.0, 101259.0, 381727.0, 379736.0, 100832.0, 27244.0, 8793.0, 3386.0, 1367.0, 649.0, 347.0, 184.0, 110.0, 60.0, 44.0, 28.0, 18.0, 22.0, 11.0, 5.0, 9.0, 10.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.25048828125, -0.24289703369140625, -0.2353057861328125, -0.22771453857421875, -0.220123291015625, -0.21253204345703125, -0.2049407958984375, -0.19734954833984375, -0.18975830078125, -0.18216705322265625, -0.1745758056640625, -0.16698455810546875, -0.159393310546875, -0.15180206298828125, -0.1442108154296875, -0.13661956787109375, -0.1290283203125, -0.12143707275390625, -0.1138458251953125, -0.10625457763671875, -0.098663330078125, -0.09107208251953125, -0.0834808349609375, -0.07588958740234375, -0.06829833984375, -0.06070709228515625, -0.0531158447265625, -0.04552459716796875, -0.037933349609375, -0.03034210205078125, -0.0227508544921875, -0.01515960693359375, -0.007568359375, 2.288818359375e-05, 0.0076141357421875, 0.01520538330078125, 0.022796630859375, 0.03038787841796875, 0.0379791259765625, 0.04557037353515625, 0.05316162109375, 0.06075286865234375, 0.0683441162109375, 0.07593536376953125, 0.083526611328125, 0.09111785888671875, 0.0987091064453125, 0.10630035400390625, 0.1138916015625, 0.12148284912109375, 0.1290740966796875, 0.13666534423828125, 0.144256591796875, 0.15184783935546875, 0.1594390869140625, 0.16703033447265625, 0.17462158203125, 0.18221282958984375, 0.1898040771484375, 0.19739532470703125, 0.204986572265625, 0.21257781982421875, 0.2201690673828125, 0.22776031494140625, 0.2353515625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 6.0, 6.0, 6.0, 8.0, 11.0, 15.0, 12.0, 15.0, 29.0, 27.0, 32.0, 27.0, 39.0, 36.0, 43.0, 50.0, 52.0, 56.0, 52.0, 69.0, 53.0, 41.0, 43.0, 36.0, 50.0, 39.0, 37.0, 24.0, 22.0, 11.0, 15.0, 8.0, 12.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.279541015625, -0.2709236145019531, -0.26230621337890625, -0.2536888122558594, -0.2450714111328125, -0.23645401000976562, -0.22783660888671875, -0.21921920776367188, -0.210601806640625, -0.20198440551757812, -0.19336700439453125, -0.18474960327148438, -0.1761322021484375, -0.16751480102539062, -0.15889739990234375, -0.15027999877929688, -0.14166259765625, -0.13304519653320312, -0.12442779541015625, -0.11581039428710938, -0.1071929931640625, -0.09857559204101562, -0.08995819091796875, -0.08134078979492188, -0.072723388671875, -0.06410598754882812, -0.05548858642578125, -0.046871185302734375, -0.0382537841796875, -0.029636383056640625, -0.02101898193359375, -0.012401580810546875, -0.0037841796875, 0.004833221435546875, 0.01345062255859375, 0.022068023681640625, 0.0306854248046875, 0.039302825927734375, 0.04792022705078125, 0.056537628173828125, 0.065155029296875, 0.07377243041992188, 0.08238983154296875, 0.09100723266601562, 0.0996246337890625, 0.10824203491210938, 0.11685943603515625, 0.12547683715820312, 0.13409423828125, 0.14271163940429688, 0.15132904052734375, 0.15994644165039062, 0.1685638427734375, 0.17718124389648438, 0.18579864501953125, 0.19441604614257812, 0.203033447265625, 0.21165084838867188, 0.22026824951171875, 0.22888565063476562, 0.2375030517578125, 0.24612045288085938, 0.25473785400390625, 0.2633552551269531, 0.27197265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 9.0, 8.0, 10.0, 21.0, 35.0, 28.0, 34.0, 53.0, 62.0, 83.0, 142.0, 201.0, 257.0, 380.0, 498.0, 728.0, 1090.0, 1658.0, 2507.0, 3936.0, 6216.0, 10647.0, 19297.0, 36927.0, 75968.0, 159136.0, 265344.0, 226343.0, 115516.0, 55264.0, 28056.0, 14778.0, 8556.0, 4979.0, 3194.0, 2094.0, 1407.0, 902.0, 620.0, 446.0, 312.0, 226.0, 157.0, 127.0, 80.0, 63.0, 54.0, 37.0, 24.0, 15.0, 10.0, 8.0, 11.0, 5.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.05047607421875, -0.04893636703491211, -0.04739665985107422, -0.04585695266723633, -0.04431724548339844, -0.04277753829956055, -0.041237831115722656, -0.039698123931884766, -0.038158416748046875, -0.036618709564208984, -0.035079002380371094, -0.0335392951965332, -0.03199958801269531, -0.030459880828857422, -0.02892017364501953, -0.02738046646118164, -0.02584075927734375, -0.02430105209350586, -0.02276134490966797, -0.021221637725830078, -0.019681930541992188, -0.018142223358154297, -0.016602516174316406, -0.015062808990478516, -0.013523101806640625, -0.011983394622802734, -0.010443687438964844, -0.008903980255126953, -0.0073642730712890625, -0.005824565887451172, -0.004284858703613281, -0.0027451515197753906, -0.0012054443359375, 0.0003342628479003906, 0.0018739700317382812, 0.003413677215576172, 0.0049533843994140625, 0.006493091583251953, 0.008032798767089844, 0.009572505950927734, 0.011112213134765625, 0.012651920318603516, 0.014191627502441406, 0.015731334686279297, 0.017271041870117188, 0.018810749053955078, 0.02035045623779297, 0.02189016342163086, 0.02342987060546875, 0.02496957778930664, 0.02650928497314453, 0.028048992156982422, 0.029588699340820312, 0.031128406524658203, 0.032668113708496094, 0.034207820892333984, 0.035747528076171875, 0.037287235260009766, 0.038826942443847656, 0.04036664962768555, 0.04190635681152344, 0.04344606399536133, 0.04498577117919922, 0.04652547836303711, 0.048065185546875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 8.0, 9.0, 10.0, 15.0, 20.0, 20.0, 19.0, 38.0, 51.0, 52.0, 83.0, 103.0, 80.0, 115.0, 95.0, 82.0, 36.0, 34.0, 22.0, 19.0, 23.0, 16.0, 10.0, 4.0, 9.0, 12.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3768672943115234e-05, -1.3249926269054413e-05, -1.2731179594993591e-05, -1.221243292093277e-05, -1.1693686246871948e-05, -1.1174939572811127e-05, -1.0656192898750305e-05, -1.0137446224689484e-05, -9.618699550628662e-06, -9.09995287656784e-06, -8.581206202507019e-06, -8.062459528446198e-06, -7.543712854385376e-06, -7.0249661803245544e-06, -6.506219506263733e-06, -5.987472832202911e-06, -5.46872615814209e-06, -4.949979484081268e-06, -4.431232810020447e-06, -3.912486135959625e-06, -3.3937394618988037e-06, -2.874992787837982e-06, -2.3562461137771606e-06, -1.8374994397163391e-06, -1.3187527656555176e-06, -8.00006091594696e-07, -2.812594175338745e-07, 2.3748725652694702e-07, 7.562339305877686e-07, 1.27498060464859e-06, 1.7937272787094116e-06, 2.312473952770233e-06, 2.8312206268310547e-06, 3.3499673008918762e-06, 3.868713974952698e-06, 4.387460649013519e-06, 4.906207323074341e-06, 5.424953997135162e-06, 5.943700671195984e-06, 6.462447345256805e-06, 6.981194019317627e-06, 7.4999406933784485e-06, 8.01868736743927e-06, 8.537434041500092e-06, 9.056180715560913e-06, 9.574927389621735e-06, 1.0093674063682556e-05, 1.0612420737743378e-05, 1.11311674118042e-05, 1.164991408586502e-05, 1.2168660759925842e-05, 1.2687407433986664e-05, 1.3206154108047485e-05, 1.3724900782108307e-05, 1.4243647456169128e-05, 1.476239413022995e-05, 1.528114080429077e-05, 1.5799887478351593e-05, 1.6318634152412415e-05, 1.6837380826473236e-05, 1.7356127500534058e-05, 1.787487417459488e-05, 1.83936208486557e-05, 1.8912367522716522e-05, 1.9431114196777344e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 9.0, 13.0, 29.0, 56.0, 96.0, 208.0, 472.0, 1009.0, 2066.0, 5098.0, 15586.0, 80120.0, 514266.0, 360063.0, 50188.0, 11855.0, 4108.0, 1722.0, 817.0, 368.0, 174.0, 107.0, 49.0, 23.0, 17.0, 10.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0948486328125, -0.09103584289550781, -0.08722305297851562, -0.08341026306152344, -0.07959747314453125, -0.07578468322753906, -0.07197189331054688, -0.06815910339355469, -0.0643463134765625, -0.06053352355957031, -0.056720733642578125, -0.05290794372558594, -0.04909515380859375, -0.04528236389160156, -0.041469573974609375, -0.03765678405761719, -0.033843994140625, -0.030031204223632812, -0.026218414306640625, -0.022405624389648438, -0.01859283447265625, -0.014780044555664062, -0.010967254638671875, -0.0071544647216796875, -0.0033416748046875, 0.0004711151123046875, 0.004283905029296875, 0.008096694946289062, 0.01190948486328125, 0.015722274780273438, 0.019535064697265625, 0.023347854614257812, 0.02716064453125, 0.030973434448242188, 0.034786224365234375, 0.03859901428222656, 0.04241180419921875, 0.04622459411621094, 0.050037384033203125, 0.05385017395019531, 0.0576629638671875, 0.06147575378417969, 0.06528854370117188, 0.06910133361816406, 0.07291412353515625, 0.07672691345214844, 0.08053970336914062, 0.08435249328613281, 0.088165283203125, 0.09197807312011719, 0.09579086303710938, 0.09960365295410156, 0.10341644287109375, 0.10722923278808594, 0.11104202270507812, 0.11485481262207031, 0.1186676025390625, 0.12248039245605469, 0.12629318237304688, 0.13010597229003906, 0.13391876220703125, 0.13773155212402344, 0.14154434204101562, 0.1453571319580078, 0.149169921875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 4.0, 11.0, 9.0, 15.0, 19.0, 22.0, 49.0, 58.0, 80.0, 134.0, 131.0, 112.0, 102.0, 84.0, 55.0, 32.0, 25.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1614990234375, -0.1573324203491211, -0.1531658172607422, -0.14899921417236328, -0.14483261108398438, -0.14066600799560547, -0.13649940490722656, -0.13233280181884766, -0.12816619873046875, -0.12399959564208984, -0.11983299255371094, -0.11566638946533203, -0.11149978637695312, -0.10733318328857422, -0.10316658020019531, -0.0989999771118164, -0.0948333740234375, -0.0906667709350586, -0.08650016784667969, -0.08233356475830078, -0.07816696166992188, -0.07400035858154297, -0.06983375549316406, -0.06566715240478516, -0.06150054931640625, -0.057333946228027344, -0.05316734313964844, -0.04900074005126953, -0.044834136962890625, -0.04066753387451172, -0.03650093078613281, -0.032334327697753906, -0.028167724609375, -0.024001121520996094, -0.019834518432617188, -0.01566791534423828, -0.011501312255859375, -0.007334709167480469, -0.0031681060791015625, 0.0009984970092773438, 0.00516510009765625, 0.009331703186035156, 0.013498306274414062, 0.01766490936279297, 0.021831512451171875, 0.02599811553955078, 0.030164718627929688, 0.034331321716308594, 0.0384979248046875, 0.042664527893066406, 0.04683113098144531, 0.05099773406982422, 0.055164337158203125, 0.05933094024658203, 0.06349754333496094, 0.06766414642333984, 0.07183074951171875, 0.07599735260009766, 0.08016395568847656, 0.08433055877685547, 0.08849716186523438, 0.09266376495361328, 0.09683036804199219, 0.1009969711303711, 0.10516357421875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 20.0, 48.0, 89.0, 185.0, 226.0, 177.0, 119.0, 75.0, 35.0, 17.0, 11.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7604790925979614, -0.7139937877655029, -0.6675085425376892, -0.6210232377052307, -0.574537992477417, -0.5280526876449585, -0.4815673828125, -0.4350821077823639, -0.3885968327522278, -0.3421115577220917, -0.29562628269195557, -0.24914097785949707, -0.20265570282936096, -0.15617042779922485, -0.10968512296676636, -0.06319984793663025, -0.01671457290649414, 0.029770709574222565, 0.07625599205493927, 0.12274128198623657, 0.16922655701637268, 0.2157118320465088, 0.2621971368789673, 0.3086824119091034, 0.3551676869392395, 0.4016529619693756, 0.4481382369995117, 0.4946235418319702, 0.5411088466644287, 0.5875940918922424, 0.6340793967247009, 0.6805646419525146, 0.7270500659942627, 0.7735353708267212, 0.8200206160545349, 0.8665059208869934, 0.9129911661148071, 0.9594764709472656, 1.0059617757797241, 1.0524470806121826, 1.0989322662353516, 1.14541757106781, 1.1919028759002686, 1.2383880615234375, 1.284873366355896, 1.3313586711883545, 1.377843976020813, 1.4243292808532715, 1.47081458568573, 1.5172998905181885, 1.563785195350647, 1.6102705001831055, 1.6567556858062744, 1.703240990638733, 1.7497262954711914, 1.79621160030365, 1.8426969051361084, 1.889182209968567, 1.9356675148010254, 1.9821527004241943, 2.0286381244659424, 2.0751233100891113, 2.1216087341308594, 2.1680939197540283, 2.2145791053771973]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 6.0, 13.0, 11.0, 10.0, 17.0, 10.0, 16.0, 32.0, 20.0, 32.0, 32.0, 26.0, 24.0, 42.0, 50.0, 35.0, 56.0, 54.0, 57.0, 42.0, 56.0, 38.0, 38.0, 42.0, 41.0, 32.0, 25.0, 29.0, 24.0, 20.0, 14.0, 12.0, 9.0, 6.0, 5.0, 8.0, 4.0, 1.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7170342206954956, -0.6932783126831055, -0.6695224642753601, -0.64576655626297, -0.6220106482505798, -0.5982547998428345, -0.5744988918304443, -0.5507429838180542, -0.5269870758056641, -0.5032311677932739, -0.4794752895832062, -0.4557194113731384, -0.4319635033607483, -0.40820762515068054, -0.3844517469406128, -0.36069583892822266, -0.3369399905204773, -0.31318411231040955, -0.2894282042980194, -0.26567232608795166, -0.24191643297672272, -0.21816053986549377, -0.19440466165542603, -0.17064876854419708, -0.14689287543296814, -0.1231369823217392, -0.09938109666109085, -0.0756252110004425, -0.05186931788921356, -0.02811342477798462, -0.00435754656791687, 0.019398346543312073, 0.04315429925918579, 0.06691019237041473, 0.09066607803106308, 0.11442196369171143, 0.13817785680294037, 0.1619337499141693, 0.18568962812423706, 0.209445521235466, 0.23320141434669495, 0.2569572925567627, 0.28071320056915283, 0.3044690787792206, 0.32822495698928833, 0.35198086500167847, 0.3757367432117462, 0.39949262142181396, 0.4232485294342041, 0.44700440764427185, 0.470760315656662, 0.49451619386672974, 0.5182721018791199, 0.5420279502868652, 0.5657838582992554, 0.5895397663116455, 0.6132956743240356, 0.6370515823364258, 0.6608074307441711, 0.6845633387565613, 0.7083192467689514, 0.7320750951766968, 0.7558310031890869, 0.779586911201477, 0.8033427596092224]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 11.0, 6.0, 19.0, 25.0, 39.0, 61.0, 104.0, 167.0, 280.0, 545.0, 973.0, 2150.0, 4979.0, 13027.0, 49360.0, 671793.0, 3249978.0, 162418.0, 24353.0, 7567.0, 3046.0, 1499.0, 781.0, 427.0, 247.0, 135.0, 97.0, 67.0, 47.0, 28.0, 18.0, 8.0, 9.0, 9.0, 4.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1737060546875, -0.1670970916748047, -0.16048812866210938, -0.15387916564941406, -0.14727020263671875, -0.14066123962402344, -0.13405227661132812, -0.1274433135986328, -0.1208343505859375, -0.11422538757324219, -0.10761642456054688, -0.10100746154785156, -0.09439849853515625, -0.08778953552246094, -0.08118057250976562, -0.07457160949707031, -0.067962646484375, -0.06135368347167969, -0.054744720458984375, -0.04813575744628906, -0.04152679443359375, -0.03491783142089844, -0.028308868408203125, -0.021699905395507812, -0.0150909423828125, -0.008481979370117188, -0.001873016357421875, 0.0047359466552734375, 0.01134490966796875, 0.017953872680664062, 0.024562835693359375, 0.031171798706054688, 0.03778076171875, 0.04438972473144531, 0.050998687744140625, 0.05760765075683594, 0.06421661376953125, 0.07082557678222656, 0.07743453979492188, 0.08404350280761719, 0.0906524658203125, 0.09726142883300781, 0.10387039184570312, 0.11047935485839844, 0.11708831787109375, 0.12369728088378906, 0.13030624389648438, 0.1369152069091797, 0.143524169921875, 0.1501331329345703, 0.15674209594726562, 0.16335105895996094, 0.16996002197265625, 0.17656898498535156, 0.18317794799804688, 0.1897869110107422, 0.1963958740234375, 0.2030048370361328, 0.20961380004882812, 0.21622276306152344, 0.22283172607421875, 0.22944068908691406, 0.23604965209960938, 0.2426586151123047, 0.249267578125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 13.0, 24.0, 42.0, 51.0, 65.0, 105.0, 105.0, 125.0, 117.0, 94.0, 84.0, 62.0, 47.0, 24.0, 16.0, 14.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18212890625, -0.17444229125976562, -0.16675567626953125, -0.15906906127929688, -0.1513824462890625, -0.14369583129882812, -0.13600921630859375, -0.12832260131835938, -0.120635986328125, -0.11294937133789062, -0.10526275634765625, -0.09757614135742188, -0.0898895263671875, -0.08220291137695312, -0.07451629638671875, -0.06682968139648438, -0.05914306640625, -0.051456451416015625, -0.04376983642578125, -0.036083221435546875, -0.0283966064453125, -0.020709991455078125, -0.01302337646484375, -0.005336761474609375, 0.002349853515625, 0.010036468505859375, 0.01772308349609375, 0.025409698486328125, 0.0330963134765625, 0.040782928466796875, 0.04846954345703125, 0.056156158447265625, 0.0638427734375, 0.07152938842773438, 0.07921600341796875, 0.08690261840820312, 0.0945892333984375, 0.10227584838867188, 0.10996246337890625, 0.11764907836914062, 0.125335693359375, 0.13302230834960938, 0.14070892333984375, 0.14839553833007812, 0.1560821533203125, 0.16376876831054688, 0.17145538330078125, 0.17914199829101562, 0.18682861328125, 0.19451522827148438, 0.20220184326171875, 0.20988845825195312, 0.2175750732421875, 0.22526168823242188, 0.23294830322265625, 0.24063491821289062, 0.248321533203125, 0.2560081481933594, 0.26369476318359375, 0.2713813781738281, 0.2790679931640625, 0.2867546081542969, 0.29444122314453125, 0.3021278381347656, 0.309814453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 14.0, 11.0, 15.0, 10.0, 18.0, 23.0, 39.0, 47.0, 54.0, 70.0, 136.0, 176.0, 237.0, 356.0, 457.0, 701.0, 1107.0, 1942.0, 3598.0, 7831.0, 20552.0, 71716.0, 444616.0, 3099193.0, 434209.0, 70403.0, 20102.0, 7531.0, 3494.0, 1961.0, 1159.0, 775.0, 519.0, 323.0, 237.0, 167.0, 131.0, 92.0, 67.0, 54.0, 39.0, 27.0, 17.0, 22.0, 16.0, 4.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16162109375, -0.1561412811279297, -0.15066146850585938, -0.14518165588378906, -0.13970184326171875, -0.13422203063964844, -0.12874221801757812, -0.12326240539550781, -0.1177825927734375, -0.11230278015136719, -0.10682296752929688, -0.10134315490722656, -0.09586334228515625, -0.09038352966308594, -0.08490371704101562, -0.07942390441894531, -0.073944091796875, -0.06846427917480469, -0.06298446655273438, -0.05750465393066406, -0.05202484130859375, -0.04654502868652344, -0.041065216064453125, -0.03558540344238281, -0.0301055908203125, -0.024625778198242188, -0.019145965576171875, -0.013666152954101562, -0.00818634033203125, -0.0027065277099609375, 0.002773284912109375, 0.008253097534179688, 0.01373291015625, 0.019212722778320312, 0.024692535400390625, 0.030172348022460938, 0.03565216064453125, 0.04113197326660156, 0.046611785888671875, 0.05209159851074219, 0.0575714111328125, 0.06305122375488281, 0.06853103637695312, 0.07401084899902344, 0.07949066162109375, 0.08497047424316406, 0.09045028686523438, 0.09593009948730469, 0.101409912109375, 0.10688972473144531, 0.11236953735351562, 0.11784934997558594, 0.12332916259765625, 0.12880897521972656, 0.13428878784179688, 0.1397686004638672, 0.1452484130859375, 0.1507282257080078, 0.15620803833007812, 0.16168785095214844, 0.16716766357421875, 0.17264747619628906, 0.17812728881835938, 0.1836071014404297, 0.1890869140625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 13.0, 13.0, 30.0, 55.0, 72.0, 130.0, 290.0, 859.0, 1448.0, 636.0, 218.0, 106.0, 65.0, 38.0, 27.0, 18.0, 11.0, 3.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1884765625, -0.18181610107421875, -0.1751556396484375, -0.16849517822265625, -0.161834716796875, -0.15517425537109375, -0.1485137939453125, -0.14185333251953125, -0.13519287109375, -0.12853240966796875, -0.1218719482421875, -0.11521148681640625, -0.108551025390625, -0.10189056396484375, -0.0952301025390625, -0.08856964111328125, -0.0819091796875, -0.07524871826171875, -0.0685882568359375, -0.06192779541015625, -0.055267333984375, -0.04860687255859375, -0.0419464111328125, -0.03528594970703125, -0.02862548828125, -0.02196502685546875, -0.0153045654296875, -0.00864410400390625, -0.001983642578125, 0.00467681884765625, 0.0113372802734375, 0.01799774169921875, 0.024658203125, 0.03131866455078125, 0.0379791259765625, 0.04463958740234375, 0.051300048828125, 0.05796051025390625, 0.0646209716796875, 0.07128143310546875, 0.07794189453125, 0.08460235595703125, 0.0912628173828125, 0.09792327880859375, 0.104583740234375, 0.11124420166015625, 0.1179046630859375, 0.12456512451171875, 0.1312255859375, 0.13788604736328125, 0.1445465087890625, 0.15120697021484375, 0.157867431640625, 0.16452789306640625, 0.1711883544921875, 0.17784881591796875, 0.18450927734375, 0.19116973876953125, 0.1978302001953125, 0.20449066162109375, 0.211151123046875, 0.21781158447265625, 0.2244720458984375, 0.23113250732421875, 0.23779296875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 9.0, 12.0, 17.0, 26.0, 35.0, 33.0, 50.0, 74.0, 92.0, 99.0, 95.0, 78.0, 85.0, 70.0, 46.0, 38.0, 35.0, 22.0, 17.0, 13.0, 5.0, 6.0, 11.0, 9.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5029130578041077, -0.4884081780910492, -0.4739033281803131, -0.45939844846725464, -0.44489359855651855, -0.4303887188434601, -0.4158838391304016, -0.4013789892196655, -0.38687410950660706, -0.3723692297935486, -0.3578643798828125, -0.34335950016975403, -0.32885465025901794, -0.3143497705459595, -0.2998449206352234, -0.2853400409221649, -0.27083516120910645, -0.256330281496048, -0.2418254315853119, -0.22732055187225342, -0.21281568706035614, -0.19831082224845886, -0.18380595743656158, -0.1693010926246643, -0.15479624271392822, -0.14029137790203094, -0.12578651309013367, -0.11128164082765579, -0.09677676856517792, -0.08227190375328064, -0.06776703894138336, -0.05326216667890549, -0.03875729441642761, -0.024252425879240036, -0.009747559204697609, 0.004757307469844818, 0.019262176007032394, 0.03376704454421997, 0.04827190935611725, 0.06277678161859512, 0.0772816464304924, 0.09178651124238968, 0.10629138350486755, 0.12079624831676483, 0.1353011131286621, 0.14980599284172058, 0.16431084275245667, 0.17881572246551514, 0.19332058727741241, 0.2078254520893097, 0.22233031690120697, 0.23683518171310425, 0.2513400614261627, 0.2658449411392212, 0.2803497910499573, 0.29485467076301575, 0.30935952067375183, 0.3238644003868103, 0.3383692502975464, 0.35287413001060486, 0.36737897992134094, 0.3818838596343994, 0.3963887095451355, 0.41089358925819397, 0.42539846897125244]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 0.0, 4.0, 11.0, 9.0, 10.0, 19.0, 13.0, 13.0, 26.0, 18.0, 32.0, 31.0, 24.0, 33.0, 26.0, 36.0, 34.0, 48.0, 34.0, 41.0, 39.0, 48.0, 36.0, 40.0, 37.0, 30.0, 34.0, 28.0, 27.0, 29.0, 26.0, 29.0, 21.0, 17.0, 16.0, 13.0, 7.0, 11.0, 18.0, 7.0, 6.0, 10.0, 5.0, 3.0, 3.0, 0.0, 3.0], "bins": [-0.47773128747940063, -0.46515607833862305, -0.45258089900016785, -0.44000568985939026, -0.42743051052093506, -0.41485530138015747, -0.4022800922393799, -0.3897049129009247, -0.3771297037601471, -0.3645544946193695, -0.3519793152809143, -0.3394041061401367, -0.3268289268016815, -0.31425371766090393, -0.30167853832244873, -0.28910332918167114, -0.27652812004089355, -0.26395291090011597, -0.25137773156166077, -0.23880252242088318, -0.22622732818126678, -0.2136521339416504, -0.201076939702034, -0.1885017454624176, -0.1759265661239624, -0.163351371884346, -0.15077617764472961, -0.13820096850395203, -0.12562577426433563, -0.11305058002471924, -0.10047538578510284, -0.08790018409490585, -0.07532498240470886, -0.06274978816509247, -0.05017458647489548, -0.03759939223527908, -0.02502419427037239, -0.012448996305465698, 0.0001261979341506958, 0.012701399624347687, 0.02527659386396408, 0.03785179182887077, 0.050426989793777466, 0.06300218403339386, 0.07557737827301025, 0.08815257996320724, 0.10072777420282364, 0.11330297589302063, 0.12587817013263702, 0.13845336437225342, 0.1510285586118698, 0.1636037528514862, 0.1761789619922638, 0.1887541562318802, 0.20132935047149658, 0.21390455961227417, 0.22647973895072937, 0.23905493319034576, 0.25163012742996216, 0.26420533657073975, 0.27678051590919495, 0.28935572504997253, 0.30193090438842773, 0.3145061135292053, 0.3270813226699829]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 13.0, 13.0, 7.0, 20.0, 23.0, 35.0, 52.0, 77.0, 93.0, 164.0, 284.0, 424.0, 709.0, 1227.0, 2312.0, 4420.0, 9035.0, 21618.0, 58770.0, 186624.0, 445698.0, 207794.0, 65170.0, 23682.0, 9939.0, 4718.0, 2378.0, 1313.0, 720.0, 425.0, 270.0, 163.0, 113.0, 68.0, 52.0, 38.0, 20.0, 21.0, 18.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2042236328125, -0.1970691680908203, -0.18991470336914062, -0.18276023864746094, -0.17560577392578125, -0.16845130920410156, -0.16129684448242188, -0.1541423797607422, -0.1469879150390625, -0.1398334503173828, -0.13267898559570312, -0.12552452087402344, -0.11837005615234375, -0.11121559143066406, -0.10406112670898438, -0.09690666198730469, -0.089752197265625, -0.08259773254394531, -0.07544326782226562, -0.06828880310058594, -0.06113433837890625, -0.05397987365722656, -0.046825408935546875, -0.03967094421386719, -0.0325164794921875, -0.025362014770507812, -0.018207550048828125, -0.011053085327148438, -0.00389862060546875, 0.0032558441162109375, 0.010410308837890625, 0.017564773559570312, 0.02471923828125, 0.03187370300292969, 0.039028167724609375, 0.04618263244628906, 0.05333709716796875, 0.06049156188964844, 0.06764602661132812, 0.07480049133300781, 0.0819549560546875, 0.08910942077636719, 0.09626388549804688, 0.10341835021972656, 0.11057281494140625, 0.11772727966308594, 0.12488174438476562, 0.1320362091064453, 0.139190673828125, 0.1463451385498047, 0.15349960327148438, 0.16065406799316406, 0.16780853271484375, 0.17496299743652344, 0.18211746215820312, 0.1892719268798828, 0.1964263916015625, 0.2035808563232422, 0.21073532104492188, 0.21788978576660156, 0.22504425048828125, 0.23219871520996094, 0.23935317993164062, 0.2465076446533203, 0.253662109375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 9.0, 12.0, 25.0, 31.0, 46.0, 63.0, 97.0, 91.0, 105.0, 115.0, 93.0, 97.0, 73.0, 50.0, 43.0, 24.0, 10.0, 12.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.197021484375, -0.1891937255859375, -0.181365966796875, -0.1735382080078125, -0.16571044921875, -0.1578826904296875, -0.150054931640625, -0.1422271728515625, -0.1343994140625, -0.1265716552734375, -0.118743896484375, -0.1109161376953125, -0.10308837890625, -0.0952606201171875, -0.087432861328125, -0.0796051025390625, -0.07177734375, -0.0639495849609375, -0.056121826171875, -0.0482940673828125, -0.04046630859375, -0.0326385498046875, -0.024810791015625, -0.0169830322265625, -0.0091552734375, -0.0013275146484375, 0.006500244140625, 0.0143280029296875, 0.02215576171875, 0.0299835205078125, 0.037811279296875, 0.0456390380859375, 0.053466796875, 0.0612945556640625, 0.069122314453125, 0.0769500732421875, 0.08477783203125, 0.0926055908203125, 0.100433349609375, 0.1082611083984375, 0.1160888671875, 0.1239166259765625, 0.131744384765625, 0.1395721435546875, 0.14739990234375, 0.1552276611328125, 0.163055419921875, 0.1708831787109375, 0.1787109375, 0.1865386962890625, 0.194366455078125, 0.2021942138671875, 0.21002197265625, 0.2178497314453125, 0.225677490234375, 0.2335052490234375, 0.2413330078125, 0.2491607666015625, 0.256988525390625, 0.2648162841796875, 0.27264404296875, 0.2804718017578125, 0.288299560546875, 0.2961273193359375, 0.303955078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 5.0, 4.0, 5.0, 5.0, 15.0, 5.0, 19.0, 21.0, 22.0, 62.0, 74.0, 110.0, 256.0, 542.0, 1290.0, 3337.0, 9543.0, 31986.0, 137305.0, 554207.0, 238117.0, 50003.0, 13940.0, 4579.0, 1690.0, 662.0, 326.0, 163.0, 82.0, 45.0, 42.0, 25.0, 12.0, 16.0, 12.0, 7.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.323486328125, -0.3138771057128906, -0.30426788330078125, -0.2946586608886719, -0.2850494384765625, -0.2754402160644531, -0.26583099365234375, -0.2562217712402344, -0.246612548828125, -0.23700332641601562, -0.22739410400390625, -0.21778488159179688, -0.2081756591796875, -0.19856643676757812, -0.18895721435546875, -0.17934799194335938, -0.16973876953125, -0.16012954711914062, -0.15052032470703125, -0.14091110229492188, -0.1313018798828125, -0.12169265747070312, -0.11208343505859375, -0.10247421264648438, -0.092864990234375, -0.08325576782226562, -0.07364654541015625, -0.06403732299804688, -0.0544281005859375, -0.044818878173828125, -0.03520965576171875, -0.025600433349609375, -0.0159912109375, -0.006381988525390625, 0.00322723388671875, 0.012836456298828125, 0.0224456787109375, 0.032054901123046875, 0.04166412353515625, 0.051273345947265625, 0.060882568359375, 0.07049179077148438, 0.08010101318359375, 0.08971023559570312, 0.0993194580078125, 0.10892868041992188, 0.11853790283203125, 0.12814712524414062, 0.13775634765625, 0.14736557006835938, 0.15697479248046875, 0.16658401489257812, 0.1761932373046875, 0.18580245971679688, 0.19541168212890625, 0.20502090454101562, 0.214630126953125, 0.22423934936523438, 0.23384857177734375, 0.24345779418945312, 0.2530670166015625, 0.2626762390136719, 0.27228546142578125, 0.2818946838378906, 0.29150390625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 6.0, 9.0, 11.0, 14.0, 17.0, 26.0, 16.0, 19.0, 31.0, 41.0, 45.0, 31.0, 41.0, 31.0, 43.0, 37.0, 48.0, 40.0, 42.0, 37.0, 49.0, 50.0, 37.0, 25.0, 28.0, 36.0, 28.0, 30.0, 17.0, 11.0, 23.0, 15.0, 10.0, 11.0, 7.0, 5.0, 2.0, 3.0, 7.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2403564453125, -0.2313060760498047, -0.22225570678710938, -0.21320533752441406, -0.20415496826171875, -0.19510459899902344, -0.18605422973632812, -0.1770038604736328, -0.1679534912109375, -0.1589031219482422, -0.14985275268554688, -0.14080238342285156, -0.13175201416015625, -0.12270164489746094, -0.11365127563476562, -0.10460090637207031, -0.095550537109375, -0.08650016784667969, -0.07744979858398438, -0.06839942932128906, -0.05934906005859375, -0.05029869079589844, -0.041248321533203125, -0.03219795227050781, -0.0231475830078125, -0.014097213745117188, -0.005046844482421875, 0.0040035247802734375, 0.01305389404296875, 0.022104263305664062, 0.031154632568359375, 0.04020500183105469, 0.04925537109375, 0.05830574035644531, 0.06735610961914062, 0.07640647888183594, 0.08545684814453125, 0.09450721740722656, 0.10355758666992188, 0.11260795593261719, 0.1216583251953125, 0.1307086944580078, 0.13975906372070312, 0.14880943298339844, 0.15785980224609375, 0.16691017150878906, 0.17596054077148438, 0.1850109100341797, 0.194061279296875, 0.2031116485595703, 0.21216201782226562, 0.22121238708496094, 0.23026275634765625, 0.23931312561035156, 0.24836349487304688, 0.2574138641357422, 0.2664642333984375, 0.2755146026611328, 0.2845649719238281, 0.29361534118652344, 0.30266571044921875, 0.31171607971191406, 0.3207664489746094, 0.3298168182373047, 0.3388671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 10.0, 8.0, 7.0, 12.0, 27.0, 39.0, 56.0, 62.0, 91.0, 126.0, 227.0, 287.0, 428.0, 677.0, 1051.0, 1683.0, 3067.0, 6007.0, 13202.0, 34023.0, 122133.0, 568015.0, 214714.0, 48174.0, 17501.0, 7689.0, 3706.0, 2048.0, 1229.0, 740.0, 472.0, 317.0, 216.0, 160.0, 99.0, 75.0, 69.0, 27.0, 27.0, 15.0, 14.0, 10.0, 3.0, 3.0, 5.0, 2.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10662841796875, -0.10303306579589844, -0.09943771362304688, -0.09584236145019531, -0.09224700927734375, -0.08865165710449219, -0.08505630493164062, -0.08146095275878906, -0.0778656005859375, -0.07427024841308594, -0.07067489624023438, -0.06707954406738281, -0.06348419189453125, -0.05988883972167969, -0.056293487548828125, -0.05269813537597656, -0.049102783203125, -0.04550743103027344, -0.041912078857421875, -0.03831672668457031, -0.03472137451171875, -0.031126022338867188, -0.027530670166015625, -0.023935317993164062, -0.0203399658203125, -0.016744613647460938, -0.013149261474609375, -0.009553909301757812, -0.00595855712890625, -0.0023632049560546875, 0.001232147216796875, 0.0048274993896484375, 0.0084228515625, 0.012018203735351562, 0.015613555908203125, 0.019208908081054688, 0.02280426025390625, 0.026399612426757812, 0.029994964599609375, 0.03359031677246094, 0.0371856689453125, 0.04078102111816406, 0.044376373291015625, 0.04797172546386719, 0.05156707763671875, 0.05516242980957031, 0.058757781982421875, 0.06235313415527344, 0.065948486328125, 0.06954383850097656, 0.07313919067382812, 0.07673454284667969, 0.08032989501953125, 0.08392524719238281, 0.08752059936523438, 0.09111595153808594, 0.0947113037109375, 0.09830665588378906, 0.10190200805664062, 0.10549736022949219, 0.10909271240234375, 0.11268806457519531, 0.11628341674804688, 0.11987876892089844, 0.12347412109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 11.0, 4.0, 7.0, 11.0, 17.0, 7.0, 19.0, 21.0, 41.0, 34.0, 63.0, 75.0, 115.0, 120.0, 127.0, 92.0, 58.0, 34.0, 18.0, 23.0, 13.0, 13.0, 16.0, 6.0, 7.0, 5.0, 7.0, 4.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.627206802368164e-05, -1.569930464029312e-05, -1.5126541256904602e-05, -1.4553777873516083e-05, -1.3981014490127563e-05, -1.3408251106739044e-05, -1.2835487723350525e-05, -1.2262724339962006e-05, -1.1689960956573486e-05, -1.1117197573184967e-05, -1.0544434189796448e-05, -9.971670806407928e-06, -9.39890742301941e-06, -8.82614403963089e-06, -8.25338065624237e-06, -7.680617272853851e-06, -7.107853889465332e-06, -6.535090506076813e-06, -5.9623271226882935e-06, -5.389563739299774e-06, -4.816800355911255e-06, -4.244036972522736e-06, -3.6712735891342163e-06, -3.098510205745697e-06, -2.5257468223571777e-06, -1.9529834389686584e-06, -1.3802200555801392e-06, -8.074566721916199e-07, -2.3469328880310059e-07, 3.380700945854187e-07, 9.10833477973938e-07, 1.4835968613624573e-06, 2.0563602447509766e-06, 2.629123628139496e-06, 3.201887011528015e-06, 3.7746503949165344e-06, 4.347413778305054e-06, 4.920177161693573e-06, 5.492940545082092e-06, 6.0657039284706116e-06, 6.638467311859131e-06, 7.21123069524765e-06, 7.78399407863617e-06, 8.356757462024689e-06, 8.929520845413208e-06, 9.502284228801727e-06, 1.0075047612190247e-05, 1.0647810995578766e-05, 1.1220574378967285e-05, 1.1793337762355804e-05, 1.2366101145744324e-05, 1.2938864529132843e-05, 1.3511627912521362e-05, 1.4084391295909882e-05, 1.4657154679298401e-05, 1.522991806268692e-05, 1.580268144607544e-05, 1.637544482946396e-05, 1.6948208212852478e-05, 1.7520971596240997e-05, 1.8093734979629517e-05, 1.8666498363018036e-05, 1.9239261746406555e-05, 1.9812025129795074e-05, 2.0384788513183594e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 10.0, 8.0, 15.0, 22.0, 30.0, 55.0, 59.0, 118.0, 196.0, 299.0, 563.0, 1006.0, 2000.0, 4088.0, 10019.0, 30853.0, 140844.0, 659092.0, 148305.0, 31932.0, 10273.0, 4303.0, 2033.0, 1049.0, 578.0, 317.0, 185.0, 132.0, 57.0, 41.0, 20.0, 18.0, 14.0, 7.0, 7.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1297607421875, -0.12588882446289062, -0.12201690673828125, -0.11814498901367188, -0.1142730712890625, -0.11040115356445312, -0.10652923583984375, -0.10265731811523438, -0.098785400390625, -0.09491348266601562, -0.09104156494140625, -0.08716964721679688, -0.0832977294921875, -0.07942581176757812, -0.07555389404296875, -0.07168197631835938, -0.06781005859375, -0.06393814086914062, -0.06006622314453125, -0.056194305419921875, -0.0523223876953125, -0.048450469970703125, -0.04457855224609375, -0.040706634521484375, -0.036834716796875, -0.032962799072265625, -0.02909088134765625, -0.025218963623046875, -0.0213470458984375, -0.017475128173828125, -0.01360321044921875, -0.009731292724609375, -0.005859375, -0.001987457275390625, 0.00188446044921875, 0.005756378173828125, 0.0096282958984375, 0.013500213623046875, 0.01737213134765625, 0.021244049072265625, 0.025115966796875, 0.028987884521484375, 0.03285980224609375, 0.036731719970703125, 0.0406036376953125, 0.044475555419921875, 0.04834747314453125, 0.052219390869140625, 0.05609130859375, 0.059963226318359375, 0.06383514404296875, 0.06770706176757812, 0.0715789794921875, 0.07545089721679688, 0.07932281494140625, 0.08319473266601562, 0.087066650390625, 0.09093856811523438, 0.09481048583984375, 0.09868240356445312, 0.1025543212890625, 0.10642623901367188, 0.11029815673828125, 0.11417007446289062, 0.1180419921875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 7.0, 14.0, 12.0, 19.0, 29.0, 25.0, 52.0, 80.0, 158.0, 181.0, 130.0, 81.0, 54.0, 42.0, 20.0, 19.0, 12.0, 10.0, 6.0, 11.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.140625, -0.13629150390625, -0.1319580078125, -0.12762451171875, -0.123291015625, -0.11895751953125, -0.1146240234375, -0.11029052734375, -0.10595703125, -0.10162353515625, -0.0972900390625, -0.09295654296875, -0.088623046875, -0.08428955078125, -0.0799560546875, -0.07562255859375, -0.0712890625, -0.06695556640625, -0.0626220703125, -0.05828857421875, -0.053955078125, -0.04962158203125, -0.0452880859375, -0.04095458984375, -0.03662109375, -0.03228759765625, -0.0279541015625, -0.02362060546875, -0.019287109375, -0.01495361328125, -0.0106201171875, -0.00628662109375, -0.001953125, 0.00238037109375, 0.0067138671875, 0.01104736328125, 0.015380859375, 0.01971435546875, 0.0240478515625, 0.02838134765625, 0.03271484375, 0.03704833984375, 0.0413818359375, 0.04571533203125, 0.050048828125, 0.05438232421875, 0.0587158203125, 0.06304931640625, 0.0673828125, 0.07171630859375, 0.0760498046875, 0.08038330078125, 0.084716796875, 0.08905029296875, 0.0933837890625, 0.09771728515625, 0.10205078125, 0.10638427734375, 0.1107177734375, 0.11505126953125, 0.119384765625, 0.12371826171875, 0.1280517578125, 0.13238525390625, 0.13671875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [22.0, 114.0, 400.0, 377.0, 87.0, 20.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3815043866634369, -0.2477998286485672, -0.11409527063369751, 0.019609302282333374, 0.15331384539604187, 0.28701838850975037, 0.42072299122810364, 0.5544275045394897, 0.6881320476531982, 0.8218365907669067, 0.9555411338806152, 1.0892457962036133, 1.2229502201080322, 1.3566548824310303, 1.4903594255447388, 1.6240639686584473, 1.7577685117721558, 1.8914730548858643, 2.0251777172088623, 2.1588821411132812, 2.2925868034362793, 2.4262912273406982, 2.5599958896636963, 2.6937003135681152, 2.8274049758911133, 2.9611096382141113, 3.0948140621185303, 3.2285187244415283, 3.3622231483459473, 3.4959278106689453, 3.6296324729919434, 3.7633368968963623, 3.8970417976379395, 4.0307464599609375, 4.1644511222839355, 4.298155307769775, 4.431859970092773, 4.5655646324157715, 4.6992692947387695, 4.832973480224609, 4.966678142547607, 5.1003828048706055, 5.2340874671936035, 5.367791652679443, 5.501496315002441, 5.6352009773254395, 5.7689056396484375, 5.902609825134277, 6.036314964294434, 6.170019626617432, 6.30372428894043, 6.4374284744262695, 6.571133136749268, 6.704837799072266, 6.838542461395264, 6.972247123718262, 7.105951309204102, 7.2396559715271, 7.373360633850098, 7.5070648193359375, 7.6407694816589355, 7.774474143981934, 7.908178806304932, 8.04188346862793, 8.17558765411377]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 7.0, 8.0, 13.0, 6.0, 22.0, 17.0, 7.0, 16.0, 19.0, 25.0, 23.0, 28.0, 38.0, 26.0, 38.0, 39.0, 41.0, 31.0, 31.0, 44.0, 43.0, 44.0, 35.0, 34.0, 31.0, 31.0, 29.0, 44.0, 33.0, 24.0, 23.0, 22.0, 24.0, 20.0, 17.0, 12.0, 7.0, 14.0, 6.0, 3.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7734782695770264, -0.7494469881057739, -0.7254157066345215, -0.701384425163269, -0.6773531436920166, -0.6533218622207642, -0.6292905807495117, -0.6052592992782593, -0.5812280178070068, -0.5571967363357544, -0.533165454864502, -0.5091341733932495, -0.48510289192199707, -0.46107161045074463, -0.4370402991771698, -0.41300901770591736, -0.38897770643234253, -0.3649464249610901, -0.34091514348983765, -0.3168838620185852, -0.29285258054733276, -0.2688212990760803, -0.2447899878025055, -0.22075870633125305, -0.1967274248600006, -0.17269614338874817, -0.14866486191749573, -0.12463356554508209, -0.10060228407382965, -0.07657100260257721, -0.052539706230163574, -0.028508424758911133, -0.004477083683013916, 0.019554201513528824, 0.043585486710071564, 0.0676167756319046, 0.09164805710315704, 0.11567933857440948, 0.13971063494682312, 0.16374191641807556, 0.187773197889328, 0.21180447936058044, 0.23583576083183289, 0.2598670721054077, 0.28389835357666016, 0.3079296350479126, 0.33196091651916504, 0.3559921979904175, 0.3800234794616699, 0.40405476093292236, 0.4280860424041748, 0.45211732387542725, 0.4761486053466797, 0.5001798868179321, 0.5242111682891846, 0.548242449760437, 0.5722737312316895, 0.5963050127029419, 0.6203362941741943, 0.6443675756454468, 0.6683988571166992, 0.6924301385879517, 0.7164614200592041, 0.7404927015304565, 0.7645240426063538]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 13.0, 6.0, 11.0, 16.0, 22.0, 33.0, 53.0, 80.0, 139.0, 201.0, 340.0, 556.0, 930.0, 1842.0, 3519.0, 7415.0, 17543.0, 49102.0, 248409.0, 2708540.0, 998860.0, 106666.0, 28055.0, 11020.0, 4956.0, 2442.0, 1372.0, 786.0, 452.0, 295.0, 196.0, 133.0, 78.0, 69.0, 40.0, 30.0, 23.0, 11.0, 11.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.132568359375, -0.1274261474609375, -0.122283935546875, -0.1171417236328125, -0.11199951171875, -0.1068572998046875, -0.101715087890625, -0.0965728759765625, -0.0914306640625, -0.0862884521484375, -0.081146240234375, -0.0760040283203125, -0.07086181640625, -0.0657196044921875, -0.060577392578125, -0.0554351806640625, -0.05029296875, -0.0451507568359375, -0.040008544921875, -0.0348663330078125, -0.02972412109375, -0.0245819091796875, -0.019439697265625, -0.0142974853515625, -0.0091552734375, -0.0040130615234375, 0.001129150390625, 0.0062713623046875, 0.01141357421875, 0.0165557861328125, 0.021697998046875, 0.0268402099609375, 0.031982421875, 0.0371246337890625, 0.042266845703125, 0.0474090576171875, 0.05255126953125, 0.0576934814453125, 0.062835693359375, 0.0679779052734375, 0.0731201171875, 0.0782623291015625, 0.083404541015625, 0.0885467529296875, 0.09368896484375, 0.0988311767578125, 0.103973388671875, 0.1091156005859375, 0.1142578125, 0.1194000244140625, 0.124542236328125, 0.1296844482421875, 0.13482666015625, 0.1399688720703125, 0.145111083984375, 0.1502532958984375, 0.1553955078125, 0.1605377197265625, 0.165679931640625, 0.1708221435546875, 0.17596435546875, 0.1811065673828125, 0.186248779296875, 0.1913909912109375, 0.196533203125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 7.0, 16.0, 18.0, 33.0, 52.0, 44.0, 72.0, 73.0, 81.0, 124.0, 109.0, 94.0, 65.0, 75.0, 44.0, 31.0, 25.0, 15.0, 6.0, 11.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1943359375, -0.1864776611328125, -0.178619384765625, -0.1707611083984375, -0.16290283203125, -0.1550445556640625, -0.147186279296875, -0.1393280029296875, -0.1314697265625, -0.1236114501953125, -0.115753173828125, -0.1078948974609375, -0.10003662109375, -0.0921783447265625, -0.084320068359375, -0.0764617919921875, -0.068603515625, -0.0607452392578125, -0.052886962890625, -0.0450286865234375, -0.03717041015625, -0.0293121337890625, -0.021453857421875, -0.0135955810546875, -0.0057373046875, 0.0021209716796875, 0.009979248046875, 0.0178375244140625, 0.02569580078125, 0.0335540771484375, 0.041412353515625, 0.0492706298828125, 0.05712890625, 0.0649871826171875, 0.072845458984375, 0.0807037353515625, 0.08856201171875, 0.0964202880859375, 0.104278564453125, 0.1121368408203125, 0.1199951171875, 0.1278533935546875, 0.135711669921875, 0.1435699462890625, 0.15142822265625, 0.1592864990234375, 0.167144775390625, 0.1750030517578125, 0.182861328125, 0.1907196044921875, 0.198577880859375, 0.2064361572265625, 0.21429443359375, 0.2221527099609375, 0.230010986328125, 0.2378692626953125, 0.2457275390625, 0.2535858154296875, 0.261444091796875, 0.2693023681640625, 0.27716064453125, 0.2850189208984375, 0.292877197265625, 0.3007354736328125, 0.30859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 6.0, 7.0, 4.0, 7.0, 6.0, 12.0, 14.0, 24.0, 22.0, 20.0, 44.0, 63.0, 91.0, 110.0, 209.0, 346.0, 650.0, 1462.0, 4098.0, 16902.0, 152276.0, 3714782.0, 270805.0, 23480.0, 5207.0, 1797.0, 708.0, 376.0, 227.0, 129.0, 98.0, 70.0, 38.0, 34.0, 34.0, 22.0, 15.0, 15.0, 11.0, 8.0, 11.0, 8.0, 10.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.4306640625, -0.417449951171875, -0.40423583984375, -0.391021728515625, -0.3778076171875, -0.364593505859375, -0.35137939453125, -0.338165283203125, -0.324951171875, -0.311737060546875, -0.29852294921875, -0.285308837890625, -0.2720947265625, -0.258880615234375, -0.24566650390625, -0.232452392578125, -0.21923828125, -0.206024169921875, -0.19281005859375, -0.179595947265625, -0.1663818359375, -0.153167724609375, -0.13995361328125, -0.126739501953125, -0.113525390625, -0.100311279296875, -0.08709716796875, -0.073883056640625, -0.0606689453125, -0.047454833984375, -0.03424072265625, -0.021026611328125, -0.0078125, 0.005401611328125, 0.01861572265625, 0.031829833984375, 0.0450439453125, 0.058258056640625, 0.07147216796875, 0.084686279296875, 0.097900390625, 0.111114501953125, 0.12432861328125, 0.137542724609375, 0.1507568359375, 0.163970947265625, 0.17718505859375, 0.190399169921875, 0.20361328125, 0.216827392578125, 0.23004150390625, 0.243255615234375, 0.2564697265625, 0.269683837890625, 0.28289794921875, 0.296112060546875, 0.309326171875, 0.322540283203125, 0.33575439453125, 0.348968505859375, 0.3621826171875, 0.375396728515625, 0.38861083984375, 0.401824951171875, 0.4150390625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 10.0, 10.0, 15.0, 28.0, 51.0, 119.0, 323.0, 1577.0, 1440.0, 290.0, 93.0, 51.0, 32.0, 10.0, 16.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.182373046875, -0.17013931274414062, -0.15790557861328125, -0.14567184448242188, -0.1334381103515625, -0.12120437622070312, -0.10897064208984375, -0.09673690795898438, -0.084503173828125, -0.07226943969726562, -0.06003570556640625, -0.047801971435546875, -0.0355682373046875, -0.023334503173828125, -0.01110076904296875, 0.001132965087890625, 0.01336669921875, 0.025600433349609375, 0.03783416748046875, 0.050067901611328125, 0.0623016357421875, 0.07453536987304688, 0.08676910400390625, 0.09900283813476562, 0.111236572265625, 0.12347030639648438, 0.13570404052734375, 0.14793777465820312, 0.1601715087890625, 0.17240524291992188, 0.18463897705078125, 0.19687271118164062, 0.2091064453125, 0.22134017944335938, 0.23357391357421875, 0.24580764770507812, 0.2580413818359375, 0.2702751159667969, 0.28250885009765625, 0.2947425842285156, 0.306976318359375, 0.3192100524902344, 0.33144378662109375, 0.3436775207519531, 0.3559112548828125, 0.3681449890136719, 0.38037872314453125, 0.3926124572753906, 0.40484619140625, 0.4170799255371094, 0.42931365966796875, 0.4415473937988281, 0.4537811279296875, 0.4660148620605469, 0.47824859619140625, 0.4904823303222656, 0.502716064453125, 0.5149497985839844, 0.5271835327148438, 0.5394172668457031, 0.5516510009765625, 0.5638847351074219, 0.5761184692382812, 0.5883522033691406, 0.6005859375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 1.0, 3.0, 4.0, 19.0, 37.0, 32.0, 46.0, 60.0, 94.0, 92.0, 89.0, 104.0, 80.0, 86.0, 58.0, 38.0, 48.0, 31.0, 18.0, 17.0, 7.0, 9.0, 7.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47700566053390503, -0.4544636905193329, -0.43192169070243835, -0.4093797206878662, -0.3868377208709717, -0.36429575085639954, -0.3417537808418274, -0.31921178102493286, -0.2966698110103607, -0.2741278409957886, -0.25158584117889404, -0.2290438711643219, -0.20650188624858856, -0.18395990133285522, -0.16141793131828308, -0.13887594640254974, -0.1163339614868164, -0.09379197657108307, -0.07124999910593033, -0.04870802164077759, -0.02616603672504425, -0.003624051809310913, 0.01891791820526123, 0.04145990312099457, 0.0640018880367279, 0.08654387295246124, 0.10908585041761398, 0.13162782788276672, 0.15416981279850006, 0.1767117977142334, 0.19925376772880554, 0.22179575264453888, 0.24433773756027222, 0.26687970757484436, 0.2894217073917389, 0.31196367740631104, 0.33450567722320557, 0.3570476472377777, 0.37958961725234985, 0.4021316170692444, 0.42467358708381653, 0.44721555709838867, 0.4697575569152832, 0.49229952692985535, 0.5148414969444275, 0.537383496761322, 0.5599254369735718, 0.5824674367904663, 0.6050094366073608, 0.6275514364242554, 0.6500933766365051, 0.6726353764533997, 0.6951773762702942, 0.717719316482544, 0.7402613162994385, 0.762803316116333, 0.7853453159332275, 0.8078873157501221, 0.8304292559623718, 0.8529712557792664, 0.8755132555961609, 0.8980551958084106, 0.9205971956253052, 0.9431391954421997, 0.9656811356544495]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 9.0, 6.0, 7.0, 8.0, 16.0, 13.0, 18.0, 25.0, 30.0, 25.0, 28.0, 26.0, 31.0, 33.0, 34.0, 36.0, 36.0, 40.0, 42.0, 50.0, 53.0, 38.0, 39.0, 31.0, 41.0, 37.0, 32.0, 34.0, 30.0, 24.0, 26.0, 22.0, 13.0, 19.0, 10.0, 11.0, 11.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.6244544982910156, -0.6047027111053467, -0.5849509835243225, -0.5651991963386536, -0.5454474687576294, -0.5256956815719604, -0.5059439539909363, -0.48619216680526733, -0.4664404094219208, -0.4466886520385742, -0.42693689465522766, -0.4071851372718811, -0.38743335008621216, -0.367681622505188, -0.34792983531951904, -0.3281780779361725, -0.3084263205528259, -0.28867456316947937, -0.2689228057861328, -0.24917103350162506, -0.2294192761182785, -0.20966751873493195, -0.1899157464504242, -0.17016398906707764, -0.15041223168373108, -0.13066047430038452, -0.11090870946645737, -0.09115694463253021, -0.07140518724918365, -0.0516534298658371, -0.03190166503190994, -0.012149900197982788, 0.007601916790008545, 0.0273536778986454, 0.04710543900728226, 0.06685720384120941, 0.08660896122455597, 0.10636071860790253, 0.12611249089241028, 0.14586424827575684, 0.1656160056591034, 0.18536776304244995, 0.2051195204257965, 0.22487129271030426, 0.24462305009365082, 0.2643747925758362, 0.2841265797615051, 0.3038783371448517, 0.32363009452819824, 0.3433818519115448, 0.36313360929489136, 0.3828853666782379, 0.4026371240615845, 0.4223889112472534, 0.4421406686306, 0.46189242601394653, 0.4816441833972931, 0.5013959407806396, 0.5211477279663086, 0.5408994555473328, 0.5606512427330017, 0.5804029703140259, 0.6001547574996948, 0.6199065446853638, 0.6396582722663879]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 11.0, 15.0, 30.0, 33.0, 70.0, 124.0, 220.0, 333.0, 560.0, 1136.0, 2448.0, 4981.0, 11663.0, 29912.0, 91125.0, 324163.0, 400705.0, 117972.0, 37162.0, 14221.0, 6046.0, 2680.0, 1302.0, 698.0, 383.0, 229.0, 131.0, 68.0, 49.0, 29.0, 11.0, 13.0, 8.0, 8.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.318359375, -0.3090248107910156, -0.29969024658203125, -0.2903556823730469, -0.2810211181640625, -0.2716865539550781, -0.26235198974609375, -0.2530174255371094, -0.243682861328125, -0.23434829711914062, -0.22501373291015625, -0.21567916870117188, -0.2063446044921875, -0.19701004028320312, -0.18767547607421875, -0.17834091186523438, -0.16900634765625, -0.15967178344726562, -0.15033721923828125, -0.14100265502929688, -0.1316680908203125, -0.12233352661132812, -0.11299896240234375, -0.10366439819335938, -0.094329833984375, -0.08499526977539062, -0.07566070556640625, -0.06632614135742188, -0.0569915771484375, -0.047657012939453125, -0.03832244873046875, -0.028987884521484375, -0.0196533203125, -0.010318756103515625, -0.00098419189453125, 0.008350372314453125, 0.0176849365234375, 0.027019500732421875, 0.03635406494140625, 0.045688629150390625, 0.055023193359375, 0.06435775756835938, 0.07369232177734375, 0.08302688598632812, 0.0923614501953125, 0.10169601440429688, 0.11103057861328125, 0.12036514282226562, 0.12969970703125, 0.13903427124023438, 0.14836883544921875, 0.15770339965820312, 0.1670379638671875, 0.17637252807617188, 0.18570709228515625, 0.19504165649414062, 0.204376220703125, 0.21371078491210938, 0.22304534912109375, 0.23237991333007812, 0.2417144775390625, 0.2510490417480469, 0.26038360595703125, 0.2697181701660156, 0.279052734375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 9.0, 20.0, 20.0, 27.0, 35.0, 36.0, 65.0, 60.0, 76.0, 70.0, 67.0, 86.0, 77.0, 68.0, 68.0, 46.0, 52.0, 32.0, 32.0, 21.0, 11.0, 8.0, 3.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1756591796875, -0.1683330535888672, -0.16100692749023438, -0.15368080139160156, -0.14635467529296875, -0.13902854919433594, -0.13170242309570312, -0.12437629699707031, -0.1170501708984375, -0.10972404479980469, -0.10239791870117188, -0.09507179260253906, -0.08774566650390625, -0.08041954040527344, -0.07309341430664062, -0.06576728820800781, -0.058441162109375, -0.05111503601074219, -0.043788909912109375, -0.03646278381347656, -0.02913665771484375, -0.021810531616210938, -0.014484405517578125, -0.0071582794189453125, 0.0001678466796875, 0.0074939727783203125, 0.014820098876953125, 0.022146224975585938, 0.02947235107421875, 0.03679847717285156, 0.044124603271484375, 0.05145072937011719, 0.05877685546875, 0.06610298156738281, 0.07342910766601562, 0.08075523376464844, 0.08808135986328125, 0.09540748596191406, 0.10273361206054688, 0.11005973815917969, 0.1173858642578125, 0.12471199035644531, 0.13203811645507812, 0.13936424255371094, 0.14669036865234375, 0.15401649475097656, 0.16134262084960938, 0.1686687469482422, 0.175994873046875, 0.1833209991455078, 0.19064712524414062, 0.19797325134277344, 0.20529937744140625, 0.21262550354003906, 0.21995162963867188, 0.2272777557373047, 0.2346038818359375, 0.2419300079345703, 0.24925613403320312, 0.25658226013183594, 0.26390838623046875, 0.27123451232910156, 0.2785606384277344, 0.2858867645263672, 0.293212890625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 12.0, 10.0, 12.0, 10.0, 15.0, 22.0, 28.0, 61.0, 90.0, 201.0, 371.0, 933.0, 2193.0, 5919.0, 18544.0, 72952.0, 456230.0, 399832.0, 64784.0, 16761.0, 5751.0, 2125.0, 893.0, 359.0, 179.0, 79.0, 54.0, 33.0, 21.0, 18.0, 14.0, 10.0, 6.0, 7.0, 5.0, 4.0, 6.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.461669921875, -0.447662353515625, -0.43365478515625, -0.419647216796875, -0.4056396484375, -0.391632080078125, -0.37762451171875, -0.363616943359375, -0.349609375, -0.335601806640625, -0.32159423828125, -0.307586669921875, -0.2935791015625, -0.279571533203125, -0.26556396484375, -0.251556396484375, -0.237548828125, -0.223541259765625, -0.20953369140625, -0.195526123046875, -0.1815185546875, -0.167510986328125, -0.15350341796875, -0.139495849609375, -0.12548828125, -0.111480712890625, -0.09747314453125, -0.083465576171875, -0.0694580078125, -0.055450439453125, -0.04144287109375, -0.027435302734375, -0.013427734375, 0.000579833984375, 0.01458740234375, 0.028594970703125, 0.0426025390625, 0.056610107421875, 0.07061767578125, 0.084625244140625, 0.0986328125, 0.112640380859375, 0.12664794921875, 0.140655517578125, 0.1546630859375, 0.168670654296875, 0.18267822265625, 0.196685791015625, 0.210693359375, 0.224700927734375, 0.23870849609375, 0.252716064453125, 0.2667236328125, 0.280731201171875, 0.29473876953125, 0.308746337890625, 0.32275390625, 0.336761474609375, 0.35076904296875, 0.364776611328125, 0.3787841796875, 0.392791748046875, 0.40679931640625, 0.420806884765625, 0.434814453125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 5.0, 7.0, 3.0, 5.0, 7.0, 7.0, 5.0, 14.0, 15.0, 12.0, 18.0, 26.0, 30.0, 28.0, 37.0, 39.0, 38.0, 42.0, 49.0, 41.0, 63.0, 44.0, 50.0, 52.0, 38.0, 45.0, 40.0, 33.0, 36.0, 29.0, 20.0, 20.0, 14.0, 15.0, 16.0, 11.0, 10.0, 4.0, 5.0, 7.0, 7.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.4521484375, -0.4389610290527344, -0.42577362060546875, -0.4125862121582031, -0.3993988037109375, -0.3862113952636719, -0.37302398681640625, -0.3598365783691406, -0.346649169921875, -0.3334617614746094, -0.32027435302734375, -0.3070869445800781, -0.2938995361328125, -0.2807121276855469, -0.26752471923828125, -0.2543373107910156, -0.24114990234375, -0.22796249389648438, -0.21477508544921875, -0.20158767700195312, -0.1884002685546875, -0.17521286010742188, -0.16202545166015625, -0.14883804321289062, -0.135650634765625, -0.12246322631835938, -0.10927581787109375, -0.09608840942382812, -0.0829010009765625, -0.06971359252929688, -0.05652618408203125, -0.043338775634765625, -0.0301513671875, -0.016963958740234375, -0.00377655029296875, 0.009410858154296875, 0.0225982666015625, 0.035785675048828125, 0.04897308349609375, 0.062160491943359375, 0.075347900390625, 0.08853530883789062, 0.10172271728515625, 0.11491012573242188, 0.1280975341796875, 0.14128494262695312, 0.15447235107421875, 0.16765975952148438, 0.18084716796875, 0.19403457641601562, 0.20722198486328125, 0.22040939331054688, 0.2335968017578125, 0.24678421020507812, 0.25997161865234375, 0.2731590270996094, 0.286346435546875, 0.2995338439941406, 0.31272125244140625, 0.3259086608886719, 0.3390960693359375, 0.3522834777832031, 0.36547088623046875, 0.3786582946777344, 0.391845703125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 10.0, 16.0, 19.0, 16.0, 36.0, 53.0, 59.0, 106.0, 162.0, 319.0, 654.0, 1457.0, 3476.0, 9225.0, 25750.0, 86772.0, 433681.0, 374142.0, 75370.0, 23065.0, 8385.0, 3101.0, 1272.0, 601.0, 316.0, 170.0, 91.0, 60.0, 46.0, 31.0, 21.0, 17.0, 15.0, 14.0, 7.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14892578125, -0.1439533233642578, -0.13898086547851562, -0.13400840759277344, -0.12903594970703125, -0.12406349182128906, -0.11909103393554688, -0.11411857604980469, -0.1091461181640625, -0.10417366027832031, -0.09920120239257812, -0.09422874450683594, -0.08925628662109375, -0.08428382873535156, -0.07931137084960938, -0.07433891296386719, -0.069366455078125, -0.06439399719238281, -0.059421539306640625, -0.05444908142089844, -0.04947662353515625, -0.04450416564941406, -0.039531707763671875, -0.03455924987792969, -0.0295867919921875, -0.024614334106445312, -0.019641876220703125, -0.014669418334960938, -0.00969696044921875, -0.0047245025634765625, 0.000247955322265625, 0.0052204132080078125, 0.01019287109375, 0.015165328979492188, 0.020137786865234375, 0.025110244750976562, 0.03008270263671875, 0.03505516052246094, 0.040027618408203125, 0.04500007629394531, 0.0499725341796875, 0.05494499206542969, 0.059917449951171875, 0.06488990783691406, 0.06986236572265625, 0.07483482360839844, 0.07980728149414062, 0.08477973937988281, 0.089752197265625, 0.09472465515136719, 0.09969711303710938, 0.10466957092285156, 0.10964202880859375, 0.11461448669433594, 0.11958694458007812, 0.12455940246582031, 0.1295318603515625, 0.1345043182373047, 0.13947677612304688, 0.14444923400878906, 0.14942169189453125, 0.15439414978027344, 0.15936660766601562, 0.1643390655517578, 0.1693115234375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 11.0, 11.0, 5.0, 10.0, 21.0, 22.0, 44.0, 68.0, 101.0, 139.0, 155.0, 141.0, 95.0, 63.0, 43.0, 21.0, 16.0, 10.0, 10.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3915042877197266e-05, -3.267824649810791e-05, -3.1441450119018555e-05, -3.02046537399292e-05, -2.8967857360839844e-05, -2.7731060981750488e-05, -2.6494264602661133e-05, -2.5257468223571777e-05, -2.4020671844482422e-05, -2.2783875465393066e-05, -2.154707908630371e-05, -2.0310282707214355e-05, -1.9073486328125e-05, -1.7836689949035645e-05, -1.659989356994629e-05, -1.5363097190856934e-05, -1.4126300811767578e-05, -1.2889504432678223e-05, -1.1652708053588867e-05, -1.0415911674499512e-05, -9.179115295410156e-06, -7.9423189163208e-06, -6.705522537231445e-06, -5.46872615814209e-06, -4.231929779052734e-06, -2.995133399963379e-06, -1.7583370208740234e-06, -5.21540641784668e-07, 7.152557373046875e-07, 1.952052116394043e-06, 3.1888484954833984e-06, 4.425644874572754e-06, 5.662441253662109e-06, 6.899237632751465e-06, 8.13603401184082e-06, 9.372830390930176e-06, 1.0609626770019531e-05, 1.1846423149108887e-05, 1.3083219528198242e-05, 1.4320015907287598e-05, 1.5556812286376953e-05, 1.679360866546631e-05, 1.8030405044555664e-05, 1.926720142364502e-05, 2.0503997802734375e-05, 2.174079418182373e-05, 2.2977590560913086e-05, 2.421438694000244e-05, 2.5451183319091797e-05, 2.6687979698181152e-05, 2.7924776077270508e-05, 2.9161572456359863e-05, 3.039836883544922e-05, 3.1635165214538574e-05, 3.287196159362793e-05, 3.4108757972717285e-05, 3.534555435180664e-05, 3.6582350730895996e-05, 3.781914710998535e-05, 3.905594348907471e-05, 4.029273986816406e-05, 4.152953624725342e-05, 4.2766332626342773e-05, 4.400312900543213e-05, 4.5239925384521484e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 6.0, 7.0, 12.0, 29.0, 33.0, 79.0, 132.0, 230.0, 428.0, 926.0, 1913.0, 4687.0, 13470.0, 47930.0, 240490.0, 563172.0, 130495.0, 29109.0, 9159.0, 3370.0, 1434.0, 650.0, 361.0, 182.0, 106.0, 64.0, 36.0, 21.0, 11.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14697265625, -0.142425537109375, -0.13787841796875, -0.133331298828125, -0.1287841796875, -0.124237060546875, -0.11968994140625, -0.115142822265625, -0.110595703125, -0.106048583984375, -0.10150146484375, -0.096954345703125, -0.0924072265625, -0.087860107421875, -0.08331298828125, -0.078765869140625, -0.07421875, -0.069671630859375, -0.06512451171875, -0.060577392578125, -0.0560302734375, -0.051483154296875, -0.04693603515625, -0.042388916015625, -0.037841796875, -0.033294677734375, -0.02874755859375, -0.024200439453125, -0.0196533203125, -0.015106201171875, -0.01055908203125, -0.006011962890625, -0.00146484375, 0.003082275390625, 0.00762939453125, 0.012176513671875, 0.0167236328125, 0.021270751953125, 0.02581787109375, 0.030364990234375, 0.034912109375, 0.039459228515625, 0.04400634765625, 0.048553466796875, 0.0531005859375, 0.057647705078125, 0.06219482421875, 0.066741943359375, 0.0712890625, 0.075836181640625, 0.08038330078125, 0.084930419921875, 0.0894775390625, 0.094024658203125, 0.09857177734375, 0.103118896484375, 0.107666015625, 0.112213134765625, 0.11676025390625, 0.121307373046875, 0.1258544921875, 0.130401611328125, 0.13494873046875, 0.139495849609375, 0.14404296875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 13.0, 12.0, 11.0, 13.0, 31.0, 44.0, 59.0, 71.0, 114.0, 131.0, 127.0, 93.0, 94.0, 60.0, 44.0, 29.0, 13.0, 8.0, 7.0, 6.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1705322265625, -0.1651935577392578, -0.15985488891601562, -0.15451622009277344, -0.14917755126953125, -0.14383888244628906, -0.13850021362304688, -0.1331615447998047, -0.1278228759765625, -0.12248420715332031, -0.11714553833007812, -0.11180686950683594, -0.10646820068359375, -0.10112953186035156, -0.09579086303710938, -0.09045219421386719, -0.085113525390625, -0.07977485656738281, -0.07443618774414062, -0.06909751892089844, -0.06375885009765625, -0.05842018127441406, -0.053081512451171875, -0.04774284362792969, -0.0424041748046875, -0.03706550598144531, -0.031726837158203125, -0.026388168334960938, -0.02104949951171875, -0.015710830688476562, -0.010372161865234375, -0.0050334930419921875, 0.00030517578125, 0.0056438446044921875, 0.010982513427734375, 0.016321182250976562, 0.02165985107421875, 0.026998519897460938, 0.032337188720703125, 0.03767585754394531, 0.0430145263671875, 0.04835319519042969, 0.053691864013671875, 0.05903053283691406, 0.06436920166015625, 0.06970787048339844, 0.07504653930664062, 0.08038520812988281, 0.085723876953125, 0.09106254577636719, 0.09640121459960938, 0.10173988342285156, 0.10707855224609375, 0.11241722106933594, 0.11775588989257812, 0.12309455871582031, 0.1284332275390625, 0.1337718963623047, 0.13911056518554688, 0.14444923400878906, 0.14978790283203125, 0.15512657165527344, 0.16046524047851562, 0.1658039093017578, 0.171142578125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [3.0, 12.0, 51.0, 272.0, 413.0, 202.0, 47.0, 13.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5906901955604553, -0.45336323976516724, -0.31603631377220154, -0.17870938777923584, -0.041382431983947754, 0.09594452381134033, 0.23327142000198364, 0.37059837579727173, 0.5079253315925598, 0.6452522873878479, 0.7825791835784912, 0.9199061393737793, 1.0572330951690674, 1.1945600509643555, 1.3318870067596436, 1.4692139625549316, 1.6065409183502197, 1.7438678741455078, 1.881194829940796, 2.018521785736084, 2.155848741531372, 2.29317569732666, 2.430502414703369, 2.5678296089172363, 2.7051563262939453, 2.8424832820892334, 2.9798102378845215, 3.1171371936798096, 3.2544641494750977, 3.3917911052703857, 3.529118061065674, 3.666444778442383, 3.803771495819092, 3.94109845161438, 4.078425407409668, 4.215752124786377, 4.353079319000244, 4.490406036376953, 4.62773323059082, 4.765059947967529, 4.9023871421813965, 5.0397138595581055, 5.177041053771973, 5.314367771148682, 5.451694965362549, 5.589021682739258, 5.726348876953125, 5.863675594329834, 6.001002311706543, 6.138329029083252, 6.275656223297119, 6.412982940673828, 6.550310134887695, 6.687636852264404, 6.8249640464782715, 6.9622907638549805, 7.099617958068848, 7.236944675445557, 7.374271869659424, 7.511598587036133, 7.64892578125, 7.786252498626709, 7.923579692840576, 8.060906410217285, 8.198233604431152]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 11.0, 5.0, 4.0, 12.0, 16.0, 16.0, 22.0, 23.0, 26.0, 21.0, 24.0, 31.0, 32.0, 26.0, 42.0, 38.0, 43.0, 45.0, 38.0, 35.0, 51.0, 46.0, 51.0, 40.0, 21.0, 46.0, 35.0, 23.0, 25.0, 26.0, 19.0, 24.0, 12.0, 25.0, 8.0, 4.0, 7.0, 9.0, 7.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9291442632675171, -0.8967629075050354, -0.8643815517425537, -0.8320001363754272, -0.7996187806129456, -0.7672374248504639, -0.7348560094833374, -0.7024746537208557, -0.670093297958374, -0.6377119421958923, -0.6053305864334106, -0.5729491710662842, -0.5405678153038025, -0.5081864595413208, -0.4758050739765167, -0.44342368841171265, -0.41104233264923096, -0.37866097688674927, -0.3462795913219452, -0.3138982057571411, -0.2815168499946594, -0.24913547933101654, -0.21675410866737366, -0.18437273800373077, -0.1519913673400879, -0.11960999667644501, -0.08722862601280212, -0.05484725534915924, -0.022465884685516357, 0.009915485978126526, 0.04229685664176941, 0.07467822730541229, 0.10705971717834473, 0.1394410878419876, 0.1718224585056305, 0.20420382916927338, 0.23658519983291626, 0.26896655559539795, 0.301347941160202, 0.3337293267250061, 0.3661106824874878, 0.3984920382499695, 0.43087342381477356, 0.46325480937957764, 0.4956361651420593, 0.528017520904541, 0.5603989362716675, 0.5927802920341492, 0.6251616477966309, 0.6575430035591125, 0.6899243593215942, 0.7223057746887207, 0.7546871304512024, 0.7870684862136841, 0.8194499015808105, 0.8518312573432922, 0.8842126131057739, 0.9165939688682556, 0.9489753246307373, 0.9813567399978638, 1.0137381553649902, 1.0461194515228271, 1.0785008668899536, 1.1108821630477905, 1.143263578414917]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 4.0, 5.0, 9.0, 18.0, 28.0, 42.0, 55.0, 71.0, 95.0, 133.0, 176.0, 297.0, 387.0, 711.0, 1151.0, 2405.0, 6017.0, 16128.0, 56344.0, 450586.0, 2905617.0, 657329.0, 66472.0, 17382.0, 6464.0, 2762.0, 1326.0, 805.0, 448.0, 299.0, 198.0, 144.0, 104.0, 67.0, 48.0, 39.0, 33.0, 14.0, 20.0, 20.0, 10.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.245361328125, -0.2380523681640625, -0.230743408203125, -0.2234344482421875, -0.21612548828125, -0.2088165283203125, -0.201507568359375, -0.1941986083984375, -0.1868896484375, -0.1795806884765625, -0.172271728515625, -0.1649627685546875, -0.15765380859375, -0.1503448486328125, -0.143035888671875, -0.1357269287109375, -0.12841796875, -0.1211090087890625, -0.113800048828125, -0.1064910888671875, -0.09918212890625, -0.0918731689453125, -0.084564208984375, -0.0772552490234375, -0.0699462890625, -0.0626373291015625, -0.055328369140625, -0.0480194091796875, -0.04071044921875, -0.0334014892578125, -0.026092529296875, -0.0187835693359375, -0.011474609375, -0.0041656494140625, 0.003143310546875, 0.0104522705078125, 0.01776123046875, 0.0250701904296875, 0.032379150390625, 0.0396881103515625, 0.0469970703125, 0.0543060302734375, 0.061614990234375, 0.0689239501953125, 0.07623291015625, 0.0835418701171875, 0.090850830078125, 0.0981597900390625, 0.10546875, 0.1127777099609375, 0.120086669921875, 0.1273956298828125, 0.13470458984375, 0.1420135498046875, 0.149322509765625, 0.1566314697265625, 0.1639404296875, 0.1712493896484375, 0.178558349609375, 0.1858673095703125, 0.19317626953125, 0.2004852294921875, 0.207794189453125, 0.2151031494140625, 0.222412109375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 8.0, 4.0, 12.0, 8.0, 16.0, 24.0, 35.0, 30.0, 30.0, 54.0, 64.0, 73.0, 61.0, 63.0, 78.0, 76.0, 61.0, 54.0, 63.0, 47.0, 33.0, 23.0, 25.0, 18.0, 14.0, 9.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1876220703125, -0.1801891326904297, -0.17275619506835938, -0.16532325744628906, -0.15789031982421875, -0.15045738220214844, -0.14302444458007812, -0.1355915069580078, -0.1281585693359375, -0.12072563171386719, -0.11329269409179688, -0.10585975646972656, -0.09842681884765625, -0.09099388122558594, -0.08356094360351562, -0.07612800598144531, -0.068695068359375, -0.06126213073730469, -0.053829193115234375, -0.04639625549316406, -0.03896331787109375, -0.03153038024902344, -0.024097442626953125, -0.016664505004882812, -0.0092315673828125, -0.0017986297607421875, 0.005634307861328125, 0.013067245483398438, 0.02050018310546875, 0.027933120727539062, 0.035366058349609375, 0.04279899597167969, 0.05023193359375, 0.05766487121582031, 0.06509780883789062, 0.07253074645996094, 0.07996368408203125, 0.08739662170410156, 0.09482955932617188, 0.10226249694824219, 0.1096954345703125, 0.11712837219238281, 0.12456130981445312, 0.13199424743652344, 0.13942718505859375, 0.14686012268066406, 0.15429306030273438, 0.1617259979248047, 0.169158935546875, 0.1765918731689453, 0.18402481079101562, 0.19145774841308594, 0.19889068603515625, 0.20632362365722656, 0.21375656127929688, 0.2211894989013672, 0.2286224365234375, 0.2360553741455078, 0.24348831176757812, 0.25092124938964844, 0.25835418701171875, 0.26578712463378906, 0.2732200622558594, 0.2806529998779297, 0.2880859375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 1.0, 2.0, 2.0, 16.0, 12.0, 9.0, 19.0, 21.0, 36.0, 47.0, 67.0, 77.0, 120.0, 195.0, 308.0, 441.0, 775.0, 1334.0, 2426.0, 4961.0, 11914.0, 38144.0, 189487.0, 2911225.0, 899968.0, 93042.0, 23082.0, 8256.0, 3582.0, 1876.0, 1085.0, 636.0, 361.0, 230.0, 149.0, 95.0, 72.0, 53.0, 38.0, 27.0, 17.0, 18.0, 16.0, 8.0, 10.0, 8.0, 3.0, 1.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3349609375, -0.3247489929199219, -0.31453704833984375, -0.3043251037597656, -0.2941131591796875, -0.2839012145996094, -0.27368927001953125, -0.2634773254394531, -0.253265380859375, -0.24305343627929688, -0.23284149169921875, -0.22262954711914062, -0.2124176025390625, -0.20220565795898438, -0.19199371337890625, -0.18178176879882812, -0.17156982421875, -0.16135787963867188, -0.15114593505859375, -0.14093399047851562, -0.1307220458984375, -0.12051010131835938, -0.11029815673828125, -0.10008621215820312, -0.089874267578125, -0.07966232299804688, -0.06945037841796875, -0.059238433837890625, -0.0490264892578125, -0.038814544677734375, -0.02860260009765625, -0.018390655517578125, -0.0081787109375, 0.002033233642578125, 0.01224517822265625, 0.022457122802734375, 0.0326690673828125, 0.042881011962890625, 0.05309295654296875, 0.06330490112304688, 0.073516845703125, 0.08372879028320312, 0.09394073486328125, 0.10415267944335938, 0.1143646240234375, 0.12457656860351562, 0.13478851318359375, 0.14500045776367188, 0.15521240234375, 0.16542434692382812, 0.17563629150390625, 0.18584823608398438, 0.1960601806640625, 0.20627212524414062, 0.21648406982421875, 0.22669601440429688, 0.236907958984375, 0.24711990356445312, 0.25733184814453125, 0.2675437927246094, 0.2777557373046875, 0.2879676818847656, 0.29817962646484375, 0.3083915710449219, 0.318603515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 5.0, 9.0, 12.0, 20.0, 31.0, 43.0, 78.0, 184.0, 461.0, 1599.0, 1116.0, 268.0, 99.0, 72.0, 32.0, 12.0, 9.0, 12.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4189453125, -0.40268707275390625, -0.3864288330078125, -0.37017059326171875, -0.353912353515625, -0.33765411376953125, -0.3213958740234375, -0.30513763427734375, -0.28887939453125, -0.27262115478515625, -0.2563629150390625, -0.24010467529296875, -0.223846435546875, -0.20758819580078125, -0.1913299560546875, -0.17507171630859375, -0.1588134765625, -0.14255523681640625, -0.1262969970703125, -0.11003875732421875, -0.093780517578125, -0.07752227783203125, -0.0612640380859375, -0.04500579833984375, -0.02874755859375, -0.01248931884765625, 0.0037689208984375, 0.02002716064453125, 0.036285400390625, 0.05254364013671875, 0.0688018798828125, 0.08506011962890625, 0.101318359375, 0.11757659912109375, 0.1338348388671875, 0.15009307861328125, 0.166351318359375, 0.18260955810546875, 0.1988677978515625, 0.21512603759765625, 0.23138427734375, 0.24764251708984375, 0.2639007568359375, 0.28015899658203125, 0.296417236328125, 0.31267547607421875, 0.3289337158203125, 0.34519195556640625, 0.3614501953125, 0.37770843505859375, 0.3939666748046875, 0.41022491455078125, 0.426483154296875, 0.44274139404296875, 0.4589996337890625, 0.47525787353515625, 0.49151611328125, 0.5077743530273438, 0.5240325927734375, 0.5402908325195312, 0.556549072265625, 0.5728073120117188, 0.5890655517578125, 0.6053237915039062, 0.62158203125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 3.0, 7.0, 5.0, 11.0, 10.0, 20.0, 19.0, 15.0, 29.0, 27.0, 42.0, 38.0, 53.0, 84.0, 66.0, 75.0, 79.0, 74.0, 60.0, 53.0, 51.0, 32.0, 32.0, 27.0, 22.0, 15.0, 19.0, 9.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5974494218826294, -0.5755797624588013, -0.5537100434303284, -0.5318403840065002, -0.5099707245826721, -0.4881010353565216, -0.4662313461303711, -0.44436168670654297, -0.42249199748039246, -0.40062230825424194, -0.3787526488304138, -0.3568829596042633, -0.3350132703781128, -0.31314361095428467, -0.29127392172813416, -0.26940423250198364, -0.24753457307815552, -0.2256648987531662, -0.20379522442817688, -0.18192553520202637, -0.16005586087703705, -0.13818618655204773, -0.11631649732589722, -0.0944468230009079, -0.07257714867591858, -0.05070747062563896, -0.028837792575359344, -0.006968110799789429, 0.01490156352519989, 0.03677123785018921, 0.05864092707633972, 0.08051060140132904, 0.10238033533096313, 0.12425000965595245, 0.14611968398094177, 0.16798937320709229, 0.1898590475320816, 0.21172872185707092, 0.23359841108322144, 0.25546807050704956, 0.2773377597332001, 0.2992074489593506, 0.3210771083831787, 0.3429467976093292, 0.36481648683547974, 0.38668614625930786, 0.4085558354854584, 0.4304255247116089, 0.452295184135437, 0.4741648733615875, 0.49603453278541565, 0.5179042220115662, 0.5397738814353943, 0.5616436004638672, 0.5835132598876953, 0.6053829193115234, 0.6272525787353516, 0.6491222381591797, 0.6709919571876526, 0.6928616166114807, 0.7147312760353088, 0.7366009950637817, 0.7584706544876099, 0.780340313911438, 0.8022100329399109]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 4.0, 11.0, 10.0, 17.0, 15.0, 13.0, 19.0, 14.0, 20.0, 21.0, 34.0, 23.0, 39.0, 29.0, 32.0, 40.0, 34.0, 34.0, 46.0, 40.0, 31.0, 43.0, 45.0, 32.0, 41.0, 33.0, 35.0, 37.0, 35.0, 20.0, 27.0, 16.0, 16.0, 15.0, 14.0, 11.0, 10.0, 8.0, 4.0, 5.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.7544849514961243, -0.7314966320991516, -0.7085083723068237, -0.6855200529098511, -0.6625317335128784, -0.6395434141159058, -0.6165551543235779, -0.5935668349266052, -0.5705785751342773, -0.5475902557373047, -0.5246019959449768, -0.5016136765480042, -0.4786253571510315, -0.4556370675563812, -0.43264877796173096, -0.4096604585647583, -0.38667213916778564, -0.3636838495731354, -0.3406955301761627, -0.31770724058151245, -0.2947189211845398, -0.2717306315898895, -0.24874234199523926, -0.2257540374994278, -0.20276573300361633, -0.17977742850780487, -0.1567891240119934, -0.13380083441734314, -0.11081252992153168, -0.08782422542572021, -0.06483593583106995, -0.041847631335258484, -0.01885932683944702, 0.0041289739310741425, 0.027117274701595306, 0.05010557174682617, 0.07309387624263763, 0.0960821807384491, 0.11907047033309937, 0.14205877482891083, 0.1650470793247223, 0.18803538382053375, 0.21102368831634521, 0.23401197791099548, 0.25700026750564575, 0.2799885869026184, 0.3029768764972687, 0.32596516609191895, 0.3489534854888916, 0.37194177508354187, 0.3949300944805145, 0.4179183840751648, 0.44090670347213745, 0.4638949930667877, 0.486883282661438, 0.5098716020584106, 0.5328599214553833, 0.555848240852356, 0.5788365006446838, 0.6018248200416565, 0.6248131394386292, 0.647801399230957, 0.6707897186279297, 0.6937780380249023, 0.7167662978172302]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 10.0, 9.0, 27.0, 31.0, 50.0, 70.0, 124.0, 192.0, 302.0, 450.0, 795.0, 1191.0, 1956.0, 3162.0, 5436.0, 9511.0, 17138.0, 32481.0, 64374.0, 127833.0, 229818.0, 248005.0, 147308.0, 74485.0, 37594.0, 19884.0, 10887.0, 6198.0, 3531.0, 2148.0, 1294.0, 803.0, 514.0, 332.0, 224.0, 129.0, 85.0, 65.0, 32.0, 23.0, 18.0, 8.0, 5.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.2164306640625, -0.21026611328125, -0.2041015625, -0.19793701171875, -0.1917724609375, -0.18560791015625, -0.179443359375, -0.17327880859375, -0.1671142578125, -0.16094970703125, -0.15478515625, -0.14862060546875, -0.1424560546875, -0.13629150390625, -0.130126953125, -0.12396240234375, -0.1177978515625, -0.11163330078125, -0.10546875, -0.09930419921875, -0.0931396484375, -0.08697509765625, -0.080810546875, -0.07464599609375, -0.0684814453125, -0.06231689453125, -0.05615234375, -0.04998779296875, -0.0438232421875, -0.03765869140625, -0.031494140625, -0.02532958984375, -0.0191650390625, -0.01300048828125, -0.0068359375, -0.00067138671875, 0.0054931640625, 0.01165771484375, 0.017822265625, 0.02398681640625, 0.0301513671875, 0.03631591796875, 0.04248046875, 0.04864501953125, 0.0548095703125, 0.06097412109375, 0.067138671875, 0.07330322265625, 0.0794677734375, 0.08563232421875, 0.091796875, 0.09796142578125, 0.1041259765625, 0.11029052734375, 0.116455078125, 0.12261962890625, 0.1287841796875, 0.13494873046875, 0.14111328125, 0.14727783203125, 0.1534423828125, 0.15960693359375, 0.165771484375, 0.17193603515625, 0.1781005859375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 14.0, 17.0, 19.0, 34.0, 34.0, 47.0, 73.0, 59.0, 57.0, 59.0, 73.0, 61.0, 86.0, 78.0, 70.0, 45.0, 40.0, 28.0, 22.0, 25.0, 15.0, 8.0, 9.0, 5.0, 6.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2110595703125, -0.2031688690185547, -0.19527816772460938, -0.18738746643066406, -0.17949676513671875, -0.17160606384277344, -0.16371536254882812, -0.1558246612548828, -0.1479339599609375, -0.1400432586669922, -0.13215255737304688, -0.12426185607910156, -0.11637115478515625, -0.10848045349121094, -0.10058975219726562, -0.09269905090332031, -0.084808349609375, -0.07691764831542969, -0.06902694702148438, -0.06113624572753906, -0.05324554443359375, -0.04535484313964844, -0.037464141845703125, -0.029573440551757812, -0.0216827392578125, -0.013792037963867188, -0.005901336669921875, 0.0019893646240234375, 0.00988006591796875, 0.017770767211914062, 0.025661468505859375, 0.03355216979980469, 0.04144287109375, 0.04933357238769531, 0.057224273681640625, 0.06511497497558594, 0.07300567626953125, 0.08089637756347656, 0.08878707885742188, 0.09667778015136719, 0.1045684814453125, 0.11245918273925781, 0.12034988403320312, 0.12824058532714844, 0.13613128662109375, 0.14402198791503906, 0.15191268920898438, 0.1598033905029297, 0.167694091796875, 0.1755847930908203, 0.18347549438476562, 0.19136619567871094, 0.19925689697265625, 0.20714759826660156, 0.21503829956054688, 0.2229290008544922, 0.2308197021484375, 0.2387104034423828, 0.24660110473632812, 0.25449180603027344, 0.26238250732421875, 0.27027320861816406, 0.2781639099121094, 0.2860546112060547, 0.2939453125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 6.0, 13.0, 22.0, 34.0, 48.0, 100.0, 128.0, 240.0, 415.0, 802.0, 1769.0, 3965.0, 9320.0, 23200.0, 64938.0, 204622.0, 425349.0, 207336.0, 65883.0, 23282.0, 9286.0, 4080.0, 1816.0, 856.0, 460.0, 247.0, 134.0, 68.0, 46.0, 31.0, 18.0, 18.0, 6.0, 3.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.369140625, -0.3577842712402344, -0.34642791748046875, -0.3350715637207031, -0.3237152099609375, -0.3123588562011719, -0.30100250244140625, -0.2896461486816406, -0.278289794921875, -0.2669334411621094, -0.25557708740234375, -0.24422073364257812, -0.2328643798828125, -0.22150802612304688, -0.21015167236328125, -0.19879531860351562, -0.18743896484375, -0.17608261108398438, -0.16472625732421875, -0.15336990356445312, -0.1420135498046875, -0.13065719604492188, -0.11930084228515625, -0.10794448852539062, -0.096588134765625, -0.08523178100585938, -0.07387542724609375, -0.06251907348632812, -0.0511627197265625, -0.039806365966796875, -0.02845001220703125, -0.017093658447265625, -0.0057373046875, 0.005619049072265625, 0.01697540283203125, 0.028331756591796875, 0.0396881103515625, 0.051044464111328125, 0.06240081787109375, 0.07375717163085938, 0.085113525390625, 0.09646987915039062, 0.10782623291015625, 0.11918258666992188, 0.1305389404296875, 0.14189529418945312, 0.15325164794921875, 0.16460800170898438, 0.17596435546875, 0.18732070922851562, 0.19867706298828125, 0.21003341674804688, 0.2213897705078125, 0.23274612426757812, 0.24410247802734375, 0.2554588317871094, 0.266815185546875, 0.2781715393066406, 0.28952789306640625, 0.3008842468261719, 0.3122406005859375, 0.3235969543457031, 0.33495330810546875, 0.3463096618652344, 0.357666015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 2.0, 7.0, 9.0, 8.0, 14.0, 6.0, 18.0, 19.0, 21.0, 15.0, 26.0, 36.0, 38.0, 39.0, 43.0, 48.0, 40.0, 52.0, 63.0, 49.0, 53.0, 49.0, 39.0, 51.0, 48.0, 29.0, 35.0, 19.0, 20.0, 23.0, 11.0, 12.0, 13.0, 8.0, 13.0, 6.0, 4.0, 7.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64208984375, -0.6219711303710938, -0.6018524169921875, -0.5817337036132812, -0.561614990234375, -0.5414962768554688, -0.5213775634765625, -0.5012588500976562, -0.48114013671875, -0.46102142333984375, -0.4409027099609375, -0.42078399658203125, -0.400665283203125, -0.38054656982421875, -0.3604278564453125, -0.34030914306640625, -0.3201904296875, -0.30007171630859375, -0.2799530029296875, -0.25983428955078125, -0.239715576171875, -0.21959686279296875, -0.1994781494140625, -0.17935943603515625, -0.15924072265625, -0.13912200927734375, -0.1190032958984375, -0.09888458251953125, -0.078765869140625, -0.05864715576171875, -0.0385284423828125, -0.01840972900390625, 0.001708984375, 0.02182769775390625, 0.0419464111328125, 0.06206512451171875, 0.082183837890625, 0.10230255126953125, 0.1224212646484375, 0.14253997802734375, 0.16265869140625, 0.18277740478515625, 0.2028961181640625, 0.22301483154296875, 0.243133544921875, 0.26325225830078125, 0.2833709716796875, 0.30348968505859375, 0.3236083984375, 0.34372711181640625, 0.3638458251953125, 0.38396453857421875, 0.404083251953125, 0.42420196533203125, 0.4443206787109375, 0.46443939208984375, 0.48455810546875, 0.5046768188476562, 0.5247955322265625, 0.5449142456054688, 0.565032958984375, 0.5851516723632812, 0.6052703857421875, 0.6253890991210938, 0.6455078125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 30.0, 31.0, 55.0, 98.0, 194.0, 381.0, 908.0, 2826.0, 12638.0, 124205.0, 787083.0, 104568.0, 11370.0, 2506.0, 835.0, 393.0, 196.0, 90.0, 39.0, 31.0, 19.0, 8.0, 11.0, 9.0, 8.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.48828125, -0.4759101867675781, -0.46353912353515625, -0.4511680603027344, -0.4387969970703125, -0.4264259338378906, -0.41405487060546875, -0.4016838073730469, -0.389312744140625, -0.3769416809082031, -0.36457061767578125, -0.3521995544433594, -0.3398284912109375, -0.3274574279785156, -0.31508636474609375, -0.3027153015136719, -0.29034423828125, -0.2779731750488281, -0.26560211181640625, -0.2532310485839844, -0.2408599853515625, -0.22848892211914062, -0.21611785888671875, -0.20374679565429688, -0.191375732421875, -0.17900466918945312, -0.16663360595703125, -0.15426254272460938, -0.1418914794921875, -0.12952041625976562, -0.11714935302734375, -0.10477828979492188, -0.0924072265625, -0.08003616333007812, -0.06766510009765625, -0.055294036865234375, -0.0429229736328125, -0.030551910400390625, -0.01818084716796875, -0.005809783935546875, 0.006561279296875, 0.018932342529296875, 0.03130340576171875, 0.043674468994140625, 0.0560455322265625, 0.06841659545898438, 0.08078765869140625, 0.09315872192382812, 0.10552978515625, 0.11790084838867188, 0.13027191162109375, 0.14264297485351562, 0.1550140380859375, 0.16738510131835938, 0.17975616455078125, 0.19212722778320312, 0.204498291015625, 0.21686935424804688, 0.22924041748046875, 0.24161148071289062, 0.2539825439453125, 0.2663536071777344, 0.27872467041015625, 0.2910957336425781, 0.303466796875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 8.0, 4.0, 14.0, 16.0, 35.0, 44.0, 55.0, 83.0, 100.0, 151.0, 125.0, 98.0, 71.0, 54.0, 27.0, 32.0, 25.0, 13.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.26173210144043e-05, -4.119612276554108e-05, -3.9774924516677856e-05, -3.8353726267814636e-05, -3.6932528018951416e-05, -3.5511329770088196e-05, -3.4090131521224976e-05, -3.2668933272361755e-05, -3.1247735023498535e-05, -2.9826536774635315e-05, -2.8405338525772095e-05, -2.6984140276908875e-05, -2.5562942028045654e-05, -2.4141743779182434e-05, -2.2720545530319214e-05, -2.1299347281455994e-05, -1.9878149032592773e-05, -1.8456950783729553e-05, -1.7035752534866333e-05, -1.5614554286003113e-05, -1.4193356037139893e-05, -1.2772157788276672e-05, -1.1350959539413452e-05, -9.929761290550232e-06, -8.508563041687012e-06, -7.0873647928237915e-06, -5.666166543960571e-06, -4.244968295097351e-06, -2.823770046234131e-06, -1.4025717973709106e-06, 1.862645149230957e-08, 1.4398247003555298e-06, 2.86102294921875e-06, 4.28222119808197e-06, 5.7034194469451904e-06, 7.124617695808411e-06, 8.545815944671631e-06, 9.967014193534851e-06, 1.1388212442398071e-05, 1.2809410691261292e-05, 1.4230608940124512e-05, 1.5651807188987732e-05, 1.7073005437850952e-05, 1.8494203686714172e-05, 1.9915401935577393e-05, 2.1336600184440613e-05, 2.2757798433303833e-05, 2.4178996682167053e-05, 2.5600194931030273e-05, 2.7021393179893494e-05, 2.8442591428756714e-05, 2.9863789677619934e-05, 3.1284987926483154e-05, 3.2706186175346375e-05, 3.4127384424209595e-05, 3.5548582673072815e-05, 3.6969780921936035e-05, 3.8390979170799255e-05, 3.9812177419662476e-05, 4.1233375668525696e-05, 4.2654573917388916e-05, 4.4075772166252136e-05, 4.5496970415115356e-05, 4.691816866397858e-05, 4.83393669128418e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 10.0, 16.0, 30.0, 42.0, 71.0, 122.0, 200.0, 374.0, 702.0, 1389.0, 2992.0, 6553.0, 15226.0, 43135.0, 156662.0, 452992.0, 260727.0, 68940.0, 21995.0, 8649.0, 3839.0, 1827.0, 903.0, 486.0, 267.0, 157.0, 89.0, 51.0, 38.0, 24.0, 16.0, 6.0, 11.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1322021484375, -0.12724876403808594, -0.12229537963867188, -0.11734199523925781, -0.11238861083984375, -0.10743522644042969, -0.10248184204101562, -0.09752845764160156, -0.0925750732421875, -0.08762168884277344, -0.08266830444335938, -0.07771492004394531, -0.07276153564453125, -0.06780815124511719, -0.06285476684570312, -0.05790138244628906, -0.052947998046875, -0.04799461364746094, -0.043041229248046875, -0.03808784484863281, -0.03313446044921875, -0.028181076049804688, -0.023227691650390625, -0.018274307250976562, -0.0133209228515625, -0.008367538452148438, -0.003414154052734375, 0.0015392303466796875, 0.00649261474609375, 0.011445999145507812, 0.016399383544921875, 0.021352767944335938, 0.02630615234375, 0.03125953674316406, 0.036212921142578125, 0.04116630554199219, 0.04611968994140625, 0.05107307434082031, 0.056026458740234375, 0.06097984313964844, 0.0659332275390625, 0.07088661193847656, 0.07583999633789062, 0.08079338073730469, 0.08574676513671875, 0.09070014953613281, 0.09565353393554688, 0.10060691833496094, 0.105560302734375, 0.11051368713378906, 0.11546707153320312, 0.12042045593261719, 0.12537384033203125, 0.1303272247314453, 0.13528060913085938, 0.14023399353027344, 0.1451873779296875, 0.15014076232910156, 0.15509414672851562, 0.1600475311279297, 0.16500091552734375, 0.1699542999267578, 0.17490768432617188, 0.17986106872558594, 0.184814453125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 9.0, 12.0, 21.0, 18.0, 29.0, 34.0, 62.0, 70.0, 119.0, 125.0, 129.0, 100.0, 75.0, 52.0, 39.0, 16.0, 20.0, 8.0, 8.0, 11.0, 8.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2152099609375, -0.20682716369628906, -0.19844436645507812, -0.1900615692138672, -0.18167877197265625, -0.1732959747314453, -0.16491317749023438, -0.15653038024902344, -0.1481475830078125, -0.13976478576660156, -0.13138198852539062, -0.12299919128417969, -0.11461639404296875, -0.10623359680175781, -0.09785079956054688, -0.08946800231933594, -0.081085205078125, -0.07270240783691406, -0.06431961059570312, -0.05593681335449219, -0.04755401611328125, -0.03917121887207031, -0.030788421630859375, -0.022405624389648438, -0.0140228271484375, -0.0056400299072265625, 0.002742767333984375, 0.011125564575195312, 0.01950836181640625, 0.027891159057617188, 0.036273956298828125, 0.04465675354003906, 0.05303955078125, 0.06142234802246094, 0.06980514526367188, 0.07818794250488281, 0.08657073974609375, 0.09495353698730469, 0.10333633422851562, 0.11171913146972656, 0.1201019287109375, 0.12848472595214844, 0.13686752319335938, 0.1452503204345703, 0.15363311767578125, 0.1620159149169922, 0.17039871215820312, 0.17878150939941406, 0.187164306640625, 0.19554710388183594, 0.20392990112304688, 0.2123126983642578, 0.22069549560546875, 0.2290782928466797, 0.23746109008789062, 0.24584388732910156, 0.2542266845703125, 0.26260948181152344, 0.2709922790527344, 0.2793750762939453, 0.28775787353515625, 0.2961406707763672, 0.3045234680175781, 0.31290626525878906, 0.3212890625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 25.0, 59.0, 123.0, 211.0, 238.0, 173.0, 89.0, 40.0, 23.0, 12.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7351093292236328, -1.6219754219055176, -1.5088415145874023, -1.395707607269287, -1.2825736999511719, -1.1694397926330566, -1.0563058853149414, -0.9431719183921814, -0.8300380110740662, -0.7169041037559509, -0.6037701964378357, -0.49063625931739807, -0.37750235199928284, -0.2643684148788452, -0.15123450756072998, -0.038100600242614746, 0.07503330707550049, 0.18816721439361572, 0.30130112171173096, 0.4144350588321686, 0.5275689363479614, 0.6407029032707214, 0.7538368105888367, 0.8669707179069519, 0.9801046252250671, 1.0932385921478271, 1.2063724994659424, 1.3195064067840576, 1.4326403141021729, 1.545774221420288, 1.6589081287384033, 1.7720420360565186, 1.8851759433746338, 1.998309850692749, 2.1114437580108643, 2.2245776653289795, 2.3377115726470947, 2.45084547996521, 2.563979387283325, 2.6771132946014404, 2.7902472019195557, 2.903381109237671, 3.016515016555786, 3.1296489238739014, 3.2427828311920166, 3.355916738510132, 3.469050645828247, 3.5821845531463623, 3.6953186988830566, 3.808452606201172, 3.921586513519287, 4.034720420837402, 4.147854328155518, 4.260988235473633, 4.374122142791748, 4.487256050109863, 4.6003899574279785, 4.713523864746094, 4.826657772064209, 4.939791679382324, 5.0529255867004395, 5.166059494018555, 5.27919340133667, 5.392327308654785, 5.5054612159729]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 5.0, 2.0, 1.0, 9.0, 9.0, 7.0, 9.0, 16.0, 15.0, 10.0, 22.0, 28.0, 22.0, 19.0, 27.0, 36.0, 40.0, 35.0, 36.0, 34.0, 38.0, 50.0, 45.0, 32.0, 43.0, 35.0, 31.0, 43.0, 32.0, 36.0, 28.0, 29.0, 20.0, 22.0, 20.0, 15.0, 12.0, 18.0, 14.0, 15.0, 12.0, 12.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4356026649475098, -1.3884177207946777, -1.3412328958511353, -1.2940479516983032, -1.2468631267547607, -1.1996781826019287, -1.1524933576583862, -1.1053084135055542, -1.0581235885620117, -1.0109386444091797, -0.9637538194656372, -0.91656893491745, -0.8693840503692627, -0.8221991658210754, -0.7750142812728882, -0.7278293371200562, -0.6806444525718689, -0.6334595680236816, -0.5862746834754944, -0.5390897989273071, -0.4919049143791199, -0.4447200298309326, -0.397535115480423, -0.3503502309322357, -0.30316534638404846, -0.2559804618358612, -0.20879557728767395, -0.1616106778383255, -0.11442579329013824, -0.06724090874195099, -0.02005600929260254, 0.027128875255584717, 0.07431375980377197, 0.12149864435195923, 0.16868352890014648, 0.21586842834949493, 0.263053297996521, 0.31023818254470825, 0.3574230968952179, 0.40460798144340515, 0.4517928659915924, 0.49897775053977966, 0.5461626648902893, 0.5933475494384766, 0.6405324339866638, 0.6877173185348511, 0.7349022030830383, 0.7820870876312256, 0.8292719721794128, 0.8764568567276001, 0.9236417412757874, 0.9708266258239746, 1.0180115699768066, 1.0651963949203491, 1.1123813390731812, 1.1595661640167236, 1.2067511081695557, 1.2539360523223877, 1.3011208772659302, 1.3483058214187622, 1.3954906463623047, 1.4426755905151367, 1.4898604154586792, 1.5370453596115112, 1.5842301845550537]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 8.0, 21.0, 26.0, 57.0, 68.0, 116.0, 153.0, 229.0, 369.0, 551.0, 906.0, 1447.0, 2678.0, 4960.0, 9662.0, 21174.0, 55627.0, 189584.0, 776810.0, 1990659.0, 834096.0, 205265.0, 56916.0, 20958.0, 9728.0, 5041.0, 2747.0, 1596.0, 1000.0, 604.0, 409.0, 260.0, 172.0, 125.0, 80.0, 54.0, 45.0, 25.0, 18.0, 12.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1517333984375, -0.14641380310058594, -0.14109420776367188, -0.1357746124267578, -0.13045501708984375, -0.1251354217529297, -0.11981582641601562, -0.11449623107910156, -0.1091766357421875, -0.10385704040527344, -0.09853744506835938, -0.09321784973144531, -0.08789825439453125, -0.08257865905761719, -0.07725906372070312, -0.07193946838378906, -0.066619873046875, -0.06130027770996094, -0.055980682373046875, -0.05066108703613281, -0.04534149169921875, -0.04002189636230469, -0.034702301025390625, -0.029382705688476562, -0.0240631103515625, -0.018743515014648438, -0.013423919677734375, -0.008104324340820312, -0.00278472900390625, 0.0025348663330078125, 0.007854461669921875, 0.013174057006835938, 0.01849365234375, 0.023813247680664062, 0.029132843017578125, 0.03445243835449219, 0.03977203369140625, 0.04509162902832031, 0.050411224365234375, 0.05573081970214844, 0.0610504150390625, 0.06637001037597656, 0.07168960571289062, 0.07700920104980469, 0.08232879638671875, 0.08764839172363281, 0.09296798706054688, 0.09828758239746094, 0.103607177734375, 0.10892677307128906, 0.11424636840820312, 0.11956596374511719, 0.12488555908203125, 0.1302051544189453, 0.13552474975585938, 0.14084434509277344, 0.1461639404296875, 0.15148353576660156, 0.15680313110351562, 0.1621227264404297, 0.16744232177734375, 0.1727619171142578, 0.17808151245117188, 0.18340110778808594, 0.188720703125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 3.0, 8.0, 7.0, 12.0, 21.0, 19.0, 17.0, 26.0, 34.0, 41.0, 57.0, 60.0, 51.0, 63.0, 64.0, 54.0, 56.0, 71.0, 75.0, 47.0, 43.0, 45.0, 26.0, 28.0, 17.0, 10.0, 8.0, 9.0, 10.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2286376953125, -0.2198925018310547, -0.21114730834960938, -0.20240211486816406, -0.19365692138671875, -0.18491172790527344, -0.17616653442382812, -0.1674213409423828, -0.1586761474609375, -0.1499309539794922, -0.14118576049804688, -0.13244056701660156, -0.12369537353515625, -0.11495018005371094, -0.10620498657226562, -0.09745979309082031, -0.088714599609375, -0.07996940612792969, -0.07122421264648438, -0.06247901916503906, -0.05373382568359375, -0.04498863220214844, -0.036243438720703125, -0.027498245239257812, -0.0187530517578125, -0.010007858276367188, -0.001262664794921875, 0.0074825286865234375, 0.01622772216796875, 0.024972915649414062, 0.033718109130859375, 0.04246330261230469, 0.05120849609375, 0.05995368957519531, 0.06869888305664062, 0.07744407653808594, 0.08618927001953125, 0.09493446350097656, 0.10367965698242188, 0.11242485046386719, 0.1211700439453125, 0.1299152374267578, 0.13866043090820312, 0.14740562438964844, 0.15615081787109375, 0.16489601135253906, 0.17364120483398438, 0.1823863983154297, 0.191131591796875, 0.1998767852783203, 0.20862197875976562, 0.21736717224121094, 0.22611236572265625, 0.23485755920410156, 0.24360275268554688, 0.2523479461669922, 0.2610931396484375, 0.2698383331298828, 0.2785835266113281, 0.28732872009277344, 0.29607391357421875, 0.30481910705566406, 0.3135643005371094, 0.3223094940185547, 0.3310546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 5.0, 8.0, 17.0, 23.0, 15.0, 29.0, 46.0, 61.0, 61.0, 105.0, 128.0, 180.0, 254.0, 430.0, 728.0, 1282.0, 2816.0, 7903.0, 25682.0, 113000.0, 1089765.0, 2682601.0, 208843.0, 40709.0, 11287.0, 4045.0, 1795.0, 878.0, 506.0, 291.0, 210.0, 136.0, 111.0, 76.0, 57.0, 55.0, 43.0, 29.0, 11.0, 20.0, 15.0, 9.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44921875, -0.43480682373046875, -0.4203948974609375, -0.40598297119140625, -0.391571044921875, -0.37715911865234375, -0.3627471923828125, -0.34833526611328125, -0.33392333984375, -0.31951141357421875, -0.3050994873046875, -0.29068756103515625, -0.276275634765625, -0.26186370849609375, -0.2474517822265625, -0.23303985595703125, -0.2186279296875, -0.20421600341796875, -0.1898040771484375, -0.17539215087890625, -0.160980224609375, -0.14656829833984375, -0.1321563720703125, -0.11774444580078125, -0.10333251953125, -0.08892059326171875, -0.0745086669921875, -0.06009674072265625, -0.045684814453125, -0.03127288818359375, -0.0168609619140625, -0.00244903564453125, 0.011962890625, 0.02637481689453125, 0.0407867431640625, 0.05519866943359375, 0.069610595703125, 0.08402252197265625, 0.0984344482421875, 0.11284637451171875, 0.12725830078125, 0.14167022705078125, 0.1560821533203125, 0.17049407958984375, 0.184906005859375, 0.19931793212890625, 0.2137298583984375, 0.22814178466796875, 0.2425537109375, 0.25696563720703125, 0.2713775634765625, 0.28578948974609375, 0.300201416015625, 0.31461334228515625, 0.3290252685546875, 0.34343719482421875, 0.35784912109375, 0.37226104736328125, 0.3866729736328125, 0.40108489990234375, 0.415496826171875, 0.42990875244140625, 0.4443206787109375, 0.45873260498046875, 0.47314453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 10.0, 6.0, 11.0, 20.0, 44.0, 47.0, 56.0, 61.0, 104.0, 182.0, 342.0, 701.0, 1064.0, 631.0, 323.0, 174.0, 83.0, 69.0, 45.0, 31.0, 21.0, 12.0, 8.0, 6.0, 4.0, 6.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.297119140625, -0.2832298278808594, -0.26934051513671875, -0.2554512023925781, -0.2415618896484375, -0.22767257690429688, -0.21378326416015625, -0.19989395141601562, -0.186004638671875, -0.17211532592773438, -0.15822601318359375, -0.14433670043945312, -0.1304473876953125, -0.11655807495117188, -0.10266876220703125, -0.08877944946289062, -0.07489013671875, -0.061000823974609375, -0.04711151123046875, -0.033222198486328125, -0.0193328857421875, -0.005443572998046875, 0.00844573974609375, 0.022335052490234375, 0.036224365234375, 0.050113677978515625, 0.06400299072265625, 0.07789230346679688, 0.0917816162109375, 0.10567092895507812, 0.11956024169921875, 0.13344955444335938, 0.1473388671875, 0.16122817993164062, 0.17511749267578125, 0.18900680541992188, 0.2028961181640625, 0.21678543090820312, 0.23067474365234375, 0.24456405639648438, 0.258453369140625, 0.2723426818847656, 0.28623199462890625, 0.3001213073730469, 0.3140106201171875, 0.3278999328613281, 0.34178924560546875, 0.3556785583496094, 0.36956787109375, 0.3834571838378906, 0.39734649658203125, 0.4112358093261719, 0.4251251220703125, 0.4390144348144531, 0.45290374755859375, 0.4667930603027344, 0.480682373046875, 0.4945716857910156, 0.5084609985351562, 0.5223503112792969, 0.5362396240234375, 0.5501289367675781, 0.5640182495117188, 0.5779075622558594, 0.591796875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 1.0, 11.0, 22.0, 29.0, 63.0, 105.0, 154.0, 170.0, 167.0, 110.0, 77.0, 47.0, 19.0, 9.0, 13.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3828850984573364, -1.3085662126541138, -1.2342473268508911, -1.1599284410476685, -1.0856096744537354, -1.0112907886505127, -0.93697190284729, -0.8626530170440674, -0.7883341312408447, -0.7140152454376221, -0.6396963596343994, -0.5653775334358215, -0.4910586476325989, -0.4167397618293762, -0.34242090582847595, -0.2681020498275757, -0.19378316402435303, -0.11946429312229156, -0.0451454222202301, 0.02917344868183136, 0.10349231958389282, 0.17781120538711548, 0.25213006138801575, 0.326448917388916, 0.40076780319213867, 0.47508668899536133, 0.549405574798584, 0.6237244009971619, 0.6980432868003845, 0.7723621726036072, 0.8466809988021851, 0.9209998846054077, 0.9953186511993408, 1.0696375370025635, 1.1439564228057861, 1.2182753086090088, 1.2925941944122314, 1.366913080215454, 1.4412318468093872, 1.5155507326126099, 1.5898696184158325, 1.6641885042190552, 1.7385073900222778, 1.8128262758255005, 1.8871450424194336, 1.9614639282226562, 2.035782814025879, 2.1101016998291016, 2.184420585632324, 2.258739471435547, 2.3330583572387695, 2.407377243041992, 2.481696128845215, 2.5560150146484375, 2.63033390045166, 2.704652786254883, 2.7789716720581055, 2.853290557861328, 2.927609443664551, 3.0019283294677734, 3.076247215270996, 3.1505661010742188, 3.2248849868774414, 3.299203872680664, 3.3735225200653076]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 12.0, 11.0, 15.0, 18.0, 24.0, 22.0, 23.0, 16.0, 36.0, 29.0, 34.0, 29.0, 35.0, 43.0, 34.0, 47.0, 36.0, 43.0, 44.0, 38.0, 38.0, 35.0, 45.0, 34.0, 37.0, 33.0, 23.0, 28.0, 19.0, 14.0, 13.0, 6.0, 10.0, 10.0, 13.0, 10.0, 10.0, 5.0, 3.0, 5.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.0596855878829956, -1.0278637409210205, -0.9960417747497559, -0.964219868183136, -0.9323979616165161, -0.9005760550498962, -0.8687541484832764, -0.8369322419166565, -0.8051103353500366, -0.7732884287834167, -0.7414665222167969, -0.709644615650177, -0.6778227090835571, -0.6460008025169373, -0.6141788959503174, -0.5823569893836975, -0.5505350828170776, -0.5187131762504578, -0.4868912696838379, -0.455069363117218, -0.42324745655059814, -0.39142554998397827, -0.3596036434173584, -0.3277817368507385, -0.29595983028411865, -0.2641379237174988, -0.2323160171508789, -0.20049411058425903, -0.16867220401763916, -0.1368502974510193, -0.10502839088439941, -0.07320648431777954, -0.04138463735580444, -0.00956273078918457, 0.022259175777435303, 0.054081082344055176, 0.08590298891067505, 0.11772489547729492, 0.1495468020439148, 0.18136870861053467, 0.21319061517715454, 0.24501252174377441, 0.2768344283103943, 0.30865633487701416, 0.34047824144363403, 0.3723001480102539, 0.4041220545768738, 0.43594396114349365, 0.4677658677101135, 0.4995877742767334, 0.5314096808433533, 0.5632315874099731, 0.595053493976593, 0.6268754005432129, 0.6586973071098328, 0.6905192136764526, 0.7223411202430725, 0.7541630268096924, 0.7859849333763123, 0.8178068399429321, 0.849628746509552, 0.8814506530761719, 0.9132725596427917, 0.9450944662094116, 0.9769163727760315]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 9.0, 10.0, 20.0, 22.0, 37.0, 60.0, 69.0, 130.0, 232.0, 342.0, 573.0, 911.0, 1508.0, 2697.0, 4770.0, 8714.0, 16681.0, 31905.0, 63591.0, 134616.0, 267682.0, 258235.0, 128713.0, 60871.0, 30460.0, 15942.0, 8435.0, 4674.0, 2616.0, 1580.0, 921.0, 560.0, 341.0, 210.0, 140.0, 90.0, 53.0, 53.0, 28.0, 14.0, 15.0, 6.0, 8.0, 9.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.255126953125, -0.2471466064453125, -0.239166259765625, -0.2311859130859375, -0.22320556640625, -0.2152252197265625, -0.207244873046875, -0.1992645263671875, -0.1912841796875, -0.1833038330078125, -0.175323486328125, -0.1673431396484375, -0.15936279296875, -0.1513824462890625, -0.143402099609375, -0.1354217529296875, -0.12744140625, -0.1194610595703125, -0.111480712890625, -0.1035003662109375, -0.09552001953125, -0.0875396728515625, -0.079559326171875, -0.0715789794921875, -0.0635986328125, -0.0556182861328125, -0.047637939453125, -0.0396575927734375, -0.03167724609375, -0.0236968994140625, -0.015716552734375, -0.0077362060546875, 0.000244140625, 0.0082244873046875, 0.016204833984375, 0.0241851806640625, 0.03216552734375, 0.0401458740234375, 0.048126220703125, 0.0561065673828125, 0.0640869140625, 0.0720672607421875, 0.080047607421875, 0.0880279541015625, 0.09600830078125, 0.1039886474609375, 0.111968994140625, 0.1199493408203125, 0.1279296875, 0.1359100341796875, 0.143890380859375, 0.1518707275390625, 0.15985107421875, 0.1678314208984375, 0.175811767578125, 0.1837921142578125, 0.1917724609375, 0.1997528076171875, 0.207733154296875, 0.2157135009765625, 0.22369384765625, 0.2316741943359375, 0.239654541015625, 0.2476348876953125, 0.255615234375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 9.0, 9.0, 15.0, 17.0, 26.0, 25.0, 24.0, 35.0, 38.0, 48.0, 60.0, 62.0, 72.0, 58.0, 62.0, 57.0, 65.0, 65.0, 52.0, 47.0, 37.0, 32.0, 20.0, 14.0, 15.0, 8.0, 6.0, 8.0, 4.0, 7.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27001953125, -0.2610015869140625, -0.251983642578125, -0.2429656982421875, -0.23394775390625, -0.2249298095703125, -0.215911865234375, -0.2068939208984375, -0.1978759765625, -0.1888580322265625, -0.179840087890625, -0.1708221435546875, -0.16180419921875, -0.1527862548828125, -0.143768310546875, -0.1347503662109375, -0.125732421875, -0.1167144775390625, -0.107696533203125, -0.0986785888671875, -0.08966064453125, -0.0806427001953125, -0.071624755859375, -0.0626068115234375, -0.0535888671875, -0.0445709228515625, -0.035552978515625, -0.0265350341796875, -0.01751708984375, -0.0084991455078125, 0.000518798828125, 0.0095367431640625, 0.0185546875, 0.0275726318359375, 0.036590576171875, 0.0456085205078125, 0.05462646484375, 0.0636444091796875, 0.072662353515625, 0.0816802978515625, 0.0906982421875, 0.0997161865234375, 0.108734130859375, 0.1177520751953125, 0.12677001953125, 0.1357879638671875, 0.144805908203125, 0.1538238525390625, 0.162841796875, 0.1718597412109375, 0.180877685546875, 0.1898956298828125, 0.19891357421875, 0.2079315185546875, 0.216949462890625, 0.2259674072265625, 0.2349853515625, 0.2440032958984375, 0.253021240234375, 0.2620391845703125, 0.27105712890625, 0.2800750732421875, 0.289093017578125, 0.2981109619140625, 0.30712890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 7.0, 10.0, 10.0, 23.0, 35.0, 55.0, 56.0, 97.0, 193.0, 274.0, 450.0, 751.0, 1258.0, 2615.0, 4758.0, 10047.0, 21657.0, 51522.0, 133498.0, 360966.0, 286331.0, 99872.0, 39708.0, 17497.0, 7965.0, 4086.0, 2008.0, 1153.0, 709.0, 348.0, 202.0, 130.0, 96.0, 49.0, 34.0, 23.0, 17.0, 12.0, 9.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.40771484375, -0.3953056335449219, -0.38289642333984375, -0.3704872131347656, -0.3580780029296875, -0.3456687927246094, -0.33325958251953125, -0.3208503723144531, -0.308441162109375, -0.2960319519042969, -0.28362274169921875, -0.2712135314941406, -0.2588043212890625, -0.24639511108398438, -0.23398590087890625, -0.22157669067382812, -0.20916748046875, -0.19675827026367188, -0.18434906005859375, -0.17193984985351562, -0.1595306396484375, -0.14712142944335938, -0.13471221923828125, -0.12230300903320312, -0.109893798828125, -0.09748458862304688, -0.08507537841796875, -0.07266616821289062, -0.0602569580078125, -0.047847747802734375, -0.03543853759765625, -0.023029327392578125, -0.0106201171875, 0.001789093017578125, 0.01419830322265625, 0.026607513427734375, 0.0390167236328125, 0.051425933837890625, 0.06383514404296875, 0.07624435424804688, 0.088653564453125, 0.10106277465820312, 0.11347198486328125, 0.12588119506835938, 0.1382904052734375, 0.15069961547851562, 0.16310882568359375, 0.17551803588867188, 0.18792724609375, 0.20033645629882812, 0.21274566650390625, 0.22515487670898438, 0.2375640869140625, 0.24997329711914062, 0.26238250732421875, 0.2747917175292969, 0.287200927734375, 0.2996101379394531, 0.31201934814453125, 0.3244285583496094, 0.3368377685546875, 0.3492469787597656, 0.36165618896484375, 0.3740653991699219, 0.386474609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 9.0, 11.0, 9.0, 10.0, 12.0, 17.0, 20.0, 25.0, 29.0, 29.0, 26.0, 45.0, 45.0, 63.0, 48.0, 40.0, 57.0, 43.0, 45.0, 40.0, 53.0, 48.0, 45.0, 30.0, 33.0, 30.0, 21.0, 15.0, 20.0, 17.0, 13.0, 12.0, 9.0, 7.0, 3.0, 7.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7060546875, -0.6832275390625, -0.660400390625, -0.6375732421875, -0.61474609375, -0.5919189453125, -0.569091796875, -0.5462646484375, -0.5234375, -0.5006103515625, -0.477783203125, -0.4549560546875, -0.43212890625, -0.4093017578125, -0.386474609375, -0.3636474609375, -0.3408203125, -0.3179931640625, -0.295166015625, -0.2723388671875, -0.24951171875, -0.2266845703125, -0.203857421875, -0.1810302734375, -0.158203125, -0.1353759765625, -0.112548828125, -0.0897216796875, -0.06689453125, -0.0440673828125, -0.021240234375, 0.0015869140625, 0.0244140625, 0.0472412109375, 0.070068359375, 0.0928955078125, 0.11572265625, 0.1385498046875, 0.161376953125, 0.1842041015625, 0.20703125, 0.2298583984375, 0.252685546875, 0.2755126953125, 0.29833984375, 0.3211669921875, 0.343994140625, 0.3668212890625, 0.3896484375, 0.4124755859375, 0.435302734375, 0.4581298828125, 0.48095703125, 0.5037841796875, 0.526611328125, 0.5494384765625, 0.572265625, 0.5950927734375, 0.617919921875, 0.6407470703125, 0.66357421875, 0.6864013671875, 0.709228515625, 0.7320556640625, 0.7548828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 4.0, 1.0, 4.0, 16.0, 14.0, 22.0, 28.0, 55.0, 78.0, 96.0, 117.0, 171.0, 260.0, 368.0, 596.0, 1004.0, 1759.0, 3141.0, 6272.0, 13817.0, 36180.0, 109371.0, 406512.0, 326032.0, 88640.0, 29861.0, 11742.0, 5474.0, 2717.0, 1522.0, 926.0, 557.0, 355.0, 246.0, 182.0, 116.0, 98.0, 58.0, 39.0, 31.0, 20.0, 14.0, 12.0, 9.0, 6.0, 3.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2069091796875, -0.20021438598632812, -0.19351959228515625, -0.18682479858398438, -0.1801300048828125, -0.17343521118164062, -0.16674041748046875, -0.16004562377929688, -0.153350830078125, -0.14665603637695312, -0.13996124267578125, -0.13326644897460938, -0.1265716552734375, -0.11987686157226562, -0.11318206787109375, -0.10648727416992188, -0.09979248046875, -0.09309768676757812, -0.08640289306640625, -0.07970809936523438, -0.0730133056640625, -0.06631851196289062, -0.05962371826171875, -0.052928924560546875, -0.046234130859375, -0.039539337158203125, -0.03284454345703125, -0.026149749755859375, -0.0194549560546875, -0.012760162353515625, -0.00606536865234375, 0.000629425048828125, 0.00732421875, 0.014019012451171875, 0.02071380615234375, 0.027408599853515625, 0.0341033935546875, 0.040798187255859375, 0.04749298095703125, 0.054187774658203125, 0.060882568359375, 0.06757736206054688, 0.07427215576171875, 0.08096694946289062, 0.0876617431640625, 0.09435653686523438, 0.10105133056640625, 0.10774612426757812, 0.11444091796875, 0.12113571166992188, 0.12783050537109375, 0.13452529907226562, 0.1412200927734375, 0.14791488647460938, 0.15460968017578125, 0.16130447387695312, 0.167999267578125, 0.17469406127929688, 0.18138885498046875, 0.18808364868164062, 0.1947784423828125, 0.20147323608398438, 0.20816802978515625, 0.21486282348632812, 0.2215576171875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 7.0, 4.0, 7.0, 7.0, 21.0, 18.0, 24.0, 31.0, 35.0, 39.0, 49.0, 83.0, 83.0, 113.0, 83.0, 92.0, 67.0, 51.0, 30.0, 20.0, 22.0, 26.0, 16.0, 12.0, 9.0, 9.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.892183303833008e-05, -3.7653371691703796e-05, -3.6384910345077515e-05, -3.511644899845123e-05, -3.384798765182495e-05, -3.257952630519867e-05, -3.131106495857239e-05, -3.0042603611946106e-05, -2.8774142265319824e-05, -2.7505680918693542e-05, -2.623721957206726e-05, -2.496875822544098e-05, -2.3700296878814697e-05, -2.2431835532188416e-05, -2.1163374185562134e-05, -1.9894912838935852e-05, -1.862645149230957e-05, -1.735799014568329e-05, -1.6089528799057007e-05, -1.4821067452430725e-05, -1.3552606105804443e-05, -1.2284144759178162e-05, -1.101568341255188e-05, -9.747222065925598e-06, -8.478760719299316e-06, -7.210299372673035e-06, -5.941838026046753e-06, -4.673376679420471e-06, -3.4049153327941895e-06, -2.1364539861679077e-06, -8.67992639541626e-07, 4.0046870708465576e-07, 1.6689300537109375e-06, 2.9373914003372192e-06, 4.205852746963501e-06, 5.474314093589783e-06, 6.7427754402160645e-06, 8.011236786842346e-06, 9.279698133468628e-06, 1.054815948009491e-05, 1.1816620826721191e-05, 1.3085082173347473e-05, 1.4353543519973755e-05, 1.5622004866600037e-05, 1.689046621322632e-05, 1.81589275598526e-05, 1.9427388906478882e-05, 2.0695850253105164e-05, 2.1964311599731445e-05, 2.3232772946357727e-05, 2.450123429298401e-05, 2.576969563961029e-05, 2.7038156986236572e-05, 2.8306618332862854e-05, 2.9575079679489136e-05, 3.084354102611542e-05, 3.21120023727417e-05, 3.338046371936798e-05, 3.464892506599426e-05, 3.5917386412620544e-05, 3.7185847759246826e-05, 3.845430910587311e-05, 3.972277045249939e-05, 4.099123179912567e-05, 4.225969314575195e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 2.0, 2.0, 5.0, 8.0, 14.0, 19.0, 26.0, 45.0, 67.0, 124.0, 141.0, 280.0, 451.0, 753.0, 1388.0, 2472.0, 5001.0, 9705.0, 20621.0, 50976.0, 149548.0, 419668.0, 251261.0, 78778.0, 30002.0, 13225.0, 6426.0, 3261.0, 1773.0, 1005.0, 582.0, 351.0, 198.0, 129.0, 69.0, 68.0, 40.0, 29.0, 16.0, 13.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1748046875, -0.16929244995117188, -0.16378021240234375, -0.15826797485351562, -0.1527557373046875, -0.14724349975585938, -0.14173126220703125, -0.13621902465820312, -0.130706787109375, -0.12519454956054688, -0.11968231201171875, -0.11417007446289062, -0.1086578369140625, -0.10314559936523438, -0.09763336181640625, -0.09212112426757812, -0.08660888671875, -0.08109664916992188, -0.07558441162109375, -0.07007217407226562, -0.0645599365234375, -0.059047698974609375, -0.05353546142578125, -0.048023223876953125, -0.042510986328125, -0.036998748779296875, -0.03148651123046875, -0.025974273681640625, -0.0204620361328125, -0.014949798583984375, -0.00943756103515625, -0.003925323486328125, 0.0015869140625, 0.007099151611328125, 0.01261138916015625, 0.018123626708984375, 0.0236358642578125, 0.029148101806640625, 0.03466033935546875, 0.040172576904296875, 0.045684814453125, 0.051197052001953125, 0.05670928955078125, 0.062221527099609375, 0.0677337646484375, 0.07324600219726562, 0.07875823974609375, 0.08427047729492188, 0.08978271484375, 0.09529495239257812, 0.10080718994140625, 0.10631942749023438, 0.1118316650390625, 0.11734390258789062, 0.12285614013671875, 0.12836837768554688, 0.133880615234375, 0.13939285278320312, 0.14490509033203125, 0.15041732788085938, 0.1559295654296875, 0.16144180297851562, 0.16695404052734375, 0.17246627807617188, 0.177978515625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 4.0, 0.0, 6.0, 5.0, 3.0, 6.0, 3.0, 6.0, 11.0, 20.0, 18.0, 14.0, 23.0, 21.0, 26.0, 42.0, 49.0, 60.0, 88.0, 76.0, 93.0, 79.0, 61.0, 57.0, 53.0, 32.0, 28.0, 22.0, 21.0, 11.0, 17.0, 6.0, 8.0, 15.0, 10.0, 4.0, 8.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1468505859375, -0.14079856872558594, -0.13474655151367188, -0.1286945343017578, -0.12264251708984375, -0.11659049987792969, -0.11053848266601562, -0.10448646545410156, -0.0984344482421875, -0.09238243103027344, -0.08633041381835938, -0.08027839660644531, -0.07422637939453125, -0.06817436218261719, -0.062122344970703125, -0.05607032775878906, -0.050018310546875, -0.04396629333496094, -0.037914276123046875, -0.03186225891113281, -0.02581024169921875, -0.019758224487304688, -0.013706207275390625, -0.0076541900634765625, -0.0016021728515625, 0.0044498443603515625, 0.010501861572265625, 0.016553878784179688, 0.02260589599609375, 0.028657913208007812, 0.034709930419921875, 0.04076194763183594, 0.04681396484375, 0.05286598205566406, 0.058917999267578125, 0.06497001647949219, 0.07102203369140625, 0.07707405090332031, 0.08312606811523438, 0.08917808532714844, 0.0952301025390625, 0.10128211975097656, 0.10733413696289062, 0.11338615417480469, 0.11943817138671875, 0.1254901885986328, 0.13154220581054688, 0.13759422302246094, 0.143646240234375, 0.14969825744628906, 0.15575027465820312, 0.1618022918701172, 0.16785430908203125, 0.1739063262939453, 0.17995834350585938, 0.18601036071777344, 0.1920623779296875, 0.19811439514160156, 0.20416641235351562, 0.2102184295654297, 0.21627044677734375, 0.2223224639892578, 0.22837448120117188, 0.23442649841308594, 0.240478515625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 7.0, 79.0, 299.0, 430.0, 152.0, 35.0, 8.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-13.55536937713623, -13.305806159973145, -13.056242942810059, -12.806678771972656, -12.55711555480957, -12.307552337646484, -12.057989120483398, -11.808425903320312, -11.55886173248291, -11.309298515319824, -11.059735298156738, -10.810171127319336, -10.56060791015625, -10.311044692993164, -10.061481475830078, -9.811918258666992, -9.562355041503906, -9.31279182434082, -9.063228607177734, -8.813664436340332, -8.564101219177246, -8.31453800201416, -8.064974784851074, -7.81541109085083, -7.565847396850586, -7.3162841796875, -7.066720485687256, -6.81715726852417, -6.567593574523926, -6.31803035736084, -6.068467140197754, -5.81890344619751, -5.569340705871582, -5.319777488708496, -5.070213794708252, -4.820650577545166, -4.571086883544922, -4.321523666381836, -4.07196044921875, -3.822396755218506, -3.5728330612182617, -3.3232696056365967, -3.0737061500549316, -2.8241429328918457, -2.5745794773101807, -2.3250160217285156, -2.0754525661468506, -1.825889229774475, -1.5763258934020996, -1.3267624378204346, -1.077199101448059, -0.827635645866394, -0.5780722498893738, -0.3285088539123535, -0.07894539833068848, 0.170617938041687, 0.42018139362335205, 0.6697447896003723, 0.9193081855773926, 1.1688716411590576, 1.4184350967407227, 1.6679984331130981, 1.9175618886947632, 2.1671252250671387, 2.4166886806488037]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 6.0, 4.0, 9.0, 11.0, 11.0, 7.0, 16.0, 22.0, 20.0, 19.0, 22.0, 33.0, 21.0, 43.0, 35.0, 43.0, 39.0, 35.0, 44.0, 48.0, 35.0, 46.0, 32.0, 32.0, 30.0, 47.0, 39.0, 31.0, 37.0, 37.0, 22.0, 27.0, 19.0, 11.0, 14.0, 9.0, 6.0, 6.0, 11.0, 6.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3324038982391357, -1.2896915674209595, -1.2469793558120728, -1.2042670249938965, -1.1615548133850098, -1.1188424825668335, -1.0761301517486572, -1.0334179401397705, -0.9907056093215942, -0.9479933381080627, -0.9052810668945312, -0.862568736076355, -0.8198564648628235, -0.777144193649292, -0.7344318628311157, -0.6917195916175842, -0.6490073204040527, -0.6062950491905212, -0.5635827779769897, -0.5208704471588135, -0.478158175945282, -0.4354459047317505, -0.3927336037158966, -0.3500213027000427, -0.30730903148651123, -0.26459676027297974, -0.22188445925712585, -0.17917217314243317, -0.13645988702774048, -0.09374760091304779, -0.0510353147983551, -0.00832301378250122, 0.034389376640319824, 0.07710166275501251, 0.1198139488697052, 0.1625262349843979, 0.20523852109909058, 0.24795080721378326, 0.29066309332847595, 0.33337539434432983, 0.37608766555786133, 0.4187999367713928, 0.4615122377872467, 0.5042245388031006, 0.5469368100166321, 0.5896490812301636, 0.6323614120483398, 0.6750736832618713, 0.7177859544754028, 0.7604982256889343, 0.8032104969024658, 0.8459228277206421, 0.8886350989341736, 0.9313473701477051, 0.9740597009658813, 1.0167720317840576, 1.0594842433929443, 1.1021965742111206, 1.1449087858200073, 1.1876211166381836, 1.2303333282470703, 1.2730456590652466, 1.3157579898834229, 1.3584702014923096, 1.4011825323104858]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 10.0, 9.0, 11.0, 19.0, 20.0, 31.0, 56.0, 77.0, 117.0, 175.0, 279.0, 454.0, 766.0, 1539.0, 2891.0, 6490.0, 15356.0, 43958.0, 187192.0, 1598495.0, 2031862.0, 223300.0, 48815.0, 17303.0, 7369.0, 3539.0, 1714.0, 903.0, 546.0, 307.0, 179.0, 141.0, 106.0, 67.0, 69.0, 40.0, 24.0, 15.0, 15.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.328857421875, -0.318267822265625, -0.30767822265625, -0.297088623046875, -0.2864990234375, -0.275909423828125, -0.26531982421875, -0.254730224609375, -0.244140625, -0.233551025390625, -0.22296142578125, -0.212371826171875, -0.2017822265625, -0.191192626953125, -0.18060302734375, -0.170013427734375, -0.159423828125, -0.148834228515625, -0.13824462890625, -0.127655029296875, -0.1170654296875, -0.106475830078125, -0.09588623046875, -0.085296630859375, -0.07470703125, -0.064117431640625, -0.05352783203125, -0.042938232421875, -0.0323486328125, -0.021759033203125, -0.01116943359375, -0.000579833984375, 0.010009765625, 0.020599365234375, 0.03118896484375, 0.041778564453125, 0.0523681640625, 0.062957763671875, 0.07354736328125, 0.084136962890625, 0.0947265625, 0.105316162109375, 0.11590576171875, 0.126495361328125, 0.1370849609375, 0.147674560546875, 0.15826416015625, 0.168853759765625, 0.179443359375, 0.190032958984375, 0.20062255859375, 0.211212158203125, 0.2218017578125, 0.232391357421875, 0.24298095703125, 0.253570556640625, 0.26416015625, 0.274749755859375, 0.28533935546875, 0.295928955078125, 0.3065185546875, 0.317108154296875, 0.32769775390625, 0.338287353515625, 0.348876953125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 11.0, 27.0, 21.0, 28.0, 39.0, 26.0, 35.0, 45.0, 57.0, 61.0, 68.0, 62.0, 71.0, 65.0, 59.0, 64.0, 41.0, 40.0, 23.0, 35.0, 19.0, 30.0, 7.0, 19.0, 11.0, 7.0, 8.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267333984375, -0.25814056396484375, -0.2489471435546875, -0.23975372314453125, -0.230560302734375, -0.22136688232421875, -0.2121734619140625, -0.20298004150390625, -0.19378662109375, -0.18459320068359375, -0.1753997802734375, -0.16620635986328125, -0.157012939453125, -0.14781951904296875, -0.1386260986328125, -0.12943267822265625, -0.1202392578125, -0.11104583740234375, -0.1018524169921875, -0.09265899658203125, -0.083465576171875, -0.07427215576171875, -0.0650787353515625, -0.05588531494140625, -0.04669189453125, -0.03749847412109375, -0.0283050537109375, -0.01911163330078125, -0.009918212890625, -0.00072479248046875, 0.0084686279296875, 0.01766204833984375, 0.02685546875, 0.03604888916015625, 0.0452423095703125, 0.05443572998046875, 0.063629150390625, 0.07282257080078125, 0.0820159912109375, 0.09120941162109375, 0.10040283203125, 0.10959625244140625, 0.1187896728515625, 0.12798309326171875, 0.137176513671875, 0.14636993408203125, 0.1555633544921875, 0.16475677490234375, 0.1739501953125, 0.18314361572265625, 0.1923370361328125, 0.20153045654296875, 0.210723876953125, 0.21991729736328125, 0.2291107177734375, 0.23830413818359375, 0.24749755859375, 0.25669097900390625, 0.2658843994140625, 0.27507781982421875, 0.284271240234375, 0.29346466064453125, 0.3026580810546875, 0.31185150146484375, 0.321044921875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 7.0, 6.0, 10.0, 14.0, 19.0, 17.0, 27.0, 30.0, 49.0, 57.0, 78.0, 112.0, 138.0, 200.0, 322.0, 525.0, 948.0, 1897.0, 4494.0, 13226.0, 50761.0, 312210.0, 3191632.0, 520098.0, 70009.0, 16846.0, 5371.0, 2246.0, 1080.0, 603.0, 341.0, 238.0, 162.0, 123.0, 86.0, 57.0, 46.0, 43.0, 37.0, 36.0, 17.0, 18.0, 7.0, 11.0, 9.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.7041015625, -0.6837539672851562, -0.6634063720703125, -0.6430587768554688, -0.622711181640625, -0.6023635864257812, -0.5820159912109375, -0.5616683959960938, -0.54132080078125, -0.5209732055664062, -0.5006256103515625, -0.48027801513671875, -0.459930419921875, -0.43958282470703125, -0.4192352294921875, -0.39888763427734375, -0.3785400390625, -0.35819244384765625, -0.3378448486328125, -0.31749725341796875, -0.297149658203125, -0.27680206298828125, -0.2564544677734375, -0.23610687255859375, -0.21575927734375, -0.19541168212890625, -0.1750640869140625, -0.15471649169921875, -0.134368896484375, -0.11402130126953125, -0.0936737060546875, -0.07332611083984375, -0.052978515625, -0.03263092041015625, -0.0122833251953125, 0.00806427001953125, 0.028411865234375, 0.04875946044921875, 0.0691070556640625, 0.08945465087890625, 0.10980224609375, 0.13014984130859375, 0.1504974365234375, 0.17084503173828125, 0.191192626953125, 0.21154022216796875, 0.2318878173828125, 0.25223541259765625, 0.2725830078125, 0.29293060302734375, 0.3132781982421875, 0.33362579345703125, 0.353973388671875, 0.37432098388671875, 0.3946685791015625, 0.41501617431640625, 0.43536376953125, 0.45571136474609375, 0.4760589599609375, 0.49640655517578125, 0.516754150390625, 0.5371017456054688, 0.5574493408203125, 0.5777969360351562, 0.59814453125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 9.0, 11.0, 26.0, 35.0, 40.0, 50.0, 102.0, 173.0, 433.0, 1126.0, 1137.0, 449.0, 198.0, 109.0, 60.0, 40.0, 35.0, 18.0, 11.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.400390625, -0.376922607421875, -0.35345458984375, -0.329986572265625, -0.3065185546875, -0.283050537109375, -0.25958251953125, -0.236114501953125, -0.212646484375, -0.189178466796875, -0.16571044921875, -0.142242431640625, -0.1187744140625, -0.095306396484375, -0.07183837890625, -0.048370361328125, -0.02490234375, -0.001434326171875, 0.02203369140625, 0.045501708984375, 0.0689697265625, 0.092437744140625, 0.11590576171875, 0.139373779296875, 0.162841796875, 0.186309814453125, 0.20977783203125, 0.233245849609375, 0.2567138671875, 0.280181884765625, 0.30364990234375, 0.327117919921875, 0.3505859375, 0.374053955078125, 0.39752197265625, 0.420989990234375, 0.4444580078125, 0.467926025390625, 0.49139404296875, 0.514862060546875, 0.538330078125, 0.561798095703125, 0.58526611328125, 0.608734130859375, 0.6322021484375, 0.655670166015625, 0.67913818359375, 0.702606201171875, 0.72607421875, 0.749542236328125, 0.77301025390625, 0.796478271484375, 0.8199462890625, 0.843414306640625, 0.86688232421875, 0.890350341796875, 0.913818359375, 0.937286376953125, 0.96075439453125, 0.984222412109375, 1.0076904296875, 1.031158447265625, 1.05462646484375, 1.078094482421875, 1.1015625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 10.0, 8.0, 20.0, 33.0, 45.0, 64.0, 112.0, 121.0, 142.0, 118.0, 89.0, 87.0, 49.0, 35.0, 24.0, 14.0, 6.0, 9.0, 7.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.508502960205078, -3.4315292835235596, -3.354555368423462, -3.2775816917419434, -3.200608015060425, -3.123634099960327, -3.0466604232788086, -2.969686508178711, -2.8927128314971924, -2.815739154815674, -2.738765239715576, -2.6617915630340576, -2.584817886352539, -2.5078439712524414, -2.430870294570923, -2.3538966178894043, -2.2769227027893066, -2.199949026107788, -2.1229751110076904, -2.046001434326172, -1.9690276384353638, -1.8920538425445557, -1.815080165863037, -1.738106369972229, -1.6611328125, -1.584159016609192, -1.5071853399276733, -1.4302115440368652, -1.3532377481460571, -1.276263952255249, -1.1992902755737305, -1.1223164796829224, -1.0453428030014038, -0.9683690667152405, -0.8913952708244324, -0.814421534538269, -0.7374477386474609, -0.6604740023612976, -0.5835002660751343, -0.5065264701843262, -0.42955273389816284, -0.3525789678096771, -0.2756052017211914, -0.19863146543502808, -0.12165769934654236, -0.04468393325805664, 0.03228980302810669, 0.1092635989189148, 0.18623733520507812, 0.26321110129356384, 0.34018486738204956, 0.4171586036682129, 0.4941323697566986, 0.5711061358451843, 0.6480798721313477, 0.7250536680221558, 0.8020274043083191, 0.8790011405944824, 0.9559749364852905, 1.0329487323760986, 1.1099224090576172, 1.1868962049484253, 1.2638700008392334, 1.340843677520752, 1.41781747341156]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 12.0, 10.0, 18.0, 20.0, 17.0, 16.0, 26.0, 28.0, 24.0, 19.0, 30.0, 47.0, 42.0, 42.0, 30.0, 48.0, 40.0, 36.0, 33.0, 42.0, 39.0, 39.0, 39.0, 36.0, 30.0, 26.0, 18.0, 28.0, 20.0, 19.0, 15.0, 12.0, 15.0, 18.0, 13.0, 6.0, 8.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.2174007892608643, -1.176993727684021, -1.1365866661071777, -1.096179485321045, -1.0557724237442017, -1.0153653621673584, -0.9749583005905151, -0.9345512390136719, -0.8941441178321838, -0.8537370562553406, -0.8133299350738525, -0.7729228734970093, -0.732515811920166, -0.692108690738678, -0.6517016291618347, -0.6112945079803467, -0.5708874464035034, -0.5304803848266602, -0.4900732636451721, -0.44966620206832886, -0.4092591106891632, -0.36885201930999756, -0.3284449577331543, -0.28803786635398865, -0.247630774974823, -0.20722368359565735, -0.1668166071176529, -0.12640953063964844, -0.08600243926048279, -0.04559534788131714, -0.005188271403312683, 0.03521880507469177, 0.07562589645385742, 0.11603298038244247, 0.15644006431102753, 0.19684714078903198, 0.23725423216819763, 0.2776613235473633, 0.31806838512420654, 0.3584754765033722, 0.39888256788253784, 0.4392896592617035, 0.47969675064086914, 0.5201038122177124, 0.5605108737945557, 0.6009179949760437, 0.641325056552887, 0.681732177734375, 0.7221392393112183, 0.7625463008880615, 0.8029534220695496, 0.8433604836463928, 0.8837676048278809, 0.9241746664047241, 0.9645817279815674, 1.0049887895584106, 1.045395851135254, 1.0858029127120972, 1.1262099742889404, 1.1666171550750732, 1.2070242166519165, 1.2474312782287598, 1.287838339805603, 1.3282454013824463, 1.368652582168579]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 11.0, 11.0, 22.0, 33.0, 34.0, 62.0, 100.0, 144.0, 231.0, 356.0, 535.0, 916.0, 1348.0, 2443.0, 3947.0, 6913.0, 12489.0, 23227.0, 44054.0, 86818.0, 172402.0, 262994.0, 205336.0, 107474.0, 53845.0, 27793.0, 14854.0, 8268.0, 4712.0, 2823.0, 1647.0, 1001.0, 629.0, 389.0, 242.0, 158.0, 108.0, 63.0, 52.0, 28.0, 20.0, 12.0, 9.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252685546875, -0.24470138549804688, -0.23671722412109375, -0.22873306274414062, -0.2207489013671875, -0.21276473999023438, -0.20478057861328125, -0.19679641723632812, -0.188812255859375, -0.18082809448242188, -0.17284393310546875, -0.16485977172851562, -0.1568756103515625, -0.14889144897460938, -0.14090728759765625, -0.13292312622070312, -0.12493896484375, -0.11695480346679688, -0.10897064208984375, -0.10098648071289062, -0.0930023193359375, -0.08501815795898438, -0.07703399658203125, -0.06904983520507812, -0.061065673828125, -0.053081512451171875, -0.04509735107421875, -0.037113189697265625, -0.0291290283203125, -0.021144866943359375, -0.01316070556640625, -0.005176544189453125, 0.0028076171875, 0.010791778564453125, 0.01877593994140625, 0.026760101318359375, 0.0347442626953125, 0.042728424072265625, 0.05071258544921875, 0.058696746826171875, 0.066680908203125, 0.07466506958007812, 0.08264923095703125, 0.09063339233398438, 0.0986175537109375, 0.10660171508789062, 0.11458587646484375, 0.12257003784179688, 0.13055419921875, 0.13853836059570312, 0.14652252197265625, 0.15450668334960938, 0.1624908447265625, 0.17047500610351562, 0.17845916748046875, 0.18644332885742188, 0.194427490234375, 0.20241165161132812, 0.21039581298828125, 0.21837997436523438, 0.2263641357421875, 0.23434829711914062, 0.24233245849609375, 0.2503166198730469, 0.25830078125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 13.0, 10.0, 10.0, 14.0, 19.0, 29.0, 22.0, 35.0, 39.0, 40.0, 51.0, 50.0, 42.0, 57.0, 49.0, 46.0, 58.0, 58.0, 40.0, 35.0, 51.0, 41.0, 30.0, 32.0, 34.0, 23.0, 15.0, 16.0, 12.0, 9.0, 2.0, 5.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.250244140625, -0.24196624755859375, -0.2336883544921875, -0.22541046142578125, -0.217132568359375, -0.20885467529296875, -0.2005767822265625, -0.19229888916015625, -0.18402099609375, -0.17574310302734375, -0.1674652099609375, -0.15918731689453125, -0.150909423828125, -0.14263153076171875, -0.1343536376953125, -0.12607574462890625, -0.1177978515625, -0.10951995849609375, -0.1012420654296875, -0.09296417236328125, -0.084686279296875, -0.07640838623046875, -0.0681304931640625, -0.05985260009765625, -0.05157470703125, -0.04329681396484375, -0.0350189208984375, -0.02674102783203125, -0.018463134765625, -0.01018524169921875, -0.0019073486328125, 0.00637054443359375, 0.0146484375, 0.02292633056640625, 0.0312042236328125, 0.03948211669921875, 0.047760009765625, 0.05603790283203125, 0.0643157958984375, 0.07259368896484375, 0.08087158203125, 0.08914947509765625, 0.0974273681640625, 0.10570526123046875, 0.113983154296875, 0.12226104736328125, 0.1305389404296875, 0.13881683349609375, 0.1470947265625, 0.15537261962890625, 0.1636505126953125, 0.17192840576171875, 0.180206298828125, 0.18848419189453125, 0.1967620849609375, 0.20503997802734375, 0.21331787109375, 0.22159576416015625, 0.2298736572265625, 0.23815155029296875, 0.246429443359375, 0.25470733642578125, 0.2629852294921875, 0.27126312255859375, 0.279541015625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 11.0, 15.0, 16.0, 27.0, 31.0, 34.0, 79.0, 144.0, 183.0, 335.0, 473.0, 750.0, 1302.0, 2337.0, 4005.0, 7319.0, 14069.0, 27579.0, 58374.0, 129055.0, 262493.0, 273983.0, 140753.0, 62283.0, 29857.0, 14795.0, 8014.0, 4258.0, 2375.0, 1347.0, 813.0, 523.0, 330.0, 200.0, 121.0, 89.0, 48.0, 49.0, 28.0, 17.0, 12.0, 8.0, 8.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.299072265625, -0.2894401550292969, -0.27980804443359375, -0.2701759338378906, -0.2605438232421875, -0.2509117126464844, -0.24127960205078125, -0.23164749145507812, -0.222015380859375, -0.21238327026367188, -0.20275115966796875, -0.19311904907226562, -0.1834869384765625, -0.17385482788085938, -0.16422271728515625, -0.15459060668945312, -0.14495849609375, -0.13532638549804688, -0.12569427490234375, -0.11606216430664062, -0.1064300537109375, -0.09679794311523438, -0.08716583251953125, -0.07753372192382812, -0.067901611328125, -0.058269500732421875, -0.04863739013671875, -0.039005279541015625, -0.0293731689453125, -0.019741058349609375, -0.01010894775390625, -0.000476837158203125, 0.0091552734375, 0.018787384033203125, 0.02841949462890625, 0.038051605224609375, 0.0476837158203125, 0.057315826416015625, 0.06694793701171875, 0.07658004760742188, 0.086212158203125, 0.09584426879882812, 0.10547637939453125, 0.11510848999023438, 0.1247406005859375, 0.13437271118164062, 0.14400482177734375, 0.15363693237304688, 0.16326904296875, 0.17290115356445312, 0.18253326416015625, 0.19216537475585938, 0.2017974853515625, 0.21142959594726562, 0.22106170654296875, 0.23069381713867188, 0.240325927734375, 0.24995803833007812, 0.25959014892578125, 0.2692222595214844, 0.2788543701171875, 0.2884864807128906, 0.29811859130859375, 0.3077507019042969, 0.3173828125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 0.0, 4.0, 4.0, 7.0, 14.0, 14.0, 14.0, 22.0, 31.0, 44.0, 36.0, 42.0, 58.0, 44.0, 59.0, 67.0, 54.0, 50.0, 55.0, 59.0, 53.0, 51.0, 34.0, 35.0, 27.0, 25.0, 26.0, 11.0, 9.0, 14.0, 13.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9677734375, -0.9412460327148438, -0.9147186279296875, -0.8881912231445312, -0.861663818359375, -0.8351364135742188, -0.8086090087890625, -0.7820816040039062, -0.75555419921875, -0.7290267944335938, -0.7024993896484375, -0.6759719848632812, -0.649444580078125, -0.6229171752929688, -0.5963897705078125, -0.5698623657226562, -0.5433349609375, -0.5168075561523438, -0.4902801513671875, -0.46375274658203125, -0.437225341796875, -0.41069793701171875, -0.3841705322265625, -0.35764312744140625, -0.33111572265625, -0.30458831787109375, -0.2780609130859375, -0.25153350830078125, -0.225006103515625, -0.19847869873046875, -0.1719512939453125, -0.14542388916015625, -0.118896484375, -0.09236907958984375, -0.0658416748046875, -0.03931427001953125, -0.012786865234375, 0.01374053955078125, 0.0402679443359375, 0.06679534912109375, 0.09332275390625, 0.11985015869140625, 0.1463775634765625, 0.17290496826171875, 0.199432373046875, 0.22595977783203125, 0.2524871826171875, 0.27901458740234375, 0.3055419921875, 0.33206939697265625, 0.3585968017578125, 0.38512420654296875, 0.411651611328125, 0.43817901611328125, 0.4647064208984375, 0.49123382568359375, 0.51776123046875, 0.5442886352539062, 0.5708160400390625, 0.5973434448242188, 0.623870849609375, 0.6503982543945312, 0.6769256591796875, 0.7034530639648438, 0.72998046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 10.0, 10.0, 19.0, 32.0, 48.0, 68.0, 123.0, 200.0, 324.0, 578.0, 1015.0, 2100.0, 4250.0, 9239.0, 21513.0, 54501.0, 146524.0, 322243.0, 287455.0, 119726.0, 44753.0, 18056.0, 7919.0, 3764.0, 1853.0, 963.0, 547.0, 305.0, 146.0, 106.0, 54.0, 38.0, 22.0, 17.0, 9.0, 8.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1441650390625, -0.13934326171875, -0.134521484375, -0.12969970703125, -0.1248779296875, -0.12005615234375, -0.115234375, -0.11041259765625, -0.1055908203125, -0.10076904296875, -0.095947265625, -0.09112548828125, -0.0863037109375, -0.08148193359375, -0.07666015625, -0.07183837890625, -0.0670166015625, -0.06219482421875, -0.057373046875, -0.05255126953125, -0.0477294921875, -0.04290771484375, -0.0380859375, -0.03326416015625, -0.0284423828125, -0.02362060546875, -0.018798828125, -0.01397705078125, -0.0091552734375, -0.00433349609375, 0.00048828125, 0.00531005859375, 0.0101318359375, 0.01495361328125, 0.019775390625, 0.02459716796875, 0.0294189453125, 0.03424072265625, 0.0390625, 0.04388427734375, 0.0487060546875, 0.05352783203125, 0.058349609375, 0.06317138671875, 0.0679931640625, 0.07281494140625, 0.07763671875, 0.08245849609375, 0.0872802734375, 0.09210205078125, 0.096923828125, 0.10174560546875, 0.1065673828125, 0.11138916015625, 0.1162109375, 0.12103271484375, 0.1258544921875, 0.13067626953125, 0.135498046875, 0.14031982421875, 0.1451416015625, 0.14996337890625, 0.15478515625, 0.15960693359375, 0.1644287109375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 6.0, 5.0, 15.0, 17.0, 15.0, 22.0, 17.0, 32.0, 35.0, 48.0, 67.0, 59.0, 80.0, 88.0, 76.0, 69.0, 62.0, 69.0, 50.0, 38.0, 33.0, 25.0, 12.0, 19.0, 9.0, 5.0, 6.0, 7.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.738569259643555e-05, -4.618801176548004e-05, -4.4990330934524536e-05, -4.379265010356903e-05, -4.2594969272613525e-05, -4.139728844165802e-05, -4.0199607610702515e-05, -3.900192677974701e-05, -3.7804245948791504e-05, -3.6606565117836e-05, -3.540888428688049e-05, -3.421120345592499e-05, -3.301352262496948e-05, -3.181584179401398e-05, -3.061816096305847e-05, -2.9420480132102966e-05, -2.822279930114746e-05, -2.7025118470191956e-05, -2.582743763923645e-05, -2.4629756808280945e-05, -2.343207597732544e-05, -2.2234395146369934e-05, -2.103671431541443e-05, -1.9839033484458923e-05, -1.8641352653503418e-05, -1.7443671822547913e-05, -1.6245990991592407e-05, -1.5048310160636902e-05, -1.3850629329681396e-05, -1.2652948498725891e-05, -1.1455267667770386e-05, -1.025758683681488e-05, -9.059906005859375e-06, -7.86222517490387e-06, -6.664544343948364e-06, -5.466863512992859e-06, -4.2691826820373535e-06, -3.071501851081848e-06, -1.8738210201263428e-06, -6.761401891708374e-07, 5.21540641784668e-07, 1.7192214727401733e-06, 2.9169023036956787e-06, 4.114583134651184e-06, 5.3122639656066895e-06, 6.509944796562195e-06, 7.7076256275177e-06, 8.905306458473206e-06, 1.0102987289428711e-05, 1.1300668120384216e-05, 1.2498348951339722e-05, 1.3696029782295227e-05, 1.4893710613250732e-05, 1.6091391444206238e-05, 1.7289072275161743e-05, 1.848675310611725e-05, 1.9684433937072754e-05, 2.088211476802826e-05, 2.2079795598983765e-05, 2.327747642993927e-05, 2.4475157260894775e-05, 2.567283809185028e-05, 2.6870518922805786e-05, 2.806819975376129e-05, 2.9265880584716797e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 4.0, 13.0, 21.0, 21.0, 42.0, 52.0, 68.0, 107.0, 185.0, 292.0, 474.0, 765.0, 1302.0, 2480.0, 4625.0, 9320.0, 20271.0, 47216.0, 116254.0, 261406.0, 308738.0, 158274.0, 64667.0, 26670.0, 12208.0, 5928.0, 2984.0, 1654.0, 980.0, 563.0, 325.0, 210.0, 122.0, 105.0, 47.0, 46.0, 41.0, 16.0, 16.0, 11.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13720703125, -0.132659912109375, -0.12811279296875, -0.123565673828125, -0.1190185546875, -0.114471435546875, -0.10992431640625, -0.105377197265625, -0.100830078125, -0.096282958984375, -0.09173583984375, -0.087188720703125, -0.0826416015625, -0.078094482421875, -0.07354736328125, -0.069000244140625, -0.064453125, -0.059906005859375, -0.05535888671875, -0.050811767578125, -0.0462646484375, -0.041717529296875, -0.03717041015625, -0.032623291015625, -0.028076171875, -0.023529052734375, -0.01898193359375, -0.014434814453125, -0.0098876953125, -0.005340576171875, -0.00079345703125, 0.003753662109375, 0.00830078125, 0.012847900390625, 0.01739501953125, 0.021942138671875, 0.0264892578125, 0.031036376953125, 0.03558349609375, 0.040130615234375, 0.044677734375, 0.049224853515625, 0.05377197265625, 0.058319091796875, 0.0628662109375, 0.067413330078125, 0.07196044921875, 0.076507568359375, 0.0810546875, 0.085601806640625, 0.09014892578125, 0.094696044921875, 0.0992431640625, 0.103790283203125, 0.10833740234375, 0.112884521484375, 0.117431640625, 0.121978759765625, 0.12652587890625, 0.131072998046875, 0.1356201171875, 0.140167236328125, 0.14471435546875, 0.149261474609375, 0.15380859375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 7.0, 11.0, 9.0, 9.0, 15.0, 5.0, 13.0, 22.0, 32.0, 24.0, 42.0, 39.0, 44.0, 73.0, 69.0, 64.0, 63.0, 61.0, 57.0, 58.0, 54.0, 43.0, 25.0, 34.0, 15.0, 14.0, 10.0, 22.0, 13.0, 7.0, 9.0, 7.0, 3.0, 8.0, 3.0, 4.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1724853515625, -0.16713333129882812, -0.16178131103515625, -0.15642929077148438, -0.1510772705078125, -0.14572525024414062, -0.14037322998046875, -0.13502120971679688, -0.129669189453125, -0.12431716918945312, -0.11896514892578125, -0.11361312866210938, -0.1082611083984375, -0.10290908813476562, -0.09755706787109375, -0.09220504760742188, -0.08685302734375, -0.08150100708007812, -0.07614898681640625, -0.07079696655273438, -0.0654449462890625, -0.060092926025390625, -0.05474090576171875, -0.049388885498046875, -0.044036865234375, -0.038684844970703125, -0.03333282470703125, -0.027980804443359375, -0.0226287841796875, -0.017276763916015625, -0.01192474365234375, -0.006572723388671875, -0.001220703125, 0.004131317138671875, 0.00948333740234375, 0.014835357666015625, 0.0201873779296875, 0.025539398193359375, 0.03089141845703125, 0.036243438720703125, 0.041595458984375, 0.046947479248046875, 0.05229949951171875, 0.057651519775390625, 0.0630035400390625, 0.06835556030273438, 0.07370758056640625, 0.07905960083007812, 0.08441162109375, 0.08976364135742188, 0.09511566162109375, 0.10046768188476562, 0.1058197021484375, 0.11117172241210938, 0.11652374267578125, 0.12187576293945312, 0.127227783203125, 0.13257980346679688, 0.13793182373046875, 0.14328384399414062, 0.1486358642578125, 0.15398788452148438, 0.15933990478515625, 0.16469192504882812, 0.1700439453125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 9.0, 20.0, 51.0, 119.0, 192.0, 233.0, 170.0, 117.0, 54.0, 22.0, 8.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.367371916770935, -1.257999062538147, -1.1486262083053589, -1.0392533540725708, -0.9298804998397827, -0.8205077052116394, -0.7111348509788513, -0.6017619967460632, -0.49238914251327515, -0.38301628828048706, -0.273643434047699, -0.16427060961723328, -0.05489775538444519, 0.05447506904602051, 0.1638479232788086, 0.2732207775115967, 0.38259363174438477, 0.49196648597717285, 0.6013393402099609, 0.710712194442749, 0.8200850486755371, 0.9294578433036804, 1.0388307571411133, 1.1482036113739014, 1.2575764656066895, 1.3669493198394775, 1.4763221740722656, 1.5856950283050537, 1.6950678825378418, 1.8044407367706299, 1.913813591003418, 2.023186445236206, 2.132559061050415, 2.241931915283203, 2.351304769515991, 2.4606776237487793, 2.5700504779815674, 2.6794233322143555, 2.7887961864471436, 2.8981690406799316, 3.0075418949127197, 3.116914749145508, 3.226287603378296, 3.335660457611084, 3.445033311843872, 3.55440616607666, 3.6637790203094482, 3.7731518745422363, 3.8825244903564453, 3.9918973445892334, 4.1012701988220215, 4.2106428146362305, 4.320015907287598, 4.429388523101807, 4.538761615753174, 4.648134231567383, 4.75750732421875, 4.866879940032959, 4.976253032684326, 5.085625648498535, 5.194998741149902, 5.304371356964111, 5.4137444496154785, 5.5231170654296875, 5.632490158081055]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 8.0, 5.0, 9.0, 12.0, 10.0, 5.0, 11.0, 12.0, 21.0, 21.0, 25.0, 24.0, 27.0, 33.0, 30.0, 44.0, 45.0, 40.0, 43.0, 51.0, 48.0, 45.0, 31.0, 47.0, 51.0, 42.0, 28.0, 26.0, 37.0, 22.0, 27.0, 24.0, 18.0, 15.0, 13.0, 13.0, 5.0, 8.0, 6.0, 8.0, 3.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3939929008483887, -1.3468642234802246, -1.2997355461120605, -1.252606987953186, -1.205478310585022, -1.158349633216858, -1.1112209558486938, -1.0640923976898193, -1.0169637203216553, -0.9698350429534912, -0.9227064251899719, -0.8755777478218079, -0.8284491300582886, -0.7813204526901245, -0.7341917753219604, -0.6870631575584412, -0.6399344801902771, -0.592805802822113, -0.5456771850585938, -0.4985485076904297, -0.4514198899269104, -0.40429121255874634, -0.35716256499290466, -0.310033917427063, -0.2629052698612213, -0.21577662229537964, -0.16864797472953796, -0.1215193122625351, -0.07439066469669342, -0.027262017130851746, 0.019866645336151123, 0.0669952929019928, 0.11412394046783447, 0.16125258803367615, 0.20838123559951782, 0.2555099129676819, 0.30263853073120117, 0.34976720809936523, 0.3968958556652069, 0.4440245032310486, 0.49115315079689026, 0.5382817983627319, 0.585410475730896, 0.6325390934944153, 0.6796677708625793, 0.7267963886260986, 0.7739250659942627, 0.8210537433624268, 0.868182361125946, 0.9153110384941101, 0.9624396562576294, 1.0095683336257935, 1.0566970109939575, 1.103825569152832, 1.150954246520996, 1.1980829238891602, 1.2452116012573242, 1.2923402786254883, 1.3394689559936523, 1.3865975141525269, 1.433726191520691, 1.480854868888855, 1.527983546257019, 1.5751121044158936, 1.6222407817840576]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 13.0, 11.0, 19.0, 23.0, 30.0, 51.0, 61.0, 83.0, 141.0, 185.0, 235.0, 384.0, 530.0, 685.0, 1053.0, 1744.0, 2692.0, 4523.0, 7994.0, 15072.0, 30993.0, 75418.0, 244781.0, 944761.0, 1808730.0, 744835.0, 186638.0, 62575.0, 26954.0, 13624.0, 7399.0, 4359.0, 2639.0, 1663.0, 1018.0, 719.0, 480.0, 334.0, 222.0, 164.0, 134.0, 107.0, 55.0, 38.0, 41.0, 28.0, 19.0, 11.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.271240234375, -0.2631206512451172, -0.2550010681152344, -0.24688148498535156, -0.23876190185546875, -0.23064231872558594, -0.22252273559570312, -0.2144031524658203, -0.2062835693359375, -0.1981639862060547, -0.19004440307617188, -0.18192481994628906, -0.17380523681640625, -0.16568565368652344, -0.15756607055664062, -0.1494464874267578, -0.141326904296875, -0.1332073211669922, -0.12508773803710938, -0.11696815490722656, -0.10884857177734375, -0.10072898864746094, -0.09260940551757812, -0.08448982238769531, -0.0763702392578125, -0.06825065612792969, -0.060131072998046875, -0.05201148986816406, -0.04389190673828125, -0.03577232360839844, -0.027652740478515625, -0.019533157348632812, -0.01141357421875, -0.0032939910888671875, 0.004825592041015625, 0.012945175170898438, 0.02106475830078125, 0.029184341430664062, 0.037303924560546875, 0.04542350769042969, 0.0535430908203125, 0.06166267395019531, 0.06978225708007812, 0.07790184020996094, 0.08602142333984375, 0.09414100646972656, 0.10226058959960938, 0.11038017272949219, 0.118499755859375, 0.1266193389892578, 0.13473892211914062, 0.14285850524902344, 0.15097808837890625, 0.15909767150878906, 0.16721725463867188, 0.1753368377685547, 0.1834564208984375, 0.1915760040283203, 0.19969558715820312, 0.20781517028808594, 0.21593475341796875, 0.22405433654785156, 0.23217391967773438, 0.2402935028076172, 0.2484130859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 8.0, 11.0, 15.0, 18.0, 19.0, 25.0, 26.0, 40.0, 40.0, 51.0, 39.0, 49.0, 55.0, 54.0, 61.0, 56.0, 62.0, 44.0, 57.0, 43.0, 40.0, 32.0, 40.0, 32.0, 16.0, 15.0, 9.0, 15.0, 8.0, 4.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29296875, -0.2837104797363281, -0.27445220947265625, -0.2651939392089844, -0.2559356689453125, -0.24667739868164062, -0.23741912841796875, -0.22816085815429688, -0.218902587890625, -0.20964431762695312, -0.20038604736328125, -0.19112777709960938, -0.1818695068359375, -0.17261123657226562, -0.16335296630859375, -0.15409469604492188, -0.14483642578125, -0.13557815551757812, -0.12631988525390625, -0.11706161499023438, -0.1078033447265625, -0.09854507446289062, -0.08928680419921875, -0.08002853393554688, -0.070770263671875, -0.061511993408203125, -0.05225372314453125, -0.042995452880859375, -0.0337371826171875, -0.024478912353515625, -0.01522064208984375, -0.005962371826171875, 0.0032958984375, 0.012554168701171875, 0.02181243896484375, 0.031070709228515625, 0.0403289794921875, 0.049587249755859375, 0.05884552001953125, 0.06810379028320312, 0.077362060546875, 0.08662033081054688, 0.09587860107421875, 0.10513687133789062, 0.1143951416015625, 0.12365341186523438, 0.13291168212890625, 0.14216995239257812, 0.15142822265625, 0.16068649291992188, 0.16994476318359375, 0.17920303344726562, 0.1884613037109375, 0.19771957397460938, 0.20697784423828125, 0.21623611450195312, 0.225494384765625, 0.23475265502929688, 0.24401092529296875, 0.2532691955566406, 0.2625274658203125, 0.2717857360839844, 0.28104400634765625, 0.2903022766113281, 0.299560546875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 6.0, 3.0, 3.0, 8.0, 6.0, 5.0, 15.0, 22.0, 30.0, 38.0, 59.0, 69.0, 116.0, 195.0, 261.0, 465.0, 807.0, 1474.0, 2905.0, 6878.0, 18759.0, 60533.0, 260104.0, 2184286.0, 1400714.0, 184298.0, 45871.0, 14868.0, 5695.0, 2540.0, 1318.0, 714.0, 401.0, 231.0, 160.0, 101.0, 82.0, 69.0, 40.0, 30.0, 27.0, 20.0, 11.0, 8.0, 11.0, 5.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.478759765625, -0.4637489318847656, -0.44873809814453125, -0.4337272644042969, -0.4187164306640625, -0.4037055969238281, -0.38869476318359375, -0.3736839294433594, -0.358673095703125, -0.3436622619628906, -0.32865142822265625, -0.3136405944824219, -0.2986297607421875, -0.2836189270019531, -0.26860809326171875, -0.2535972595214844, -0.23858642578125, -0.22357559204101562, -0.20856475830078125, -0.19355392456054688, -0.1785430908203125, -0.16353225708007812, -0.14852142333984375, -0.13351058959960938, -0.118499755859375, -0.10348892211914062, -0.08847808837890625, -0.07346725463867188, -0.0584564208984375, -0.043445587158203125, -0.02843475341796875, -0.013423919677734375, 0.0015869140625, 0.016597747802734375, 0.03160858154296875, 0.046619415283203125, 0.0616302490234375, 0.07664108276367188, 0.09165191650390625, 0.10666275024414062, 0.121673583984375, 0.13668441772460938, 0.15169525146484375, 0.16670608520507812, 0.1817169189453125, 0.19672775268554688, 0.21173858642578125, 0.22674942016601562, 0.24176025390625, 0.2567710876464844, 0.27178192138671875, 0.2867927551269531, 0.3018035888671875, 0.3168144226074219, 0.33182525634765625, 0.3468360900878906, 0.361846923828125, 0.3768577575683594, 0.39186859130859375, 0.4068794250488281, 0.4218902587890625, 0.4369010925292969, 0.45191192626953125, 0.4669227600097656, 0.48193359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 7.0, 4.0, 4.0, 11.0, 16.0, 23.0, 29.0, 60.0, 91.0, 169.0, 282.0, 523.0, 1032.0, 889.0, 437.0, 196.0, 99.0, 81.0, 53.0, 25.0, 17.0, 10.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.57421875, -0.5510482788085938, -0.5278778076171875, -0.5047073364257812, -0.481536865234375, -0.45836639404296875, -0.4351959228515625, -0.41202545166015625, -0.38885498046875, -0.36568450927734375, -0.3425140380859375, -0.31934356689453125, -0.296173095703125, -0.27300262451171875, -0.2498321533203125, -0.22666168212890625, -0.2034912109375, -0.18032073974609375, -0.1571502685546875, -0.13397979736328125, -0.110809326171875, -0.08763885498046875, -0.0644683837890625, -0.04129791259765625, -0.01812744140625, 0.00504302978515625, 0.0282135009765625, 0.05138397216796875, 0.074554443359375, 0.09772491455078125, 0.1208953857421875, 0.14406585693359375, 0.167236328125, 0.19040679931640625, 0.2135772705078125, 0.23674774169921875, 0.259918212890625, 0.28308868408203125, 0.3062591552734375, 0.32942962646484375, 0.35260009765625, 0.37577056884765625, 0.3989410400390625, 0.42211151123046875, 0.445281982421875, 0.46845245361328125, 0.4916229248046875, 0.5147933959960938, 0.5379638671875, 0.5611343383789062, 0.5843048095703125, 0.6074752807617188, 0.630645751953125, 0.6538162231445312, 0.6769866943359375, 0.7001571655273438, 0.72332763671875, 0.7464981079101562, 0.7696685791015625, 0.7928390502929688, 0.816009521484375, 0.8391799926757812, 0.8623504638671875, 0.8855209350585938, 0.90869140625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 9.0, 15.0, 25.0, 34.0, 65.0, 98.0, 135.0, 142.0, 145.0, 119.0, 75.0, 43.0, 35.0, 18.0, 15.0, 10.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4869329929351807, -3.3945891857147217, -3.3022453784942627, -3.2099015712738037, -3.1175577640533447, -3.0252139568328857, -2.932870388031006, -2.840526580810547, -2.748182773590088, -2.655838966369629, -2.56349515914917, -2.471151351928711, -2.378807544708252, -2.286463737487793, -2.194119930267334, -2.101776123046875, -2.009432315826416, -1.917088508605957, -1.824744701385498, -1.732400894165039, -1.64005708694458, -1.547713279724121, -1.4553695917129517, -1.3630257844924927, -1.2706819772720337, -1.1783381700515747, -1.0859943628311157, -0.9936506152153015, -0.9013068079948425, -0.8089630007743835, -0.7166192531585693, -0.6242754459381104, -0.5319318771362305, -0.4395880699157715, -0.3472442924976349, -0.2549005150794983, -0.1625567078590393, -0.07021290063858032, 0.022130846977233887, 0.11447465419769287, 0.20681846141815186, 0.29916226863861084, 0.39150604605674744, 0.48384982347488403, 0.576193630695343, 0.668537437915802, 0.7608811855316162, 0.8532249927520752, 0.9455687999725342, 1.0379126071929932, 1.1302564144134521, 1.2226002216339111, 1.3149440288543701, 1.407287836074829, 1.4996315240859985, 1.5919753313064575, 1.6843191385269165, 1.7766629457473755, 1.8690067529678345, 1.961350440979004, 2.053694248199463, 2.146038055419922, 2.238381862640381, 2.33072566986084, 2.423069477081299]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 4.0, 4.0, 10.0, 12.0, 16.0, 20.0, 17.0, 16.0, 20.0, 29.0, 28.0, 27.0, 37.0, 40.0, 32.0, 44.0, 37.0, 59.0, 51.0, 36.0, 47.0, 41.0, 50.0, 42.0, 43.0, 37.0, 22.0, 22.0, 28.0, 15.0, 22.0, 17.0, 16.0, 14.0, 11.0, 11.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5050649642944336, -1.4561575651168823, -1.407250165939331, -1.3583427667617798, -1.3094353675842285, -1.2605279684066772, -1.211620569229126, -1.1627132892608643, -1.1138057708740234, -1.0648983716964722, -1.015990972518921, -0.9670835733413696, -0.9181761741638184, -0.8692687749862671, -0.8203614354133606, -0.7714540362358093, -0.7225466966629028, -0.6736392974853516, -0.6247318983078003, -0.575824499130249, -0.5269170999526978, -0.47800973057746887, -0.42910236120224, -0.3801949620246887, -0.33128756284713745, -0.2823801636695862, -0.2334727793931961, -0.18456539511680603, -0.13565799593925476, -0.08675059676170349, -0.03784322738647461, 0.01106417179107666, 0.05997157096862793, 0.1088789626955986, 0.15778635442256927, 0.20669373869895935, 0.2556011378765106, 0.3045085370540619, 0.35341590642929077, 0.40232330560684204, 0.4512307047843933, 0.5001381039619446, 0.5490455031394958, 0.5979528427124023, 0.6468602418899536, 0.6957676410675049, 0.7446750402450562, 0.7935824394226074, 0.8424898386001587, 0.89139723777771, 0.9403046369552612, 0.9892120361328125, 1.0381194353103638, 1.087026834487915, 1.1359341144561768, 1.1848416328430176, 1.2337489128112793, 1.2826563119888306, 1.3315637111663818, 1.380471110343933, 1.4293785095214844, 1.4782859086990356, 1.527193307876587, 1.5761005878448486, 1.6250081062316895]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 9.0, 19.0, 24.0, 28.0, 56.0, 92.0, 117.0, 186.0, 290.0, 424.0, 745.0, 1284.0, 2123.0, 3751.0, 6883.0, 13925.0, 31664.0, 81013.0, 224051.0, 370381.0, 188965.0, 68467.0, 27097.0, 12396.0, 6177.0, 3449.0, 1889.0, 1166.0, 716.0, 414.0, 273.0, 155.0, 110.0, 86.0, 44.0, 25.0, 21.0, 16.0, 7.0, 5.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.477294921875, -0.4641876220703125, -0.451080322265625, -0.4379730224609375, -0.42486572265625, -0.4117584228515625, -0.398651123046875, -0.3855438232421875, -0.3724365234375, -0.3593292236328125, -0.346221923828125, -0.3331146240234375, -0.32000732421875, -0.3069000244140625, -0.293792724609375, -0.2806854248046875, -0.267578125, -0.2544708251953125, -0.241363525390625, -0.2282562255859375, -0.21514892578125, -0.2020416259765625, -0.188934326171875, -0.1758270263671875, -0.1627197265625, -0.1496124267578125, -0.136505126953125, -0.1233978271484375, -0.11029052734375, -0.0971832275390625, -0.084075927734375, -0.0709686279296875, -0.057861328125, -0.0447540283203125, -0.031646728515625, -0.0185394287109375, -0.00543212890625, 0.0076751708984375, 0.020782470703125, 0.0338897705078125, 0.0469970703125, 0.0601043701171875, 0.073211669921875, 0.0863189697265625, 0.09942626953125, 0.1125335693359375, 0.125640869140625, 0.1387481689453125, 0.15185546875, 0.1649627685546875, 0.178070068359375, 0.1911773681640625, 0.20428466796875, 0.2173919677734375, 0.230499267578125, 0.2436065673828125, 0.2567138671875, 0.2698211669921875, 0.282928466796875, 0.2960357666015625, 0.30914306640625, 0.3222503662109375, 0.335357666015625, 0.3484649658203125, 0.361572265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 8.0, 4.0, 14.0, 6.0, 13.0, 18.0, 22.0, 22.0, 28.0, 28.0, 43.0, 36.0, 43.0, 41.0, 67.0, 62.0, 50.0, 64.0, 55.0, 47.0, 47.0, 47.0, 36.0, 36.0, 35.0, 25.0, 18.0, 22.0, 18.0, 13.0, 7.0, 10.0, 9.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.30810546875, -0.2987709045410156, -0.28943634033203125, -0.2801017761230469, -0.2707672119140625, -0.2614326477050781, -0.25209808349609375, -0.24276351928710938, -0.233428955078125, -0.22409439086914062, -0.21475982666015625, -0.20542526245117188, -0.1960906982421875, -0.18675613403320312, -0.17742156982421875, -0.16808700561523438, -0.15875244140625, -0.14941787719726562, -0.14008331298828125, -0.13074874877929688, -0.1214141845703125, -0.11207962036132812, -0.10274505615234375, -0.09341049194335938, -0.084075927734375, -0.07474136352539062, -0.06540679931640625, -0.056072235107421875, -0.0467376708984375, -0.037403106689453125, -0.02806854248046875, -0.018733978271484375, -0.0093994140625, -6.4849853515625e-05, 0.00926971435546875, 0.018604278564453125, 0.0279388427734375, 0.037273406982421875, 0.04660797119140625, 0.055942535400390625, 0.065277099609375, 0.07461166381835938, 0.08394622802734375, 0.09328079223632812, 0.1026153564453125, 0.11194992065429688, 0.12128448486328125, 0.13061904907226562, 0.13995361328125, 0.14928817749023438, 0.15862274169921875, 0.16795730590820312, 0.1772918701171875, 0.18662643432617188, 0.19596099853515625, 0.20529556274414062, 0.214630126953125, 0.22396469116210938, 0.23329925537109375, 0.24263381958007812, 0.2519683837890625, 0.2613029479980469, 0.27063751220703125, 0.2799720764160156, 0.289306640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 6.0, 21.0, 19.0, 28.0, 45.0, 83.0, 147.0, 253.0, 516.0, 1128.0, 2606.0, 6333.0, 17344.0, 53793.0, 215689.0, 519593.0, 164002.0, 43250.0, 14089.0, 5361.0, 2259.0, 981.0, 472.0, 209.0, 126.0, 70.0, 44.0, 23.0, 14.0, 11.0, 16.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58740234375, -0.5674285888671875, -0.547454833984375, -0.5274810791015625, -0.50750732421875, -0.4875335693359375, -0.467559814453125, -0.4475860595703125, -0.4276123046875, -0.4076385498046875, -0.387664794921875, -0.3676910400390625, -0.34771728515625, -0.3277435302734375, -0.307769775390625, -0.2877960205078125, -0.267822265625, -0.2478485107421875, -0.227874755859375, -0.2079010009765625, -0.18792724609375, -0.1679534912109375, -0.147979736328125, -0.1280059814453125, -0.1080322265625, -0.0880584716796875, -0.068084716796875, -0.0481109619140625, -0.02813720703125, -0.0081634521484375, 0.011810302734375, 0.0317840576171875, 0.0517578125, 0.0717315673828125, 0.091705322265625, 0.1116790771484375, 0.13165283203125, 0.1516265869140625, 0.171600341796875, 0.1915740966796875, 0.2115478515625, 0.2315216064453125, 0.251495361328125, 0.2714691162109375, 0.29144287109375, 0.3114166259765625, 0.331390380859375, 0.3513641357421875, 0.371337890625, 0.3913116455078125, 0.411285400390625, 0.4312591552734375, 0.45123291015625, 0.4712066650390625, 0.491180419921875, 0.5111541748046875, 0.5311279296875, 0.5511016845703125, 0.571075439453125, 0.5910491943359375, 0.61102294921875, 0.6309967041015625, 0.650970458984375, 0.6709442138671875, 0.69091796875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 7.0, 5.0, 12.0, 9.0, 11.0, 25.0, 32.0, 22.0, 28.0, 34.0, 42.0, 44.0, 45.0, 47.0, 56.0, 57.0, 55.0, 55.0, 59.0, 45.0, 39.0, 33.0, 36.0, 35.0, 36.0, 23.0, 28.0, 23.0, 17.0, 8.0, 10.0, 9.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.84814453125, -0.8217926025390625, -0.795440673828125, -0.7690887451171875, -0.74273681640625, -0.7163848876953125, -0.690032958984375, -0.6636810302734375, -0.6373291015625, -0.6109771728515625, -0.584625244140625, -0.5582733154296875, -0.53192138671875, -0.5055694580078125, -0.479217529296875, -0.4528656005859375, -0.426513671875, -0.4001617431640625, -0.373809814453125, -0.3474578857421875, -0.32110595703125, -0.2947540283203125, -0.268402099609375, -0.2420501708984375, -0.2156982421875, -0.1893463134765625, -0.162994384765625, -0.1366424560546875, -0.11029052734375, -0.0839385986328125, -0.057586669921875, -0.0312347412109375, -0.0048828125, 0.0214691162109375, 0.047821044921875, 0.0741729736328125, 0.10052490234375, 0.1268768310546875, 0.153228759765625, 0.1795806884765625, 0.2059326171875, 0.2322845458984375, 0.258636474609375, 0.2849884033203125, 0.31134033203125, 0.3376922607421875, 0.364044189453125, 0.3903961181640625, 0.416748046875, 0.4430999755859375, 0.469451904296875, 0.4958038330078125, 0.52215576171875, 0.5485076904296875, 0.574859619140625, 0.6012115478515625, 0.6275634765625, 0.6539154052734375, 0.680267333984375, 0.7066192626953125, 0.73297119140625, 0.7593231201171875, 0.785675048828125, 0.8120269775390625, 0.83837890625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 2.0, 2.0, 4.0, 10.0, 9.0, 10.0, 23.0, 30.0, 47.0, 37.0, 61.0, 81.0, 148.0, 190.0, 288.0, 430.0, 657.0, 1102.0, 1861.0, 3293.0, 5993.0, 11278.0, 22757.0, 49360.0, 109548.0, 225594.0, 285883.0, 174954.0, 81057.0, 36532.0, 17210.0, 8634.0, 4616.0, 2585.0, 1564.0, 914.0, 587.0, 342.0, 259.0, 167.0, 118.0, 85.0, 59.0, 49.0, 43.0, 25.0, 19.0, 11.0, 10.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-0.1300048828125, -0.12632274627685547, -0.12264060974121094, -0.1189584732055664, -0.11527633666992188, -0.11159420013427734, -0.10791206359863281, -0.10422992706298828, -0.10054779052734375, -0.09686565399169922, -0.09318351745605469, -0.08950138092041016, -0.08581924438476562, -0.0821371078491211, -0.07845497131347656, -0.07477283477783203, -0.0710906982421875, -0.06740856170654297, -0.06372642517089844, -0.060044288635253906, -0.056362152099609375, -0.052680015563964844, -0.04899787902832031, -0.04531574249267578, -0.04163360595703125, -0.03795146942138672, -0.03426933288574219, -0.030587196350097656, -0.026905059814453125, -0.023222923278808594, -0.019540786743164062, -0.01585865020751953, -0.012176513671875, -0.008494377136230469, -0.0048122406005859375, -0.0011301040649414062, 0.002552032470703125, 0.006234169006347656, 0.009916305541992188, 0.013598442077636719, 0.01728057861328125, 0.02096271514892578, 0.024644851684570312, 0.028326988220214844, 0.032009124755859375, 0.035691261291503906, 0.03937339782714844, 0.04305553436279297, 0.0467376708984375, 0.05041980743408203, 0.05410194396972656, 0.057784080505371094, 0.061466217041015625, 0.06514835357666016, 0.06883049011230469, 0.07251262664794922, 0.07619476318359375, 0.07987689971923828, 0.08355903625488281, 0.08724117279052734, 0.09092330932617188, 0.0946054458618164, 0.09828758239746094, 0.10196971893310547, 0.10565185546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 7.0, 16.0, 20.0, 20.0, 35.0, 40.0, 59.0, 95.0, 104.0, 163.0, 122.0, 92.0, 54.0, 56.0, 38.0, 28.0, 17.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2378902435302734e-05, -4.0502287447452545e-05, -3.8625672459602356e-05, -3.674905747175217e-05, -3.487244248390198e-05, -3.299582749605179e-05, -3.11192125082016e-05, -2.924259752035141e-05, -2.736598253250122e-05, -2.548936754465103e-05, -2.3612752556800842e-05, -2.1736137568950653e-05, -1.9859522581100464e-05, -1.7982907593250275e-05, -1.6106292605400085e-05, -1.4229677617549896e-05, -1.2353062629699707e-05, -1.0476447641849518e-05, -8.599832653999329e-06, -6.723217666149139e-06, -4.84660267829895e-06, -2.969987690448761e-06, -1.0933727025985718e-06, 7.832422852516174e-07, 2.6598572731018066e-06, 4.536472260951996e-06, 6.413087248802185e-06, 8.289702236652374e-06, 1.0166317224502563e-05, 1.2042932212352753e-05, 1.3919547200202942e-05, 1.579616218805313e-05, 1.767277717590332e-05, 1.954939216375351e-05, 2.14260071516037e-05, 2.3302622139453888e-05, 2.5179237127304077e-05, 2.7055852115154266e-05, 2.8932467103004456e-05, 3.0809082090854645e-05, 3.2685697078704834e-05, 3.456231206655502e-05, 3.643892705440521e-05, 3.83155420422554e-05, 4.019215703010559e-05, 4.206877201795578e-05, 4.394538700580597e-05, 4.582200199365616e-05, 4.769861698150635e-05, 4.957523196935654e-05, 5.1451846957206726e-05, 5.3328461945056915e-05, 5.5205076932907104e-05, 5.7081691920757294e-05, 5.895830690860748e-05, 6.083492189645767e-05, 6.271153688430786e-05, 6.458815187215805e-05, 6.646476686000824e-05, 6.834138184785843e-05, 7.021799683570862e-05, 7.209461182355881e-05, 7.3971226811409e-05, 7.584784179925919e-05, 7.772445678710938e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 9.0, 6.0, 11.0, 20.0, 25.0, 31.0, 53.0, 76.0, 125.0, 222.0, 360.0, 585.0, 974.0, 1672.0, 2908.0, 5326.0, 10414.0, 20497.0, 43339.0, 93785.0, 189851.0, 267664.0, 207519.0, 105872.0, 48854.0, 23125.0, 11545.0, 5975.0, 3192.0, 1861.0, 1051.0, 627.0, 334.0, 227.0, 131.0, 94.0, 69.0, 41.0, 21.0, 21.0, 12.0, 11.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.1168212890625, -0.1132354736328125, -0.109649658203125, -0.1060638427734375, -0.10247802734375, -0.0988922119140625, -0.095306396484375, -0.0917205810546875, -0.088134765625, -0.0845489501953125, -0.080963134765625, -0.0773773193359375, -0.07379150390625, -0.0702056884765625, -0.066619873046875, -0.0630340576171875, -0.0594482421875, -0.0558624267578125, -0.052276611328125, -0.0486907958984375, -0.04510498046875, -0.0415191650390625, -0.037933349609375, -0.0343475341796875, -0.03076171875, -0.0271759033203125, -0.023590087890625, -0.0200042724609375, -0.01641845703125, -0.0128326416015625, -0.009246826171875, -0.0056610107421875, -0.0020751953125, 0.0015106201171875, 0.005096435546875, 0.0086822509765625, 0.01226806640625, 0.0158538818359375, 0.019439697265625, 0.0230255126953125, 0.026611328125, 0.0301971435546875, 0.033782958984375, 0.0373687744140625, 0.04095458984375, 0.0445404052734375, 0.048126220703125, 0.0517120361328125, 0.0552978515625, 0.0588836669921875, 0.062469482421875, 0.0660552978515625, 0.06964111328125, 0.0732269287109375, 0.076812744140625, 0.0803985595703125, 0.083984375, 0.0875701904296875, 0.091156005859375, 0.0947418212890625, 0.09832763671875, 0.1019134521484375, 0.105499267578125, 0.1090850830078125, 0.1126708984375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 9.0, 11.0, 10.0, 13.0, 10.0, 22.0, 17.0, 37.0, 48.0, 45.0, 45.0, 45.0, 52.0, 61.0, 98.0, 72.0, 53.0, 58.0, 59.0, 50.0, 38.0, 28.0, 24.0, 21.0, 15.0, 14.0, 11.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1456298828125, -0.14086532592773438, -0.13610076904296875, -0.13133621215820312, -0.1265716552734375, -0.12180709838867188, -0.11704254150390625, -0.11227798461914062, -0.107513427734375, -0.10274887084960938, -0.09798431396484375, -0.09321975708007812, -0.0884552001953125, -0.08369064331054688, -0.07892608642578125, -0.07416152954101562, -0.06939697265625, -0.06463241577148438, -0.05986785888671875, -0.055103302001953125, -0.0503387451171875, -0.045574188232421875, -0.04080963134765625, -0.036045074462890625, -0.031280517578125, -0.026515960693359375, -0.02175140380859375, -0.016986846923828125, -0.0122222900390625, -0.007457733154296875, -0.00269317626953125, 0.002071380615234375, 0.0068359375, 0.011600494384765625, 0.01636505126953125, 0.021129608154296875, 0.0258941650390625, 0.030658721923828125, 0.03542327880859375, 0.040187835693359375, 0.044952392578125, 0.049716949462890625, 0.05448150634765625, 0.059246063232421875, 0.0640106201171875, 0.06877517700195312, 0.07353973388671875, 0.07830429077148438, 0.08306884765625, 0.08783340454101562, 0.09259796142578125, 0.09736251831054688, 0.1021270751953125, 0.10689163208007812, 0.11165618896484375, 0.11642074584960938, 0.121185302734375, 0.12594985961914062, 0.13071441650390625, 0.13547897338867188, 0.1402435302734375, 0.14500808715820312, 0.14977264404296875, 0.15453720092773438, 0.1593017578125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 8.0, 6.0, 16.0, 24.0, 34.0, 36.0, 45.0, 87.0, 100.0, 101.0, 115.0, 102.0, 81.0, 84.0, 51.0, 31.0, 24.0, 16.0, 9.0, 7.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1826345920562744, -2.1228837966918945, -2.0631330013275146, -2.0033822059631348, -1.9436314105987549, -1.883880615234375, -1.8241298198699951, -1.7643790245056152, -1.7046282291412354, -1.6448774337768555, -1.5851266384124756, -1.5253758430480957, -1.4656250476837158, -1.405874252319336, -1.346123456954956, -1.2863726615905762, -1.2266217470169067, -1.1668709516525269, -1.107120156288147, -1.047369360923767, -0.9876185655593872, -0.9278677701950073, -0.8681169152259827, -0.8083661198616028, -0.7486153244972229, -0.688864529132843, -0.6291137337684631, -0.5693628787994385, -0.5096120834350586, -0.4498613178730011, -0.39011049270629883, -0.33035969734191895, -0.27060890197753906, -0.21085810661315918, -0.1511072963476181, -0.09135648608207703, -0.031605690717697144, 0.02814510464668274, 0.08789592981338501, 0.1476467251777649, 0.20739752054214478, 0.26714831590652466, 0.32689911127090454, 0.3866499364376068, 0.4464007318019867, 0.506151556968689, 0.5659023523330688, 0.6256531476974487, 0.6854039430618286, 0.7451547384262085, 0.8049055337905884, 0.8646563291549683, 0.9244071245193481, 0.984157919883728, 1.0439088344573975, 1.1036596298217773, 1.1634104251861572, 1.223161220550537, 1.282912015914917, 1.3426628112792969, 1.4024136066436768, 1.4621644020080566, 1.5219151973724365, 1.5816659927368164, 1.6414167881011963]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 10.0, 5.0, 8.0, 17.0, 18.0, 19.0, 26.0, 28.0, 23.0, 30.0, 40.0, 35.0, 49.0, 35.0, 41.0, 40.0, 51.0, 47.0, 57.0, 56.0, 45.0, 38.0, 44.0, 25.0, 35.0, 33.0, 25.0, 18.0, 23.0, 13.0, 14.0, 11.0, 15.0, 6.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5793888568878174, -1.5214924812316895, -1.4635961055755615, -1.4056997299194336, -1.3478032350540161, -1.2899068593978882, -1.2320104837417603, -1.1741141080856323, -1.1162177324295044, -1.0583213567733765, -1.0004249811172485, -0.9425285458564758, -0.8846321702003479, -0.8267357349395752, -0.7688393592834473, -0.7109429836273193, -0.6530465483665466, -0.5951501727104187, -0.537253737449646, -0.47935736179351807, -0.42146098613739014, -0.3635645806789398, -0.3056681752204895, -0.24777179956436157, -0.18987539410591125, -0.13197900354862213, -0.07408260554075241, -0.01618620753288269, 0.04171018302440643, 0.09960657358169556, 0.15750297904014587, 0.2153993546962738, 0.2732957601547241, 0.33119216561317444, 0.38908854126930237, 0.4469849467277527, 0.5048813223838806, 0.5627777576446533, 0.6206741333007812, 0.6785705089569092, 0.7364668846130371, 0.794363260269165, 0.8522596955299377, 0.9101560711860657, 0.9680524468421936, 1.0259488821029663, 1.0838452577590942, 1.1417416334152222, 1.1996381282806396, 1.2575345039367676, 1.3154308795928955, 1.3733272552490234, 1.431223750114441, 1.4891201257705688, 1.5470165014266968, 1.6049128770828247, 1.6628092527389526, 1.7207056283950806, 1.7786020040512085, 1.836498498916626, 1.894394874572754, 1.9522912502288818, 2.0101876258850098, 2.0680840015411377, 2.1259803771972656]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 13.0, 10.0, 15.0, 12.0, 23.0, 33.0, 48.0, 62.0, 107.0, 152.0, 237.0, 375.0, 628.0, 1008.0, 1890.0, 3672.0, 7523.0, 17290.0, 49320.0, 213743.0, 1103486.0, 2070414.0, 560971.0, 107714.0, 30911.0, 12326.0, 5691.0, 2833.0, 1498.0, 836.0, 490.0, 345.0, 193.0, 126.0, 94.0, 55.0, 47.0, 22.0, 20.0, 11.0, 8.0, 10.0, 10.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3515625, -0.34067535400390625, -0.3297882080078125, -0.31890106201171875, -0.308013916015625, -0.29712677001953125, -0.2862396240234375, -0.27535247802734375, -0.26446533203125, -0.25357818603515625, -0.2426910400390625, -0.23180389404296875, -0.220916748046875, -0.21002960205078125, -0.1991424560546875, -0.18825531005859375, -0.1773681640625, -0.16648101806640625, -0.1555938720703125, -0.14470672607421875, -0.133819580078125, -0.12293243408203125, -0.1120452880859375, -0.10115814208984375, -0.09027099609375, -0.07938385009765625, -0.0684967041015625, -0.05760955810546875, -0.046722412109375, -0.03583526611328125, -0.0249481201171875, -0.01406097412109375, -0.003173828125, 0.00771331787109375, 0.0186004638671875, 0.02948760986328125, 0.040374755859375, 0.05126190185546875, 0.0621490478515625, 0.07303619384765625, 0.08392333984375, 0.09481048583984375, 0.1056976318359375, 0.11658477783203125, 0.127471923828125, 0.13835906982421875, 0.1492462158203125, 0.16013336181640625, 0.1710205078125, 0.18190765380859375, 0.1927947998046875, 0.20368194580078125, 0.214569091796875, 0.22545623779296875, 0.2363433837890625, 0.24723052978515625, 0.25811767578125, 0.26900482177734375, 0.2798919677734375, 0.29077911376953125, 0.301666259765625, 0.31255340576171875, 0.3234405517578125, 0.33432769775390625, 0.34521484375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 6.0, 8.0, 12.0, 12.0, 14.0, 13.0, 13.0, 27.0, 34.0, 35.0, 41.0, 45.0, 57.0, 46.0, 39.0, 46.0, 48.0, 59.0, 46.0, 44.0, 49.0, 31.0, 36.0, 25.0, 37.0, 37.0, 18.0, 20.0, 17.0, 16.0, 17.0, 12.0, 11.0, 9.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.287841796875, -0.2791099548339844, -0.27037811279296875, -0.2616462707519531, -0.2529144287109375, -0.24418258666992188, -0.23545074462890625, -0.22671890258789062, -0.217987060546875, -0.20925521850585938, -0.20052337646484375, -0.19179153442382812, -0.1830596923828125, -0.17432785034179688, -0.16559600830078125, -0.15686416625976562, -0.14813232421875, -0.13940048217773438, -0.13066864013671875, -0.12193679809570312, -0.1132049560546875, -0.10447311401367188, -0.09574127197265625, -0.08700942993164062, -0.078277587890625, -0.06954574584960938, -0.06081390380859375, -0.052082061767578125, -0.0433502197265625, -0.034618377685546875, -0.02588653564453125, -0.017154693603515625, -0.0084228515625, 0.000308990478515625, 0.00904083251953125, 0.017772674560546875, 0.0265045166015625, 0.035236358642578125, 0.04396820068359375, 0.052700042724609375, 0.061431884765625, 0.07016372680664062, 0.07889556884765625, 0.08762741088867188, 0.0963592529296875, 0.10509109497070312, 0.11382293701171875, 0.12255477905273438, 0.13128662109375, 0.14001846313476562, 0.14875030517578125, 0.15748214721679688, 0.1662139892578125, 0.17494583129882812, 0.18367767333984375, 0.19240951538085938, 0.201141357421875, 0.20987319946289062, 0.21860504150390625, 0.22733688354492188, 0.2360687255859375, 0.24480056762695312, 0.25353240966796875, 0.2622642517089844, 0.27099609375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 8.0, 7.0, 13.0, 15.0, 22.0, 39.0, 32.0, 68.0, 100.0, 127.0, 198.0, 349.0, 541.0, 918.0, 1898.0, 4120.0, 10401.0, 31109.0, 120460.0, 793150.0, 2764845.0, 359348.0, 72148.0, 20568.0, 7216.0, 3058.0, 1392.0, 792.0, 434.0, 308.0, 175.0, 130.0, 87.0, 45.0, 52.0, 38.0, 20.0, 20.0, 11.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.513671875, -0.49777984619140625, -0.4818878173828125, -0.46599578857421875, -0.450103759765625, -0.43421173095703125, -0.4183197021484375, -0.40242767333984375, -0.38653564453125, -0.37064361572265625, -0.3547515869140625, -0.33885955810546875, -0.322967529296875, -0.30707550048828125, -0.2911834716796875, -0.27529144287109375, -0.2593994140625, -0.24350738525390625, -0.2276153564453125, -0.21172332763671875, -0.195831298828125, -0.17993927001953125, -0.1640472412109375, -0.14815521240234375, -0.13226318359375, -0.11637115478515625, -0.1004791259765625, -0.08458709716796875, -0.068695068359375, -0.05280303955078125, -0.0369110107421875, -0.02101898193359375, -0.005126953125, 0.01076507568359375, 0.0266571044921875, 0.04254913330078125, 0.058441162109375, 0.07433319091796875, 0.0902252197265625, 0.10611724853515625, 0.12200927734375, 0.13790130615234375, 0.1537933349609375, 0.16968536376953125, 0.185577392578125, 0.20146942138671875, 0.2173614501953125, 0.23325347900390625, 0.2491455078125, 0.26503753662109375, 0.2809295654296875, 0.29682159423828125, 0.312713623046875, 0.32860565185546875, 0.3444976806640625, 0.36038970947265625, 0.37628173828125, 0.39217376708984375, 0.4080657958984375, 0.42395782470703125, 0.439849853515625, 0.45574188232421875, 0.4716339111328125, 0.48752593994140625, 0.50341796875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 10.0, 7.0, 9.0, 18.0, 23.0, 31.0, 44.0, 58.0, 101.0, 220.0, 433.0, 874.0, 1030.0, 568.0, 254.0, 151.0, 95.0, 47.0, 37.0, 26.0, 8.0, 18.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6416015625, -0.61798095703125, -0.5943603515625, -0.57073974609375, -0.547119140625, -0.52349853515625, -0.4998779296875, -0.47625732421875, -0.45263671875, -0.42901611328125, -0.4053955078125, -0.38177490234375, -0.358154296875, -0.33453369140625, -0.3109130859375, -0.28729248046875, -0.263671875, -0.24005126953125, -0.2164306640625, -0.19281005859375, -0.169189453125, -0.14556884765625, -0.1219482421875, -0.09832763671875, -0.07470703125, -0.05108642578125, -0.0274658203125, -0.00384521484375, 0.019775390625, 0.04339599609375, 0.0670166015625, 0.09063720703125, 0.1142578125, 0.13787841796875, 0.1614990234375, 0.18511962890625, 0.208740234375, 0.23236083984375, 0.2559814453125, 0.27960205078125, 0.30322265625, 0.32684326171875, 0.3504638671875, 0.37408447265625, 0.397705078125, 0.42132568359375, 0.4449462890625, 0.46856689453125, 0.4921875, 0.51580810546875, 0.5394287109375, 0.56304931640625, 0.586669921875, 0.61029052734375, 0.6339111328125, 0.65753173828125, 0.68115234375, 0.70477294921875, 0.7283935546875, 0.75201416015625, 0.775634765625, 0.79925537109375, 0.8228759765625, 0.84649658203125, 0.8701171875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 5.0, 5.0, 10.0, 18.0, 39.0, 84.0, 127.0, 170.0, 180.0, 151.0, 99.0, 52.0, 26.0, 17.0, 9.0, 5.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.797063112258911, -3.682469129562378, -3.567875385284424, -3.4532814025878906, -3.3386874198913574, -3.224093437194824, -3.10949969291687, -2.994905710220337, -2.880311965942383, -2.7657179832458496, -2.6511242389678955, -2.5365302562713623, -2.421936273574829, -2.307342529296875, -2.192748546600342, -2.0781545639038086, -1.9635605812072754, -1.8489667177200317, -1.7343727350234985, -1.6197788715362549, -1.5051848888397217, -1.390591025352478, -1.2759971618652344, -1.1614031791687012, -1.0468093156814575, -0.9322153925895691, -0.8176214694976807, -0.703027606010437, -0.5884336829185486, -0.47383975982666016, -0.3592458963394165, -0.24465197324752808, -0.13005781173706055, -0.015463903546333313, 0.09913000464439392, 0.21372389793395996, 0.3283178210258484, 0.4429117441177368, 0.5575056076049805, 0.6720995306968689, 0.7866934537887573, 0.9012873768806458, 1.0158812999725342, 1.1304751634597778, 1.2450690269470215, 1.3596630096435547, 1.4742568731307983, 1.588850736618042, 1.7034447193145752, 1.8180385828018188, 1.932632565498352, 2.0472264289855957, 2.161820411682129, 2.276414394378662, 2.391008138656616, 2.5056021213531494, 2.6201958656311035, 2.7347898483276367, 2.849383592605591, 2.963977575302124, 3.0785715579986572, 3.1931653022766113, 3.3077592849731445, 3.4223532676696777, 3.536947250366211]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 12.0, 12.0, 8.0, 12.0, 19.0, 18.0, 20.0, 21.0, 25.0, 36.0, 20.0, 33.0, 36.0, 38.0, 50.0, 44.0, 39.0, 36.0, 43.0, 49.0, 41.0, 38.0, 40.0, 38.0, 32.0, 32.0, 39.0, 16.0, 21.0, 17.0, 25.0, 14.0, 16.0, 15.0, 9.0, 2.0, 11.0, 10.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.435516357421875, -1.3848820924758911, -1.3342478275299072, -1.2836135625839233, -1.2329792976379395, -1.1823451519012451, -1.1317108869552612, -1.0810766220092773, -1.0304423570632935, -0.9798080921173096, -0.9291738271713257, -0.8785396218299866, -0.8279053568840027, -0.7772710919380188, -0.7266368865966797, -0.6760026216506958, -0.6253683567047119, -0.574734091758728, -0.5240998268127441, -0.47346562147140503, -0.42283135652542114, -0.37219709157943726, -0.32156285643577576, -0.27092862129211426, -0.22029435634613037, -0.16966010630130768, -0.11902585625648499, -0.06839160621166229, -0.0177573561668396, 0.03287690877914429, 0.08351114392280579, 0.13414537906646729, 0.18477964401245117, 0.23541389405727386, 0.28604814410209656, 0.33668237924575806, 0.38731664419174194, 0.43795090913772583, 0.48858514428138733, 0.5392193794250488, 0.5898536443710327, 0.6404879093170166, 0.6911221742630005, 0.7417563796043396, 0.7923906445503235, 0.8430249094963074, 0.8936591148376465, 0.9442933797836304, 0.9949276447296143, 1.0455619096755981, 1.096196174621582, 1.146830439567566, 1.1974647045135498, 1.2480988502502441, 1.298733115196228, 1.349367380142212, 1.4000016450881958, 1.4506359100341797, 1.5012701749801636, 1.5519044399261475, 1.6025385856628418, 1.6531729698181152, 1.7038071155548096, 1.7544413805007935, 1.8050756454467773]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 9.0, 8.0, 15.0, 12.0, 36.0, 42.0, 43.0, 74.0, 111.0, 198.0, 308.0, 492.0, 768.0, 1215.0, 2064.0, 3460.0, 5709.0, 10296.0, 18862.0, 37275.0, 83403.0, 205178.0, 335178.0, 190445.0, 77001.0, 35020.0, 17816.0, 9678.0, 5503.0, 3216.0, 1978.0, 1173.0, 685.0, 438.0, 296.0, 196.0, 112.0, 83.0, 46.0, 43.0, 21.0, 16.0, 11.0, 9.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364501953125, -0.3521270751953125, -0.339752197265625, -0.3273773193359375, -0.31500244140625, -0.3026275634765625, -0.290252685546875, -0.2778778076171875, -0.2655029296875, -0.2531280517578125, -0.240753173828125, -0.2283782958984375, -0.21600341796875, -0.2036285400390625, -0.191253662109375, -0.1788787841796875, -0.16650390625, -0.1541290283203125, -0.141754150390625, -0.1293792724609375, -0.11700439453125, -0.1046295166015625, -0.092254638671875, -0.0798797607421875, -0.0675048828125, -0.0551300048828125, -0.042755126953125, -0.0303802490234375, -0.01800537109375, -0.0056304931640625, 0.006744384765625, 0.0191192626953125, 0.031494140625, 0.0438690185546875, 0.056243896484375, 0.0686187744140625, 0.08099365234375, 0.0933685302734375, 0.105743408203125, 0.1181182861328125, 0.1304931640625, 0.1428680419921875, 0.155242919921875, 0.1676177978515625, 0.17999267578125, 0.1923675537109375, 0.204742431640625, 0.2171173095703125, 0.2294921875, 0.2418670654296875, 0.254241943359375, 0.2666168212890625, 0.27899169921875, 0.2913665771484375, 0.303741455078125, 0.3161163330078125, 0.3284912109375, 0.3408660888671875, 0.353240966796875, 0.3656158447265625, 0.37799072265625, 0.3903656005859375, 0.402740478515625, 0.4151153564453125, 0.427490234375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 6.0, 8.0, 7.0, 2.0, 10.0, 14.0, 13.0, 19.0, 19.0, 11.0, 24.0, 32.0, 36.0, 47.0, 38.0, 28.0, 51.0, 45.0, 48.0, 55.0, 44.0, 39.0, 42.0, 44.0, 32.0, 42.0, 34.0, 30.0, 33.0, 25.0, 21.0, 16.0, 19.0, 19.0, 12.0, 10.0, 9.0, 5.0, 4.0, 1.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2783203125, -0.27010345458984375, -0.2618865966796875, -0.25366973876953125, -0.245452880859375, -0.23723602294921875, -0.2290191650390625, -0.22080230712890625, -0.21258544921875, -0.20436859130859375, -0.1961517333984375, -0.18793487548828125, -0.179718017578125, -0.17150115966796875, -0.1632843017578125, -0.15506744384765625, -0.1468505859375, -0.13863372802734375, -0.1304168701171875, -0.12220001220703125, -0.113983154296875, -0.10576629638671875, -0.0975494384765625, -0.08933258056640625, -0.08111572265625, -0.07289886474609375, -0.0646820068359375, -0.05646514892578125, -0.048248291015625, -0.04003143310546875, -0.0318145751953125, -0.02359771728515625, -0.015380859375, -0.00716400146484375, 0.0010528564453125, 0.00926971435546875, 0.017486572265625, 0.02570343017578125, 0.0339202880859375, 0.04213714599609375, 0.05035400390625, 0.05857086181640625, 0.0667877197265625, 0.07500457763671875, 0.083221435546875, 0.09143829345703125, 0.0996551513671875, 0.10787200927734375, 0.1160888671875, 0.12430572509765625, 0.1325225830078125, 0.14073944091796875, 0.148956298828125, 0.15717315673828125, 0.1653900146484375, 0.17360687255859375, 0.18182373046875, 0.19004058837890625, 0.1982574462890625, 0.20647430419921875, 0.214691162109375, 0.22290802001953125, 0.2311248779296875, 0.23934173583984375, 0.24755859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 8.0, 12.0, 16.0, 18.0, 31.0, 54.0, 91.0, 160.0, 270.0, 457.0, 872.0, 1819.0, 4107.0, 10653.0, 32558.0, 137120.0, 578825.0, 213335.0, 44604.0, 13774.0, 5219.0, 2157.0, 1038.0, 540.0, 308.0, 182.0, 125.0, 64.0, 45.0, 23.0, 17.0, 12.0, 15.0, 1.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8408203125, -0.8150482177734375, -0.789276123046875, -0.7635040283203125, -0.73773193359375, -0.7119598388671875, -0.686187744140625, -0.6604156494140625, -0.6346435546875, -0.6088714599609375, -0.583099365234375, -0.5573272705078125, -0.53155517578125, -0.5057830810546875, -0.480010986328125, -0.4542388916015625, -0.428466796875, -0.4026947021484375, -0.376922607421875, -0.3511505126953125, -0.32537841796875, -0.2996063232421875, -0.273834228515625, -0.2480621337890625, -0.2222900390625, -0.1965179443359375, -0.170745849609375, -0.1449737548828125, -0.11920166015625, -0.0934295654296875, -0.067657470703125, -0.0418853759765625, -0.01611328125, 0.0096588134765625, 0.035430908203125, 0.0612030029296875, 0.08697509765625, 0.1127471923828125, 0.138519287109375, 0.1642913818359375, 0.1900634765625, 0.2158355712890625, 0.241607666015625, 0.2673797607421875, 0.29315185546875, 0.3189239501953125, 0.344696044921875, 0.3704681396484375, 0.396240234375, 0.4220123291015625, 0.447784423828125, 0.4735565185546875, 0.49932861328125, 0.5251007080078125, 0.550872802734375, 0.5766448974609375, 0.6024169921875, 0.6281890869140625, 0.653961181640625, 0.6797332763671875, 0.70550537109375, 0.7312774658203125, 0.757049560546875, 0.7828216552734375, 0.80859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 6.0, 9.0, 7.0, 6.0, 9.0, 16.0, 13.0, 30.0, 31.0, 27.0, 32.0, 38.0, 61.0, 49.0, 50.0, 66.0, 72.0, 68.0, 58.0, 63.0, 48.0, 48.0, 32.0, 36.0, 30.0, 19.0, 20.0, 9.0, 12.0, 4.0, 12.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2666015625, -1.231842041015625, -1.19708251953125, -1.162322998046875, -1.1275634765625, -1.092803955078125, -1.05804443359375, -1.023284912109375, -0.988525390625, -0.953765869140625, -0.91900634765625, -0.884246826171875, -0.8494873046875, -0.814727783203125, -0.77996826171875, -0.745208740234375, -0.71044921875, -0.675689697265625, -0.64093017578125, -0.606170654296875, -0.5714111328125, -0.536651611328125, -0.50189208984375, -0.467132568359375, -0.432373046875, -0.397613525390625, -0.36285400390625, -0.328094482421875, -0.2933349609375, -0.258575439453125, -0.22381591796875, -0.189056396484375, -0.154296875, -0.119537353515625, -0.08477783203125, -0.050018310546875, -0.0152587890625, 0.019500732421875, 0.05426025390625, 0.089019775390625, 0.123779296875, 0.158538818359375, 0.19329833984375, 0.228057861328125, 0.2628173828125, 0.297576904296875, 0.33233642578125, 0.367095947265625, 0.40185546875, 0.436614990234375, 0.47137451171875, 0.506134033203125, 0.5408935546875, 0.575653076171875, 0.61041259765625, 0.645172119140625, 0.679931640625, 0.714691162109375, 0.74945068359375, 0.784210205078125, 0.8189697265625, 0.853729248046875, 0.88848876953125, 0.923248291015625, 0.9580078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 12.0, 9.0, 17.0, 25.0, 26.0, 46.0, 72.0, 128.0, 151.0, 241.0, 420.0, 647.0, 958.0, 1817.0, 3275.0, 6331.0, 13592.0, 32898.0, 100441.0, 373108.0, 359830.0, 95574.0, 31740.0, 13322.0, 6217.0, 3170.0, 1743.0, 996.0, 626.0, 349.0, 245.0, 178.0, 106.0, 66.0, 58.0, 32.0, 28.0, 19.0, 14.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.25537109375, -0.24785614013671875, -0.2403411865234375, -0.23282623291015625, -0.225311279296875, -0.21779632568359375, -0.2102813720703125, -0.20276641845703125, -0.19525146484375, -0.18773651123046875, -0.1802215576171875, -0.17270660400390625, -0.165191650390625, -0.15767669677734375, -0.1501617431640625, -0.14264678955078125, -0.1351318359375, -0.12761688232421875, -0.1201019287109375, -0.11258697509765625, -0.105072021484375, -0.09755706787109375, -0.0900421142578125, -0.08252716064453125, -0.07501220703125, -0.06749725341796875, -0.0599822998046875, -0.05246734619140625, -0.044952392578125, -0.03743743896484375, -0.0299224853515625, -0.02240753173828125, -0.014892578125, -0.00737762451171875, 0.0001373291015625, 0.00765228271484375, 0.015167236328125, 0.02268218994140625, 0.0301971435546875, 0.03771209716796875, 0.04522705078125, 0.05274200439453125, 0.0602569580078125, 0.06777191162109375, 0.075286865234375, 0.08280181884765625, 0.0903167724609375, 0.09783172607421875, 0.1053466796875, 0.11286163330078125, 0.1203765869140625, 0.12789154052734375, 0.135406494140625, 0.14292144775390625, 0.1504364013671875, 0.15795135498046875, 0.16546630859375, 0.17298126220703125, 0.1804962158203125, 0.18801116943359375, 0.195526123046875, 0.20304107666015625, 0.2105560302734375, 0.21807098388671875, 0.2255859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 12.0, 10.0, 14.0, 26.0, 15.0, 32.0, 65.0, 113.0, 164.0, 161.0, 124.0, 93.0, 46.0, 38.0, 24.0, 4.0, 12.0, 10.0, 4.0, 5.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.00012421607971191406, -0.00012127123773097992, -0.00011832639575004578, -0.00011538155376911163, -0.00011243671178817749, -0.00010949186980724335, -0.0001065470278263092, -0.00010360218584537506, -0.00010065734386444092, -9.771250188350677e-05, -9.476765990257263e-05, -9.182281792163849e-05, -8.887797594070435e-05, -8.59331339597702e-05, -8.298829197883606e-05, -8.004344999790192e-05, -7.709860801696777e-05, -7.415376603603363e-05, -7.120892405509949e-05, -6.826408207416534e-05, -6.53192400932312e-05, -6.237439811229706e-05, -5.9429556131362915e-05, -5.648471415042877e-05, -5.353987216949463e-05, -5.0595030188560486e-05, -4.765018820762634e-05, -4.47053462266922e-05, -4.176050424575806e-05, -3.8815662264823914e-05, -3.587082028388977e-05, -3.292597830295563e-05, -2.9981136322021484e-05, -2.703629434108734e-05, -2.4091452360153198e-05, -2.1146610379219055e-05, -1.8201768398284912e-05, -1.5256926417350769e-05, -1.2312084436416626e-05, -9.367242455482483e-06, -6.42240047454834e-06, -3.4775584936141968e-06, -5.327165126800537e-07, 2.4121254682540894e-06, 5.356967449188232e-06, 8.301809430122375e-06, 1.1246651411056519e-05, 1.4191493391990662e-05, 1.7136335372924805e-05, 2.0081177353858948e-05, 2.302601933479309e-05, 2.5970861315727234e-05, 2.8915703296661377e-05, 3.186054527759552e-05, 3.480538725852966e-05, 3.7750229239463806e-05, 4.069507122039795e-05, 4.363991320133209e-05, 4.6584755182266235e-05, 4.952959716320038e-05, 5.247443914413452e-05, 5.5419281125068665e-05, 5.836412310600281e-05, 6.130896508693695e-05, 6.42538070678711e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 6.0, 16.0, 23.0, 38.0, 43.0, 92.0, 135.0, 237.0, 487.0, 915.0, 2159.0, 5270.0, 15181.0, 52100.0, 243955.0, 535856.0, 140852.0, 33894.0, 10354.0, 3775.0, 1523.0, 726.0, 372.0, 220.0, 112.0, 72.0, 42.0, 23.0, 19.0, 19.0, 14.0, 6.0, 3.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24169921875, -0.23285675048828125, -0.2240142822265625, -0.21517181396484375, -0.206329345703125, -0.19748687744140625, -0.1886444091796875, -0.17980194091796875, -0.17095947265625, -0.16211700439453125, -0.1532745361328125, -0.14443206787109375, -0.135589599609375, -0.12674713134765625, -0.1179046630859375, -0.10906219482421875, -0.1002197265625, -0.09137725830078125, -0.0825347900390625, -0.07369232177734375, -0.064849853515625, -0.05600738525390625, -0.0471649169921875, -0.03832244873046875, -0.02947998046875, -0.02063751220703125, -0.0117950439453125, -0.00295257568359375, 0.005889892578125, 0.01473236083984375, 0.0235748291015625, 0.03241729736328125, 0.041259765625, 0.05010223388671875, 0.0589447021484375, 0.06778717041015625, 0.076629638671875, 0.08547210693359375, 0.0943145751953125, 0.10315704345703125, 0.11199951171875, 0.12084197998046875, 0.1296844482421875, 0.13852691650390625, 0.147369384765625, 0.15621185302734375, 0.1650543212890625, 0.17389678955078125, 0.1827392578125, 0.19158172607421875, 0.2004241943359375, 0.20926666259765625, 0.218109130859375, 0.22695159912109375, 0.2357940673828125, 0.24463653564453125, 0.25347900390625, 0.26232147216796875, 0.2711639404296875, 0.28000640869140625, 0.288848876953125, 0.29769134521484375, 0.3065338134765625, 0.31537628173828125, 0.32421875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 16.0, 8.0, 10.0, 26.0, 40.0, 48.0, 97.0, 141.0, 156.0, 158.0, 101.0, 50.0, 36.0, 26.0, 18.0, 7.0, 8.0, 8.0, 7.0, 10.0, 3.0, 6.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32080078125, -0.3086967468261719, -0.29659271240234375, -0.2844886779785156, -0.2723846435546875, -0.2602806091308594, -0.24817657470703125, -0.23607254028320312, -0.223968505859375, -0.21186447143554688, -0.19976043701171875, -0.18765640258789062, -0.1755523681640625, -0.16344833374023438, -0.15134429931640625, -0.13924026489257812, -0.12713623046875, -0.11503219604492188, -0.10292816162109375, -0.09082412719726562, -0.0787200927734375, -0.06661605834960938, -0.05451202392578125, -0.042407989501953125, -0.030303955078125, -0.018199920654296875, -0.00609588623046875, 0.006008148193359375, 0.0181121826171875, 0.030216217041015625, 0.04232025146484375, 0.054424285888671875, 0.0665283203125, 0.07863235473632812, 0.09073638916015625, 0.10284042358398438, 0.1149444580078125, 0.12704849243164062, 0.13915252685546875, 0.15125656127929688, 0.163360595703125, 0.17546463012695312, 0.18756866455078125, 0.19967269897460938, 0.2117767333984375, 0.22388076782226562, 0.23598480224609375, 0.24808883666992188, 0.26019287109375, 0.2722969055175781, 0.28440093994140625, 0.2965049743652344, 0.3086090087890625, 0.3207130432128906, 0.33281707763671875, 0.3449211120605469, 0.357025146484375, 0.3691291809082031, 0.38123321533203125, 0.3933372497558594, 0.4054412841796875, 0.4175453186035156, 0.42964935302734375, 0.4417533874511719, 0.453857421875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 14.0, 12.0, 32.0, 49.0, 70.0, 118.0, 148.0, 145.0, 124.0, 91.0, 91.0, 30.0, 26.0, 20.0, 5.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9044694900512695, -3.8074872493743896, -3.7105047702789307, -3.613522529602051, -3.516540288925171, -3.419558048248291, -3.322575569152832, -3.225593328475952, -3.1286110877990723, -3.0316288471221924, -2.9346463680267334, -2.8376641273498535, -2.7406818866729736, -2.6436996459960938, -2.5467171669006348, -2.449734926223755, -2.352752447128296, -2.255770206451416, -2.158787727355957, -2.061805486679077, -1.9648232460021973, -1.8678408861160278, -1.7708585262298584, -1.6738762855529785, -1.576893925666809, -1.4799115657806396, -1.3829293251037598, -1.2859469652175903, -1.188964605331421, -1.091982364654541, -0.9950000047683716, -0.8980177044868469, -0.8010356426239014, -0.7040533423423767, -0.607071042060852, -0.5100886821746826, -0.41310638189315796, -0.3161240816116333, -0.21914172172546387, -0.12215942144393921, -0.02517712116241455, 0.0718051940202713, 0.16878750920295715, 0.2657698392868042, 0.36275213956832886, 0.4597344398498535, 0.556716799736023, 0.6536991000175476, 0.7506814002990723, 0.8476637005805969, 0.9446460008621216, 1.041628360748291, 1.138610601425171, 1.2355929613113403, 1.3325753211975098, 1.4295575618743896, 1.526539921760559, 1.6235222816467285, 1.7205045223236084, 1.8174868822097778, 1.9144692420959473, 2.011451482772827, 2.108433723449707, 2.205416202545166, 2.302398443222046]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 8.0, 7.0, 7.0, 8.0, 10.0, 5.0, 14.0, 17.0, 9.0, 20.0, 28.0, 22.0, 22.0, 23.0, 31.0, 47.0, 30.0, 34.0, 31.0, 39.0, 35.0, 32.0, 46.0, 45.0, 41.0, 26.0, 38.0, 30.0, 30.0, 34.0, 24.0, 32.0, 25.0, 27.0, 17.0, 28.0, 14.0, 15.0, 8.0, 7.0, 7.0, 2.0, 6.0, 2.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4954466819763184, -1.4461283683776855, -1.3968101739883423, -1.3474918603897095, -1.2981736660003662, -1.2488553524017334, -1.1995370388031006, -1.1502188444137573, -1.1009005308151245, -1.0515822172164917, -1.0022640228271484, -0.9529457092285156, -0.9036274552345276, -0.8543092012405396, -0.8049909472465515, -0.7556726932525635, -0.7063544392585754, -0.6570361852645874, -0.6077179312705994, -0.5583996772766113, -0.5090813636779785, -0.4597631096839905, -0.41044485569000244, -0.361126571893692, -0.311808317899704, -0.26249006390571594, -0.21317178010940552, -0.16385352611541748, -0.11453525722026825, -0.06521698832511902, -0.01589873433113098, 0.03341954946517944, 0.08273780345916748, 0.1320560723543167, 0.18137434124946594, 0.23069259524345398, 0.2800108790397644, 0.32932913303375244, 0.3786473870277405, 0.4279656708240509, 0.47728392481803894, 0.5266022086143494, 0.5759204626083374, 0.6252387166023254, 0.6745569705963135, 0.7238752841949463, 0.7731934785842896, 0.8225117921829224, 0.8718300461769104, 0.9211483001708984, 0.9704665541648865, 1.0197848081588745, 1.0691031217575073, 1.1184213161468506, 1.1677396297454834, 1.2170579433441162, 1.2663761377334595, 1.3156944513320923, 1.3650126457214355, 1.4143309593200684, 1.4636491537094116, 1.5129674673080444, 1.5622856616973877, 1.6116039752960205, 1.6609222888946533]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 14.0, 18.0, 26.0, 37.0, 60.0, 99.0, 181.0, 323.0, 421.0, 804.0, 1486.0, 2664.0, 4829.0, 9131.0, 18542.0, 40191.0, 97967.0, 274392.0, 719923.0, 1292136.0, 1017231.0, 445022.0, 157452.0, 58470.0, 25545.0, 12442.0, 6509.0, 3557.0, 1878.0, 1175.0, 658.0, 392.0, 239.0, 143.0, 100.0, 68.0, 57.0, 30.0, 17.0, 10.0, 13.0, 6.0, 3.0, 5.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.2431640625, -0.23595619201660156, -0.22874832153320312, -0.2215404510498047, -0.21433258056640625, -0.2071247100830078, -0.19991683959960938, -0.19270896911621094, -0.1855010986328125, -0.17829322814941406, -0.17108535766601562, -0.1638774871826172, -0.15666961669921875, -0.1494617462158203, -0.14225387573242188, -0.13504600524902344, -0.127838134765625, -0.12063026428222656, -0.11342239379882812, -0.10621452331542969, -0.09900665283203125, -0.09179878234863281, -0.08459091186523438, -0.07738304138183594, -0.0701751708984375, -0.06296730041503906, -0.055759429931640625, -0.04855155944824219, -0.04134368896484375, -0.03413581848144531, -0.026927947998046875, -0.019720077514648438, -0.01251220703125, -0.0053043365478515625, 0.001903533935546875, 0.009111404418945312, 0.01631927490234375, 0.023527145385742188, 0.030735015869140625, 0.03794288635253906, 0.0451507568359375, 0.05235862731933594, 0.059566497802734375, 0.06677436828613281, 0.07398223876953125, 0.08119010925292969, 0.08839797973632812, 0.09560585021972656, 0.102813720703125, 0.11002159118652344, 0.11722946166992188, 0.12443733215332031, 0.13164520263671875, 0.1388530731201172, 0.14606094360351562, 0.15326881408691406, 0.1604766845703125, 0.16768455505371094, 0.17489242553710938, 0.1821002960205078, 0.18930816650390625, 0.1965160369873047, 0.20372390747070312, 0.21093177795410156, 0.2181396484375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 2.0, 8.0, 8.0, 10.0, 14.0, 17.0, 13.0, 12.0, 29.0, 29.0, 19.0, 30.0, 38.0, 33.0, 34.0, 48.0, 50.0, 39.0, 49.0, 47.0, 47.0, 48.0, 31.0, 38.0, 41.0, 37.0, 38.0, 21.0, 24.0, 28.0, 20.0, 20.0, 17.0, 15.0, 7.0, 9.0, 8.0, 5.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.261474609375, -0.2536029815673828, -0.24573135375976562, -0.23785972595214844, -0.22998809814453125, -0.22211647033691406, -0.21424484252929688, -0.2063732147216797, -0.1985015869140625, -0.1906299591064453, -0.18275833129882812, -0.17488670349121094, -0.16701507568359375, -0.15914344787597656, -0.15127182006835938, -0.1434001922607422, -0.135528564453125, -0.1276569366455078, -0.11978530883789062, -0.11191368103027344, -0.10404205322265625, -0.09617042541503906, -0.08829879760742188, -0.08042716979980469, -0.0725555419921875, -0.06468391418457031, -0.056812286376953125, -0.04894065856933594, -0.04106903076171875, -0.03319740295410156, -0.025325775146484375, -0.017454147338867188, -0.00958251953125, -0.0017108917236328125, 0.006160736083984375, 0.014032363891601562, 0.02190399169921875, 0.029775619506835938, 0.037647247314453125, 0.04551887512207031, 0.0533905029296875, 0.06126213073730469, 0.06913375854492188, 0.07700538635253906, 0.08487701416015625, 0.09274864196777344, 0.10062026977539062, 0.10849189758300781, 0.116363525390625, 0.12423515319824219, 0.13210678100585938, 0.13997840881347656, 0.14785003662109375, 0.15572166442871094, 0.16359329223632812, 0.1714649200439453, 0.1793365478515625, 0.1872081756591797, 0.19507980346679688, 0.20295143127441406, 0.21082305908203125, 0.21869468688964844, 0.22656631469726562, 0.2344379425048828, 0.2423095703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 6.0, 12.0, 11.0, 24.0, 29.0, 51.0, 84.0, 156.0, 304.0, 762.0, 2625.0, 12685.0, 101715.0, 1899623.0, 2050818.0, 107502.0, 13417.0, 2883.0, 825.0, 330.0, 169.0, 96.0, 44.0, 30.0, 21.0, 13.0, 10.0, 17.0, 7.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0], "bins": [-1.1923828125, -1.16400146484375, -1.1356201171875, -1.10723876953125, -1.078857421875, -1.05047607421875, -1.0220947265625, -0.99371337890625, -0.96533203125, -0.93695068359375, -0.9085693359375, -0.88018798828125, -0.851806640625, -0.82342529296875, -0.7950439453125, -0.76666259765625, -0.73828125, -0.70989990234375, -0.6815185546875, -0.65313720703125, -0.624755859375, -0.59637451171875, -0.5679931640625, -0.53961181640625, -0.51123046875, -0.48284912109375, -0.4544677734375, -0.42608642578125, -0.397705078125, -0.36932373046875, -0.3409423828125, -0.31256103515625, -0.2841796875, -0.25579833984375, -0.2274169921875, -0.19903564453125, -0.170654296875, -0.14227294921875, -0.1138916015625, -0.08551025390625, -0.05712890625, -0.02874755859375, -0.0003662109375, 0.02801513671875, 0.056396484375, 0.08477783203125, 0.1131591796875, 0.14154052734375, 0.169921875, 0.19830322265625, 0.2266845703125, 0.25506591796875, 0.283447265625, 0.31182861328125, 0.3402099609375, 0.36859130859375, 0.39697265625, 0.42535400390625, 0.4537353515625, 0.48211669921875, 0.510498046875, 0.53887939453125, 0.5672607421875, 0.59564208984375, 0.6240234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 9.0, 16.0, 18.0, 32.0, 55.0, 87.0, 120.0, 208.0, 372.0, 684.0, 862.0, 670.0, 376.0, 230.0, 130.0, 78.0, 44.0, 23.0, 25.0, 13.0, 5.0, 7.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.399169921875, -0.3749580383300781, -0.35074615478515625, -0.3265342712402344, -0.3023223876953125, -0.2781105041503906, -0.25389862060546875, -0.22968673706054688, -0.205474853515625, -0.18126296997070312, -0.15705108642578125, -0.13283920288085938, -0.1086273193359375, -0.08441543579101562, -0.06020355224609375, -0.035991668701171875, -0.01177978515625, 0.012432098388671875, 0.03664398193359375, 0.060855865478515625, 0.0850677490234375, 0.10927963256835938, 0.13349151611328125, 0.15770339965820312, 0.181915283203125, 0.20612716674804688, 0.23033905029296875, 0.2545509338378906, 0.2787628173828125, 0.3029747009277344, 0.32718658447265625, 0.3513984680175781, 0.3756103515625, 0.3998222351074219, 0.42403411865234375, 0.4482460021972656, 0.4724578857421875, 0.4966697692871094, 0.5208816528320312, 0.5450935363769531, 0.569305419921875, 0.5935173034667969, 0.6177291870117188, 0.6419410705566406, 0.6661529541015625, 0.6903648376464844, 0.7145767211914062, 0.7387886047363281, 0.76300048828125, 0.7872123718261719, 0.8114242553710938, 0.8356361389160156, 0.8598480224609375, 0.8840599060058594, 0.9082717895507812, 0.9324836730957031, 0.956695556640625, 0.9809074401855469, 1.0051193237304688, 1.0293312072753906, 1.0535430908203125, 1.0777549743652344, 1.1019668579101562, 1.1261787414550781, 1.150390625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 9.0, 11.0, 16.0, 57.0, 127.0, 200.0, 230.0, 182.0, 89.0, 49.0, 21.0, 8.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8434247970581055, -5.662446022033691, -5.4814677238464355, -5.3004889488220215, -5.119510650634766, -4.938531875610352, -4.7575531005859375, -4.576574802398682, -4.395596504211426, -4.214617729187012, -4.033639430999756, -3.852660655975342, -3.671682357788086, -3.490703582763672, -3.309725046157837, -3.128746509552002, -2.947767734527588, -2.766789197921753, -2.585810661315918, -2.404831886291504, -2.223853588104248, -2.042874813079834, -1.861896276473999, -1.680917739868164, -1.499939203262329, -1.3189606666564941, -1.1379821300506592, -0.9570034742355347, -0.7760249376296997, -0.5950464010238647, -0.41406774520874023, -0.23308920860290527, -0.05211019515991211, 0.12886837124824524, 0.3098469376564026, 0.4908255338668823, 0.6718040704727173, 0.8527826070785522, 1.0337612628936768, 1.2147397994995117, 1.3957183361053467, 1.5766968727111816, 1.7576754093170166, 1.9386540651321411, 2.1196327209472656, 2.3006110191345215, 2.4815897941589355, 2.6625683307647705, 2.8435468673706055, 3.0245254039764404, 3.2055039405822754, 3.3864827156066895, 3.5674610137939453, 3.7484397888183594, 3.9294183254241943, 4.110396862030029, 4.291375160217285, 4.472353935241699, 4.653332233428955, 4.834311008453369, 5.015289306640625, 5.196268081665039, 5.377246856689453, 5.558225154876709, 5.739203929901123]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 2.0, 7.0, 8.0, 6.0, 7.0, 8.0, 14.0, 15.0, 16.0, 25.0, 22.0, 16.0, 29.0, 23.0, 25.0, 26.0, 30.0, 31.0, 32.0, 40.0, 34.0, 38.0, 42.0, 31.0, 51.0, 49.0, 28.0, 48.0, 26.0, 26.0, 23.0, 25.0, 24.0, 27.0, 23.0, 13.0, 20.0, 15.0, 14.0, 9.0, 4.0, 7.0, 13.0, 7.0, 7.0, 3.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4265673160552979, -1.3828784227371216, -1.3391895294189453, -1.2955005168914795, -1.2518116235733032, -1.208122730255127, -1.1644338369369507, -1.1207449436187744, -1.0770559310913086, -1.0333670377731323, -0.9896780848503113, -0.945989191532135, -0.902300238609314, -0.8586113452911377, -0.8149224519729614, -0.7712334990501404, -0.7275446057319641, -0.6838557124137878, -0.6401667594909668, -0.5964778661727905, -0.5527889132499695, -0.5091000199317932, -0.46541109681129456, -0.4217221736907959, -0.37803325057029724, -0.3343443274497986, -0.2906554043292999, -0.24696649610996246, -0.2032775729894638, -0.15958864986896515, -0.11589974164962769, -0.07221081852912903, -0.02852189540863037, 0.015167023986577988, 0.058855943381786346, 0.1025448590517044, 0.14623378217220306, 0.18992270529270172, 0.23361161351203918, 0.27730053663253784, 0.3209894597530365, 0.36467838287353516, 0.4083673059940338, 0.45205622911453247, 0.49574512243270874, 0.5394340753555298, 0.583122968673706, 0.6268118619918823, 0.6705008149147034, 0.7141897082328796, 0.7578786611557007, 0.801567554473877, 0.845256507396698, 0.8889454007148743, 0.9326343536376953, 0.9763232469558716, 1.0200121402740479, 1.0637010335922241, 1.1073899269104004, 1.1510789394378662, 1.1947678327560425, 1.2384567260742188, 1.282145619392395, 1.3258345127105713, 1.369523525238037]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 7.0, 10.0, 9.0, 17.0, 23.0, 37.0, 54.0, 83.0, 120.0, 180.0, 245.0, 389.0, 677.0, 1154.0, 1810.0, 2931.0, 5151.0, 9116.0, 16005.0, 29979.0, 58043.0, 120243.0, 235782.0, 265912.0, 148603.0, 71353.0, 35986.0, 19011.0, 10788.0, 5907.0, 3532.0, 2067.0, 1138.0, 789.0, 471.0, 321.0, 178.0, 153.0, 77.0, 58.0, 44.0, 22.0, 24.0, 19.0, 10.0, 10.0, 7.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.334716796875, -0.3236122131347656, -0.31250762939453125, -0.3014030456542969, -0.2902984619140625, -0.2791938781738281, -0.26808929443359375, -0.2569847106933594, -0.245880126953125, -0.23477554321289062, -0.22367095947265625, -0.21256637573242188, -0.2014617919921875, -0.19035720825195312, -0.17925262451171875, -0.16814804077148438, -0.15704345703125, -0.14593887329101562, -0.13483428955078125, -0.12372970581054688, -0.1126251220703125, -0.10152053833007812, -0.09041595458984375, -0.07931137084960938, -0.068206787109375, -0.057102203369140625, -0.04599761962890625, -0.034893035888671875, -0.0237884521484375, -0.012683868408203125, -0.00157928466796875, 0.009525299072265625, 0.0206298828125, 0.031734466552734375, 0.04283905029296875, 0.053943634033203125, 0.0650482177734375, 0.07615280151367188, 0.08725738525390625, 0.09836196899414062, 0.109466552734375, 0.12057113647460938, 0.13167572021484375, 0.14278030395507812, 0.1538848876953125, 0.16498947143554688, 0.17609405517578125, 0.18719863891601562, 0.19830322265625, 0.20940780639648438, 0.22051239013671875, 0.23161697387695312, 0.2427215576171875, 0.2538261413574219, 0.26493072509765625, 0.2760353088378906, 0.287139892578125, 0.2982444763183594, 0.30934906005859375, 0.3204536437988281, 0.3315582275390625, 0.3426628112792969, 0.35376739501953125, 0.3648719787597656, 0.3759765625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 4.0, 5.0, 6.0, 8.0, 11.0, 12.0, 8.0, 14.0, 11.0, 16.0, 15.0, 17.0, 22.0, 23.0, 24.0, 37.0, 37.0, 32.0, 46.0, 30.0, 35.0, 54.0, 30.0, 45.0, 41.0, 41.0, 42.0, 28.0, 26.0, 31.0, 30.0, 30.0, 37.0, 14.0, 20.0, 16.0, 24.0, 15.0, 16.0, 12.0, 8.0, 12.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.2391357421875, -0.23189926147460938, -0.22466278076171875, -0.21742630004882812, -0.2101898193359375, -0.20295333862304688, -0.19571685791015625, -0.18848037719726562, -0.181243896484375, -0.17400741577148438, -0.16677093505859375, -0.15953445434570312, -0.1522979736328125, -0.14506149291992188, -0.13782501220703125, -0.13058853149414062, -0.12335205078125, -0.11611557006835938, -0.10887908935546875, -0.10164260864257812, -0.0944061279296875, -0.08716964721679688, -0.07993316650390625, -0.07269668579101562, -0.065460205078125, -0.058223724365234375, -0.05098724365234375, -0.043750762939453125, -0.0365142822265625, -0.029277801513671875, -0.02204132080078125, -0.014804840087890625, -0.007568359375, -0.000331878662109375, 0.00690460205078125, 0.014141082763671875, 0.0213775634765625, 0.028614044189453125, 0.03585052490234375, 0.043087005615234375, 0.050323486328125, 0.057559967041015625, 0.06479644775390625, 0.07203292846679688, 0.0792694091796875, 0.08650588989257812, 0.09374237060546875, 0.10097885131835938, 0.10821533203125, 0.11545181274414062, 0.12268829345703125, 0.12992477416992188, 0.1371612548828125, 0.14439773559570312, 0.15163421630859375, 0.15887069702148438, 0.166107177734375, 0.17334365844726562, 0.18058013916015625, 0.18781661987304688, 0.1950531005859375, 0.20228958129882812, 0.20952606201171875, 0.21676254272460938, 0.2239990234375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 1.0, 4.0, 9.0, 7.0, 12.0, 11.0, 13.0, 17.0, 25.0, 55.0, 71.0, 106.0, 139.0, 220.0, 357.0, 572.0, 978.0, 1740.0, 3504.0, 7403.0, 16274.0, 39296.0, 109551.0, 337314.0, 345335.0, 113014.0, 40601.0, 16620.0, 7349.0, 3518.0, 1766.0, 1032.0, 547.0, 361.0, 254.0, 141.0, 90.0, 67.0, 54.0, 38.0, 22.0, 17.0, 12.0, 10.0, 9.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.5986328125, -0.5799331665039062, -0.5612335205078125, -0.5425338745117188, -0.523834228515625, -0.5051345825195312, -0.4864349365234375, -0.46773529052734375, -0.44903564453125, -0.43033599853515625, -0.4116363525390625, -0.39293670654296875, -0.374237060546875, -0.35553741455078125, -0.3368377685546875, -0.31813812255859375, -0.2994384765625, -0.28073883056640625, -0.2620391845703125, -0.24333953857421875, -0.224639892578125, -0.20594024658203125, -0.1872406005859375, -0.16854095458984375, -0.14984130859375, -0.13114166259765625, -0.1124420166015625, -0.09374237060546875, -0.075042724609375, -0.05634307861328125, -0.0376434326171875, -0.01894378662109375, -0.000244140625, 0.01845550537109375, 0.0371551513671875, 0.05585479736328125, 0.074554443359375, 0.09325408935546875, 0.1119537353515625, 0.13065338134765625, 0.14935302734375, 0.16805267333984375, 0.1867523193359375, 0.20545196533203125, 0.224151611328125, 0.24285125732421875, 0.2615509033203125, 0.28025054931640625, 0.2989501953125, 0.31764984130859375, 0.3363494873046875, 0.35504913330078125, 0.373748779296875, 0.39244842529296875, 0.4111480712890625, 0.42984771728515625, 0.44854736328125, 0.46724700927734375, 0.4859466552734375, 0.5046463012695312, 0.523345947265625, 0.5420455932617188, 0.5607452392578125, 0.5794448852539062, 0.59814453125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 3.0, 8.0, 7.0, 6.0, 9.0, 11.0, 18.0, 22.0, 25.0, 34.0, 22.0, 50.0, 55.0, 58.0, 54.0, 50.0, 55.0, 64.0, 60.0, 65.0, 37.0, 47.0, 45.0, 37.0, 32.0, 33.0, 21.0, 17.0, 11.0, 10.0, 13.0, 7.0, 6.0, 2.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.021484375, -0.9895782470703125, -0.957672119140625, -0.9257659912109375, -0.89385986328125, -0.8619537353515625, -0.830047607421875, -0.7981414794921875, -0.7662353515625, -0.7343292236328125, -0.702423095703125, -0.6705169677734375, -0.63861083984375, -0.6067047119140625, -0.574798583984375, -0.5428924560546875, -0.510986328125, -0.4790802001953125, -0.447174072265625, -0.4152679443359375, -0.38336181640625, -0.3514556884765625, -0.319549560546875, -0.2876434326171875, -0.2557373046875, -0.2238311767578125, -0.191925048828125, -0.1600189208984375, -0.12811279296875, -0.0962066650390625, -0.064300537109375, -0.0323944091796875, -0.00048828125, 0.0314178466796875, 0.063323974609375, 0.0952301025390625, 0.12713623046875, 0.1590423583984375, 0.190948486328125, 0.2228546142578125, 0.2547607421875, 0.2866668701171875, 0.318572998046875, 0.3504791259765625, 0.38238525390625, 0.4142913818359375, 0.446197509765625, 0.4781036376953125, 0.510009765625, 0.5419158935546875, 0.573822021484375, 0.6057281494140625, 0.63763427734375, 0.6695404052734375, 0.701446533203125, 0.7333526611328125, 0.7652587890625, 0.7971649169921875, 0.829071044921875, 0.8609771728515625, 0.89288330078125, 0.9247894287109375, 0.956695556640625, 0.9886016845703125, 1.0205078125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 1.0, 5.0, 3.0, 16.0, 11.0, 27.0, 33.0, 42.0, 90.0, 116.0, 186.0, 314.0, 431.0, 740.0, 1229.0, 2030.0, 3819.0, 7277.0, 15448.0, 39132.0, 131299.0, 395329.0, 308472.0, 88151.0, 28596.0, 12038.0, 5977.0, 3111.0, 1783.0, 1081.0, 688.0, 418.0, 235.0, 151.0, 92.0, 60.0, 40.0, 34.0, 19.0, 12.0, 6.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.27490234375, -0.2670135498046875, -0.259124755859375, -0.2512359619140625, -0.24334716796875, -0.2354583740234375, -0.227569580078125, -0.2196807861328125, -0.2117919921875, -0.2039031982421875, -0.196014404296875, -0.1881256103515625, -0.18023681640625, -0.1723480224609375, -0.164459228515625, -0.1565704345703125, -0.148681640625, -0.1407928466796875, -0.132904052734375, -0.1250152587890625, -0.11712646484375, -0.1092376708984375, -0.101348876953125, -0.0934600830078125, -0.0855712890625, -0.0776824951171875, -0.069793701171875, -0.0619049072265625, -0.05401611328125, -0.0461273193359375, -0.038238525390625, -0.0303497314453125, -0.0224609375, -0.0145721435546875, -0.006683349609375, 0.0012054443359375, 0.00909423828125, 0.0169830322265625, 0.024871826171875, 0.0327606201171875, 0.0406494140625, 0.0485382080078125, 0.056427001953125, 0.0643157958984375, 0.07220458984375, 0.0800933837890625, 0.087982177734375, 0.0958709716796875, 0.103759765625, 0.1116485595703125, 0.119537353515625, 0.1274261474609375, 0.13531494140625, 0.1432037353515625, 0.151092529296875, 0.1589813232421875, 0.1668701171875, 0.1747589111328125, 0.182647705078125, 0.1905364990234375, 0.19842529296875, 0.2063140869140625, 0.214202880859375, 0.2220916748046875, 0.22998046875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 7.0, 10.0, 13.0, 17.0, 25.0, 44.0, 77.0, 102.0, 134.0, 139.0, 143.0, 74.0, 54.0, 46.0, 27.0, 20.0, 10.0, 9.0, 7.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.065866470336914e-05, -8.78339633345604e-05, -8.500926196575165e-05, -8.21845605969429e-05, -7.935985922813416e-05, -7.653515785932541e-05, -7.371045649051666e-05, -7.088575512170792e-05, -6.806105375289917e-05, -6.523635238409042e-05, -6.241165101528168e-05, -5.958694964647293e-05, -5.6762248277664185e-05, -5.393754690885544e-05, -5.111284554004669e-05, -4.8288144171237946e-05, -4.54634428024292e-05, -4.263874143362045e-05, -3.9814040064811707e-05, -3.698933869600296e-05, -3.4164637327194214e-05, -3.133993595838547e-05, -2.851523458957672e-05, -2.5690533220767975e-05, -2.286583185195923e-05, -2.0041130483150482e-05, -1.7216429114341736e-05, -1.439172774553299e-05, -1.1567026376724243e-05, -8.742325007915497e-06, -5.9176236391067505e-06, -3.092922270298004e-06, -2.682209014892578e-07, 2.5564804673194885e-06, 5.381181836128235e-06, 8.205883204936981e-06, 1.1030584573745728e-05, 1.3855285942554474e-05, 1.667998731136322e-05, 1.9504688680171967e-05, 2.2329390048980713e-05, 2.515409141778946e-05, 2.7978792786598206e-05, 3.080349415540695e-05, 3.36281955242157e-05, 3.6452896893024445e-05, 3.927759826183319e-05, 4.210229963064194e-05, 4.4927000999450684e-05, 4.775170236825943e-05, 5.0576403737068176e-05, 5.340110510587692e-05, 5.622580647468567e-05, 5.9050507843494415e-05, 6.187520921230316e-05, 6.469991058111191e-05, 6.752461194992065e-05, 7.03493133187294e-05, 7.317401468753815e-05, 7.59987160563469e-05, 7.882341742515564e-05, 8.164811879396439e-05, 8.447282016277313e-05, 8.729752153158188e-05, 9.012222290039062e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 3.0, 6.0, 8.0, 6.0, 20.0, 33.0, 40.0, 47.0, 65.0, 102.0, 206.0, 285.0, 465.0, 746.0, 1307.0, 2147.0, 3779.0, 7216.0, 14626.0, 34178.0, 91998.0, 246695.0, 351661.0, 178712.0, 64701.0, 24879.0, 11416.0, 5516.0, 3084.0, 1781.0, 1075.0, 663.0, 379.0, 258.0, 154.0, 94.0, 63.0, 37.0, 25.0, 22.0, 14.0, 16.0, 9.0, 4.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.19482421875, -0.1887969970703125, -0.182769775390625, -0.1767425537109375, -0.17071533203125, -0.1646881103515625, -0.158660888671875, -0.1526336669921875, -0.1466064453125, -0.1405792236328125, -0.134552001953125, -0.1285247802734375, -0.12249755859375, -0.1164703369140625, -0.110443115234375, -0.1044158935546875, -0.098388671875, -0.0923614501953125, -0.086334228515625, -0.0803070068359375, -0.07427978515625, -0.0682525634765625, -0.062225341796875, -0.0561981201171875, -0.0501708984375, -0.0441436767578125, -0.038116455078125, -0.0320892333984375, -0.02606201171875, -0.0200347900390625, -0.014007568359375, -0.0079803466796875, -0.001953125, 0.0040740966796875, 0.010101318359375, 0.0161285400390625, 0.02215576171875, 0.0281829833984375, 0.034210205078125, 0.0402374267578125, 0.0462646484375, 0.0522918701171875, 0.058319091796875, 0.0643463134765625, 0.07037353515625, 0.0764007568359375, 0.082427978515625, 0.0884552001953125, 0.094482421875, 0.1005096435546875, 0.106536865234375, 0.1125640869140625, 0.11859130859375, 0.1246185302734375, 0.130645751953125, 0.1366729736328125, 0.1427001953125, 0.1487274169921875, 0.154754638671875, 0.1607818603515625, 0.16680908203125, 0.1728363037109375, 0.178863525390625, 0.1848907470703125, 0.19091796875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 5.0, 1.0, 11.0, 12.0, 9.0, 8.0, 14.0, 23.0, 40.0, 50.0, 61.0, 82.0, 94.0, 104.0, 94.0, 87.0, 70.0, 54.0, 53.0, 43.0, 22.0, 17.0, 13.0, 9.0, 6.0, 5.0, 5.0, 0.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.289306640625, -0.2807579040527344, -0.27220916748046875, -0.2636604309082031, -0.2551116943359375, -0.24656295776367188, -0.23801422119140625, -0.22946548461914062, -0.220916748046875, -0.21236801147460938, -0.20381927490234375, -0.19527053833007812, -0.1867218017578125, -0.17817306518554688, -0.16962432861328125, -0.16107559204101562, -0.15252685546875, -0.14397811889648438, -0.13542938232421875, -0.12688064575195312, -0.1183319091796875, -0.10978317260742188, -0.10123443603515625, -0.09268569946289062, -0.084136962890625, -0.07558822631835938, -0.06703948974609375, -0.058490753173828125, -0.0499420166015625, -0.041393280029296875, -0.03284454345703125, -0.024295806884765625, -0.0157470703125, -0.007198333740234375, 0.00135040283203125, 0.009899139404296875, 0.0184478759765625, 0.026996612548828125, 0.03554534912109375, 0.044094085693359375, 0.052642822265625, 0.061191558837890625, 0.06974029541015625, 0.07828903198242188, 0.0868377685546875, 0.09538650512695312, 0.10393524169921875, 0.11248397827148438, 0.12103271484375, 0.12958145141601562, 0.13813018798828125, 0.14667892456054688, 0.1552276611328125, 0.16377639770507812, 0.17232513427734375, 0.18087387084960938, 0.189422607421875, 0.19797134399414062, 0.20652008056640625, 0.21506881713867188, 0.2236175537109375, 0.23216629028320312, 0.24071502685546875, 0.24926376342773438, 0.2578125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 7.0, 5.0, 21.0, 44.0, 61.0, 79.0, 126.0, 144.0, 151.0, 129.0, 91.0, 67.0, 31.0, 13.0, 7.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.2687220573425293, -3.166614294052124, -3.0645065307617188, -2.9623987674713135, -2.860291004180908, -2.758183002471924, -2.6560752391815186, -2.5539674758911133, -2.451859712600708, -2.3497519493103027, -2.2476441860198975, -2.145536422729492, -2.043428421020508, -1.941320776939392, -1.8392128944396973, -1.737105131149292, -1.6349973678588867, -1.5328896045684814, -1.4307818412780762, -1.3286739587783813, -1.226566195487976, -1.1244584321975708, -1.022350549697876, -0.9202427864074707, -0.8181350231170654, -0.7160272598266602, -0.6139194369316101, -0.5118116140365601, -0.4097038507461548, -0.3075960874557495, -0.20548826456069946, -0.10338044166564941, -0.001272439956665039, 0.10083535313606262, 0.20294314622879028, 0.30505093932151794, 0.4071587324142456, 0.5092664957046509, 0.6113743185997009, 0.713482141494751, 0.8155899047851562, 0.9176976680755615, 1.0198054313659668, 1.1219133138656616, 1.224021077156067, 1.3261288404464722, 1.428236722946167, 1.5303444862365723, 1.6324522495269775, 1.7345600128173828, 1.836667776107788, 1.938775658607483, 2.0408835411071777, 2.142991065979004, 2.2450990676879883, 2.3472068309783936, 2.449314594268799, 2.551422357559204, 2.6535301208496094, 2.7556378841400146, 2.85774564743042, 2.9598536491394043, 3.0619614124298096, 3.164069175720215, 3.26617693901062]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 9.0, 8.0, 9.0, 11.0, 21.0, 20.0, 17.0, 26.0, 21.0, 26.0, 29.0, 34.0, 30.0, 39.0, 28.0, 42.0, 46.0, 37.0, 35.0, 31.0, 42.0, 48.0, 37.0, 33.0, 46.0, 26.0, 28.0, 27.0, 36.0, 20.0, 17.0, 22.0, 13.0, 14.0, 7.0, 13.0, 6.0, 7.0, 9.0, 2.0, 8.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.8717982769012451, -1.8183579444885254, -1.7649176120758057, -1.711477279663086, -1.6580369472503662, -1.6045966148376465, -1.5511561632156372, -1.4977158308029175, -1.4442754983901978, -1.390835165977478, -1.3373948335647583, -1.2839545011520386, -1.2305140495300293, -1.1770737171173096, -1.1236333847045898, -1.0701930522918701, -1.0167527198791504, -0.9633123874664307, -0.9098720550537109, -0.8564316630363464, -0.8029913306236267, -0.749550998210907, -0.6961106061935425, -0.6426702737808228, -0.589229941368103, -0.5357896089553833, -0.4823492467403412, -0.4289088845252991, -0.37546855211257935, -0.3220282196998596, -0.2685878574848175, -0.2151474952697754, -0.16170716285705566, -0.10826681554317474, -0.05482646822929382, -0.0013861209154129028, 0.05205422639846802, 0.10549455881118774, 0.15893492102622986, 0.21237528324127197, 0.2658156156539917, 0.3192559480667114, 0.37269631028175354, 0.42613667249679565, 0.4795770049095154, 0.5330173373222351, 0.5864577293395996, 0.6398980617523193, 0.6933383941650391, 0.7467787265777588, 0.8002190589904785, 0.853659451007843, 0.9070997834205627, 0.9605401158332825, 1.013980507850647, 1.0674208402633667, 1.1208611726760864, 1.1743015050888062, 1.2277418375015259, 1.2811821699142456, 1.3346226215362549, 1.3880629539489746, 1.4415032863616943, 1.494943618774414, 1.5483839511871338]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 1.0, 3.0, 13.0, 9.0, 7.0, 11.0, 21.0, 32.0, 40.0, 62.0, 70.0, 95.0, 173.0, 237.0, 393.0, 721.0, 1251.0, 2385.0, 4707.0, 9807.0, 22067.0, 57071.0, 185534.0, 695755.0, 1668815.0, 1085190.0, 315961.0, 87118.0, 30878.0, 12996.0, 6047.0, 3038.0, 1466.0, 897.0, 491.0, 317.0, 168.0, 126.0, 84.0, 55.0, 51.0, 29.0, 17.0, 20.0, 8.0, 12.0, 10.0, 7.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.314208984375, -0.3042945861816406, -0.29438018798828125, -0.2844657897949219, -0.2745513916015625, -0.2646369934082031, -0.25472259521484375, -0.24480819702148438, -0.234893798828125, -0.22497940063476562, -0.21506500244140625, -0.20515060424804688, -0.1952362060546875, -0.18532180786132812, -0.17540740966796875, -0.16549301147460938, -0.15557861328125, -0.14566421508789062, -0.13574981689453125, -0.12583541870117188, -0.1159210205078125, -0.10600662231445312, -0.09609222412109375, -0.08617782592773438, -0.076263427734375, -0.06634902954101562, -0.05643463134765625, -0.046520233154296875, -0.0366058349609375, -0.026691436767578125, -0.01677703857421875, -0.006862640380859375, 0.0030517578125, 0.012966156005859375, 0.02288055419921875, 0.032794952392578125, 0.0427093505859375, 0.052623748779296875, 0.06253814697265625, 0.07245254516601562, 0.082366943359375, 0.09228134155273438, 0.10219573974609375, 0.11211013793945312, 0.1220245361328125, 0.13193893432617188, 0.14185333251953125, 0.15176773071289062, 0.16168212890625, 0.17159652709960938, 0.18151092529296875, 0.19142532348632812, 0.2013397216796875, 0.21125411987304688, 0.22116851806640625, 0.23108291625976562, 0.240997314453125, 0.2509117126464844, 0.26082611083984375, 0.2707405090332031, 0.2806549072265625, 0.2905693054199219, 0.30048370361328125, 0.3103981018066406, 0.3203125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 9.0, 10.0, 7.0, 5.0, 22.0, 23.0, 26.0, 21.0, 21.0, 36.0, 34.0, 35.0, 29.0, 52.0, 46.0, 51.0, 57.0, 66.0, 51.0, 35.0, 50.0, 55.0, 35.0, 44.0, 27.0, 24.0, 19.0, 28.0, 17.0, 11.0, 14.0, 11.0, 7.0, 1.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26611328125, -0.25722503662109375, -0.2483367919921875, -0.23944854736328125, -0.230560302734375, -0.22167205810546875, -0.2127838134765625, -0.20389556884765625, -0.19500732421875, -0.18611907958984375, -0.1772308349609375, -0.16834259033203125, -0.159454345703125, -0.15056610107421875, -0.1416778564453125, -0.13278961181640625, -0.1239013671875, -0.11501312255859375, -0.1061248779296875, -0.09723663330078125, -0.088348388671875, -0.07946014404296875, -0.0705718994140625, -0.06168365478515625, -0.05279541015625, -0.04390716552734375, -0.0350189208984375, -0.02613067626953125, -0.017242431640625, -0.00835418701171875, 0.0005340576171875, 0.00942230224609375, 0.018310546875, 0.02719879150390625, 0.0360870361328125, 0.04497528076171875, 0.053863525390625, 0.06275177001953125, 0.0716400146484375, 0.08052825927734375, 0.08941650390625, 0.09830474853515625, 0.1071929931640625, 0.11608123779296875, 0.124969482421875, 0.13385772705078125, 0.1427459716796875, 0.15163421630859375, 0.1605224609375, 0.16941070556640625, 0.1782989501953125, 0.18718719482421875, 0.196075439453125, 0.20496368408203125, 0.2138519287109375, 0.22274017333984375, 0.23162841796875, 0.24051666259765625, 0.2494049072265625, 0.25829315185546875, 0.267181396484375, 0.27606964111328125, 0.2849578857421875, 0.29384613037109375, 0.302734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 19.0, 12.0, 36.0, 46.0, 69.0, 112.0, 201.0, 489.0, 1397.0, 5403.0, 30235.0, 293975.0, 3335582.0, 473647.0, 43229.0, 6948.0, 1726.0, 602.0, 217.0, 119.0, 72.0, 50.0, 27.0, 20.0, 15.0, 7.0, 11.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.1337890625, -1.1027984619140625, -1.071807861328125, -1.0408172607421875, -1.00982666015625, -0.9788360595703125, -0.947845458984375, -0.9168548583984375, -0.8858642578125, -0.8548736572265625, -0.823883056640625, -0.7928924560546875, -0.76190185546875, -0.7309112548828125, -0.699920654296875, -0.6689300537109375, -0.637939453125, -0.6069488525390625, -0.575958251953125, -0.5449676513671875, -0.51397705078125, -0.4829864501953125, -0.451995849609375, -0.4210052490234375, -0.3900146484375, -0.3590240478515625, -0.328033447265625, -0.2970428466796875, -0.26605224609375, -0.2350616455078125, -0.204071044921875, -0.1730804443359375, -0.14208984375, -0.1110992431640625, -0.080108642578125, -0.0491180419921875, -0.01812744140625, 0.0128631591796875, 0.043853759765625, 0.0748443603515625, 0.1058349609375, 0.1368255615234375, 0.167816162109375, 0.1988067626953125, 0.22979736328125, 0.2607879638671875, 0.291778564453125, 0.3227691650390625, 0.353759765625, 0.3847503662109375, 0.415740966796875, 0.4467315673828125, 0.47772216796875, 0.5087127685546875, 0.539703369140625, 0.5706939697265625, 0.6016845703125, 0.6326751708984375, 0.663665771484375, 0.6946563720703125, 0.72564697265625, 0.7566375732421875, 0.787628173828125, 0.8186187744140625, 0.849609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 11.0, 17.0, 23.0, 44.0, 70.0, 151.0, 291.0, 586.0, 1215.0, 865.0, 382.0, 182.0, 97.0, 65.0, 44.0, 12.0, 15.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91650390625, -0.8821945190429688, -0.8478851318359375, -0.8135757446289062, -0.779266357421875, -0.7449569702148438, -0.7106475830078125, -0.6763381958007812, -0.64202880859375, -0.6077194213867188, -0.5734100341796875, -0.5391006469726562, -0.504791259765625, -0.47048187255859375, -0.4361724853515625, -0.40186309814453125, -0.3675537109375, -0.33324432373046875, -0.2989349365234375, -0.26462554931640625, -0.230316162109375, -0.19600677490234375, -0.1616973876953125, -0.12738800048828125, -0.09307861328125, -0.05876922607421875, -0.0244598388671875, 0.00984954833984375, 0.044158935546875, 0.07846832275390625, 0.1127777099609375, 0.14708709716796875, 0.181396484375, 0.21570587158203125, 0.2500152587890625, 0.28432464599609375, 0.318634033203125, 0.35294342041015625, 0.3872528076171875, 0.42156219482421875, 0.45587158203125, 0.49018096923828125, 0.5244903564453125, 0.5587997436523438, 0.593109130859375, 0.6274185180664062, 0.6617279052734375, 0.6960372924804688, 0.7303466796875, 0.7646560668945312, 0.7989654541015625, 0.8332748413085938, 0.867584228515625, 0.9018936157226562, 0.9362030029296875, 0.9705123901367188, 1.00482177734375, 1.0391311645507812, 1.0734405517578125, 1.1077499389648438, 1.142059326171875, 1.1763687133789062, 1.2106781005859375, 1.2449874877929688, 1.279296875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 5.0, 18.0, 41.0, 57.0, 105.0, 106.0, 151.0, 140.0, 120.0, 109.0, 55.0, 39.0, 23.0, 11.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.128225803375244, -5.003354549407959, -4.878483295440674, -4.753612041473389, -4.6287407875061035, -4.503869533538818, -4.378998279571533, -4.25412654876709, -4.129255294799805, -4.0043840408325195, -3.8795127868652344, -3.754641532897949, -3.629770278930664, -3.504899024963379, -3.3800275325775146, -3.2551562786102295, -3.1302852630615234, -3.0054140090942383, -2.880542755126953, -2.755671501159668, -2.630800247192383, -2.5059289932250977, -2.3810575008392334, -2.2561862468719482, -2.131314992904663, -2.006443738937378, -1.8815724849700928, -1.756701111793518, -1.631829857826233, -1.5069586038589478, -1.382087230682373, -1.257215976715088, -1.1323447227478027, -1.0074734687805176, -0.8826021552085876, -0.7577308416366577, -0.6328595876693726, -0.5079883337020874, -0.38311702013015747, -0.25824570655822754, -0.13337445259094238, -0.008503168821334839, 0.1163681149482727, 0.24123939871788025, 0.3661106824874878, 0.49098193645477295, 0.6158532500267029, 0.7407245635986328, 0.865595817565918, 0.9904670715332031, 1.1153383255004883, 1.240209698677063, 1.3650809526443481, 1.4899522066116333, 1.614823579788208, 1.7396948337554932, 1.8645660877227783, 1.9894373416900635, 2.1143085956573486, 2.239179849624634, 2.364051342010498, 2.488922595977783, 2.6137938499450684, 2.7386651039123535, 2.8635363578796387]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 4.0, 8.0, 7.0, 11.0, 15.0, 12.0, 14.0, 16.0, 23.0, 23.0, 29.0, 29.0, 36.0, 39.0, 45.0, 34.0, 40.0, 50.0, 43.0, 36.0, 40.0, 46.0, 40.0, 33.0, 44.0, 30.0, 38.0, 43.0, 32.0, 16.0, 20.0, 17.0, 16.0, 19.0, 16.0, 9.0, 6.0, 4.0, 4.0, 5.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6856870651245117, -1.6349207162857056, -1.5841543674468994, -1.5333881378173828, -1.4826217889785767, -1.4318554401397705, -1.3810890913009644, -1.3303227424621582, -1.2795565128326416, -1.2287901639938354, -1.1780238151550293, -1.1272575855255127, -1.0764912366867065, -1.0257248878479004, -0.9749585390090942, -0.9241921901702881, -0.8734258413314819, -0.8226594924926758, -0.7718932032585144, -0.7211268544197083, -0.6703605651855469, -0.6195942163467407, -0.5688278675079346, -0.5180615186691284, -0.46729522943496704, -0.4165289103984833, -0.3657625913619995, -0.31499624252319336, -0.2642299234867096, -0.21346360445022583, -0.16269725561141968, -0.11193093657493591, -0.06116461753845215, -0.010398291051387787, 0.040368035435676575, 0.09113436937332153, 0.1419006884098053, 0.19266700744628906, 0.24343335628509521, 0.294199675321579, 0.34496599435806274, 0.3957323133945465, 0.4464986324310303, 0.4972649812698364, 0.5480313301086426, 0.598797619342804, 0.6495639681816101, 0.7003302574157715, 0.7510966062545776, 0.8018629550933838, 0.8526292443275452, 0.9033955931663513, 0.9541618824005127, 1.0049282312393188, 1.055694580078125, 1.1064609289169312, 1.1572272777557373, 1.2079936265945435, 1.2587599754333496, 1.3095262050628662, 1.3602925539016724, 1.4110589027404785, 1.4618252515792847, 1.5125916004180908, 1.5633578300476074]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 3.0, 16.0, 15.0, 19.0, 23.0, 44.0, 52.0, 91.0, 113.0, 211.0, 339.0, 565.0, 843.0, 1443.0, 2314.0, 3945.0, 6459.0, 10702.0, 17374.0, 28705.0, 46395.0, 73712.0, 109444.0, 145918.0, 160979.0, 143342.0, 107669.0, 71540.0, 45177.0, 28108.0, 16925.0, 10238.0, 6186.0, 3677.0, 2295.0, 1371.0, 824.0, 541.0, 345.0, 192.0, 152.0, 78.0, 64.0, 41.0, 21.0, 18.0, 16.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2159423828125, -0.2092914581298828, -0.20264053344726562, -0.19598960876464844, -0.18933868408203125, -0.18268775939941406, -0.17603683471679688, -0.1693859100341797, -0.1627349853515625, -0.1560840606689453, -0.14943313598632812, -0.14278221130371094, -0.13613128662109375, -0.12948036193847656, -0.12282943725585938, -0.11617851257324219, -0.109527587890625, -0.10287666320800781, -0.09622573852539062, -0.08957481384277344, -0.08292388916015625, -0.07627296447753906, -0.06962203979492188, -0.06297111511230469, -0.0563201904296875, -0.04966926574707031, -0.043018341064453125, -0.03636741638183594, -0.02971649169921875, -0.023065567016601562, -0.016414642333984375, -0.009763717651367188, -0.00311279296875, 0.0035381317138671875, 0.010189056396484375, 0.016839981079101562, 0.02349090576171875, 0.030141830444335938, 0.036792755126953125, 0.04344367980957031, 0.0500946044921875, 0.05674552917480469, 0.06339645385742188, 0.07004737854003906, 0.07669830322265625, 0.08334922790527344, 0.09000015258789062, 0.09665107727050781, 0.103302001953125, 0.10995292663574219, 0.11660385131835938, 0.12325477600097656, 0.12990570068359375, 0.13655662536621094, 0.14320755004882812, 0.1498584747314453, 0.1565093994140625, 0.1631603240966797, 0.16981124877929688, 0.17646217346191406, 0.18311309814453125, 0.18976402282714844, 0.19641494750976562, 0.2030658721923828, 0.209716796875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 13.0, 16.0, 10.0, 19.0, 17.0, 32.0, 22.0, 28.0, 32.0, 25.0, 41.0, 45.0, 45.0, 40.0, 43.0, 48.0, 40.0, 50.0, 36.0, 38.0, 32.0, 37.0, 44.0, 35.0, 28.0, 22.0, 18.0, 16.0, 24.0, 20.0, 15.0, 10.0, 14.0, 6.0, 6.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2666015625, -0.2584953308105469, -0.25038909912109375, -0.24228286743164062, -0.2341766357421875, -0.22607040405273438, -0.21796417236328125, -0.20985794067382812, -0.201751708984375, -0.19364547729492188, -0.18553924560546875, -0.17743301391601562, -0.1693267822265625, -0.16122055053710938, -0.15311431884765625, -0.14500808715820312, -0.13690185546875, -0.12879562377929688, -0.12068939208984375, -0.11258316040039062, -0.1044769287109375, -0.09637069702148438, -0.08826446533203125, -0.08015823364257812, -0.072052001953125, -0.06394577026367188, -0.05583953857421875, -0.047733306884765625, -0.0396270751953125, -0.031520843505859375, -0.02341461181640625, -0.015308380126953125, -0.0072021484375, 0.000904083251953125, 0.00901031494140625, 0.017116546630859375, 0.0252227783203125, 0.033329010009765625, 0.04143524169921875, 0.049541473388671875, 0.057647705078125, 0.06575393676757812, 0.07386016845703125, 0.08196640014648438, 0.0900726318359375, 0.09817886352539062, 0.10628509521484375, 0.11439132690429688, 0.12249755859375, 0.13060379028320312, 0.13871002197265625, 0.14681625366210938, 0.1549224853515625, 0.16302871704101562, 0.17113494873046875, 0.17924118041992188, 0.187347412109375, 0.19545364379882812, 0.20355987548828125, 0.21166610717773438, 0.2197723388671875, 0.22787857055664062, 0.23598480224609375, 0.24409103393554688, 0.252197265625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 11.0, 15.0, 26.0, 31.0, 73.0, 121.0, 173.0, 289.0, 565.0, 1120.0, 2203.0, 5266.0, 14176.0, 43147.0, 137343.0, 341004.0, 320323.0, 122622.0, 38072.0, 12744.0, 4837.0, 2078.0, 1033.0, 545.0, 281.0, 172.0, 98.0, 71.0, 23.0, 23.0, 17.0, 19.0, 12.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48583984375, -0.46781158447265625, -0.4497833251953125, -0.43175506591796875, -0.413726806640625, -0.39569854736328125, -0.3776702880859375, -0.35964202880859375, -0.34161376953125, -0.32358551025390625, -0.3055572509765625, -0.28752899169921875, -0.269500732421875, -0.25147247314453125, -0.2334442138671875, -0.21541595458984375, -0.1973876953125, -0.17935943603515625, -0.1613311767578125, -0.14330291748046875, -0.125274658203125, -0.10724639892578125, -0.0892181396484375, -0.07118988037109375, -0.05316162109375, -0.03513336181640625, -0.0171051025390625, 0.00092315673828125, 0.018951416015625, 0.03697967529296875, 0.0550079345703125, 0.07303619384765625, 0.091064453125, 0.10909271240234375, 0.1271209716796875, 0.14514923095703125, 0.163177490234375, 0.18120574951171875, 0.1992340087890625, 0.21726226806640625, 0.23529052734375, 0.25331878662109375, 0.2713470458984375, 0.28937530517578125, 0.307403564453125, 0.32543182373046875, 0.3434600830078125, 0.36148834228515625, 0.3795166015625, 0.39754486083984375, 0.4155731201171875, 0.43360137939453125, 0.451629638671875, 0.46965789794921875, 0.4876861572265625, 0.5057144165039062, 0.52374267578125, 0.5417709350585938, 0.5597991943359375, 0.5778274536132812, 0.595855712890625, 0.6138839721679688, 0.6319122314453125, 0.6499404907226562, 0.66796875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 6.0, 10.0, 10.0, 14.0, 15.0, 16.0, 33.0, 35.0, 21.0, 33.0, 44.0, 30.0, 60.0, 47.0, 46.0, 37.0, 66.0, 51.0, 58.0, 51.0, 43.0, 40.0, 39.0, 33.0, 29.0, 23.0, 24.0, 15.0, 18.0, 12.0, 16.0, 3.0, 4.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79736328125, -0.7682571411132812, -0.7391510009765625, -0.7100448608398438, -0.680938720703125, -0.6518325805664062, -0.6227264404296875, -0.5936203002929688, -0.56451416015625, -0.5354080200195312, -0.5063018798828125, -0.47719573974609375, -0.448089599609375, -0.41898345947265625, -0.3898773193359375, -0.36077117919921875, -0.3316650390625, -0.30255889892578125, -0.2734527587890625, -0.24434661865234375, -0.215240478515625, -0.18613433837890625, -0.1570281982421875, -0.12792205810546875, -0.09881591796875, -0.06970977783203125, -0.0406036376953125, -0.01149749755859375, 0.017608642578125, 0.04671478271484375, 0.0758209228515625, 0.10492706298828125, 0.134033203125, 0.16313934326171875, 0.1922454833984375, 0.22135162353515625, 0.250457763671875, 0.27956390380859375, 0.3086700439453125, 0.33777618408203125, 0.36688232421875, 0.39598846435546875, 0.4250946044921875, 0.45420074462890625, 0.483306884765625, 0.5124130249023438, 0.5415191650390625, 0.5706253051757812, 0.5997314453125, 0.6288375854492188, 0.6579437255859375, 0.6870498657226562, 0.716156005859375, 0.7452621459960938, 0.7743682861328125, 0.8034744262695312, 0.83258056640625, 0.8616867065429688, 0.8907928466796875, 0.9198989868164062, 0.949005126953125, 0.9781112670898438, 1.0072174072265625, 1.0363235473632812, 1.0654296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 10.0, 13.0, 15.0, 24.0, 32.0, 36.0, 62.0, 98.0, 135.0, 207.0, 287.0, 524.0, 806.0, 1268.0, 2268.0, 3850.0, 7078.0, 13371.0, 25126.0, 49898.0, 97691.0, 171935.0, 226987.0, 196238.0, 119767.0, 62626.0, 31688.0, 16315.0, 8831.0, 4664.0, 2635.0, 1531.0, 896.0, 572.0, 365.0, 227.0, 139.0, 103.0, 66.0, 51.0, 46.0, 17.0, 24.0, 14.0, 6.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.14453125, -0.14023780822753906, -0.13594436645507812, -0.1316509246826172, -0.12735748291015625, -0.12306404113769531, -0.11877059936523438, -0.11447715759277344, -0.1101837158203125, -0.10589027404785156, -0.10159683227539062, -0.09730339050292969, -0.09300994873046875, -0.08871650695800781, -0.08442306518554688, -0.08012962341308594, -0.075836181640625, -0.07154273986816406, -0.06724929809570312, -0.06295585632324219, -0.05866241455078125, -0.05436897277832031, -0.050075531005859375, -0.04578208923339844, -0.0414886474609375, -0.03719520568847656, -0.032901763916015625, -0.028608322143554688, -0.02431488037109375, -0.020021438598632812, -0.015727996826171875, -0.011434555053710938, -0.00714111328125, -0.0028476715087890625, 0.001445770263671875, 0.0057392120361328125, 0.01003265380859375, 0.014326095581054688, 0.018619537353515625, 0.022912979125976562, 0.0272064208984375, 0.03149986267089844, 0.035793304443359375, 0.04008674621582031, 0.04438018798828125, 0.04867362976074219, 0.052967071533203125, 0.05726051330566406, 0.061553955078125, 0.06584739685058594, 0.07014083862304688, 0.07443428039550781, 0.07872772216796875, 0.08302116394042969, 0.08731460571289062, 0.09160804748535156, 0.0959014892578125, 0.10019493103027344, 0.10448837280273438, 0.10878181457519531, 0.11307525634765625, 0.11736869812011719, 0.12166213989257812, 0.12595558166503906, 0.1302490234375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 8.0, 7.0, 11.0, 5.0, 14.0, 10.0, 27.0, 29.0, 26.0, 44.0, 56.0, 66.0, 83.0, 80.0, 92.0, 88.0, 76.0, 45.0, 47.0, 43.0, 28.0, 27.0, 27.0, 20.0, 15.0, 7.0, 7.0, 6.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.808208465576172e-05, -7.618311792612076e-05, -7.42841511964798e-05, -7.238518446683884e-05, -7.048621773719788e-05, -6.858725100755692e-05, -6.668828427791595e-05, -6.4789317548275e-05, -6.289035081863403e-05, -6.099138408899307e-05, -5.909241735935211e-05, -5.719345062971115e-05, -5.529448390007019e-05, -5.339551717042923e-05, -5.149655044078827e-05, -4.959758371114731e-05, -4.769861698150635e-05, -4.579965025186539e-05, -4.3900683522224426e-05, -4.2001716792583466e-05, -4.0102750062942505e-05, -3.8203783333301544e-05, -3.6304816603660583e-05, -3.440584987401962e-05, -3.250688314437866e-05, -3.06079164147377e-05, -2.870894968509674e-05, -2.680998295545578e-05, -2.491101622581482e-05, -2.301204949617386e-05, -2.1113082766532898e-05, -1.9214116036891937e-05, -1.7315149307250977e-05, -1.5416182577610016e-05, -1.3517215847969055e-05, -1.1618249118328094e-05, -9.719282388687134e-06, -7.820315659046173e-06, -5.921348929405212e-06, -4.022382199764252e-06, -2.123415470123291e-06, -2.2444874048233032e-07, 1.6745179891586304e-06, 3.573484718799591e-06, 5.472451448440552e-06, 7.3714181780815125e-06, 9.270384907722473e-06, 1.1169351637363434e-05, 1.3068318367004395e-05, 1.4967285096645355e-05, 1.6866251826286316e-05, 1.8765218555927277e-05, 2.0664185285568237e-05, 2.2563152015209198e-05, 2.446211874485016e-05, 2.636108547449112e-05, 2.826005220413208e-05, 3.015901893377304e-05, 3.2057985663414e-05, 3.395695239305496e-05, 3.585591912269592e-05, 3.7754885852336884e-05, 3.9653852581977844e-05, 4.1552819311618805e-05, 4.3451786041259766e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 8.0, 17.0, 25.0, 48.0, 63.0, 115.0, 204.0, 300.0, 500.0, 1032.0, 1882.0, 3760.0, 7215.0, 14969.0, 33298.0, 73263.0, 152067.0, 242623.0, 238662.0, 146319.0, 70632.0, 31956.0, 14890.0, 7089.0, 3548.0, 1816.0, 980.0, 514.0, 322.0, 159.0, 116.0, 49.0, 43.0, 24.0, 29.0, 4.0, 8.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.153564453125, -0.14876174926757812, -0.14395904541015625, -0.13915634155273438, -0.1343536376953125, -0.12955093383789062, -0.12474822998046875, -0.11994552612304688, -0.115142822265625, -0.11034011840820312, -0.10553741455078125, -0.10073471069335938, -0.0959320068359375, -0.09112930297851562, -0.08632659912109375, -0.08152389526367188, -0.07672119140625, -0.07191848754882812, -0.06711578369140625, -0.062313079833984375, -0.0575103759765625, -0.052707672119140625, -0.04790496826171875, -0.043102264404296875, -0.038299560546875, -0.033496856689453125, -0.02869415283203125, -0.023891448974609375, -0.0190887451171875, -0.014286041259765625, -0.00948333740234375, -0.004680633544921875, 0.0001220703125, 0.004924774169921875, 0.00972747802734375, 0.014530181884765625, 0.0193328857421875, 0.024135589599609375, 0.02893829345703125, 0.033740997314453125, 0.038543701171875, 0.043346405029296875, 0.04814910888671875, 0.052951812744140625, 0.0577545166015625, 0.06255722045898438, 0.06735992431640625, 0.07216262817382812, 0.07696533203125, 0.08176803588867188, 0.08657073974609375, 0.09137344360351562, 0.0961761474609375, 0.10097885131835938, 0.10578155517578125, 0.11058425903320312, 0.115386962890625, 0.12018966674804688, 0.12499237060546875, 0.12979507446289062, 0.1345977783203125, 0.13940048217773438, 0.14420318603515625, 0.14900588989257812, 0.15380859375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 13.0, 3.0, 10.0, 8.0, 14.0, 18.0, 19.0, 30.0, 28.0, 34.0, 43.0, 39.0, 52.0, 52.0, 53.0, 63.0, 41.0, 43.0, 49.0, 57.0, 40.0, 52.0, 33.0, 35.0, 26.0, 23.0, 20.0, 14.0, 13.0, 13.0, 18.0, 2.0, 2.0, 8.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.166015625, -0.16106414794921875, -0.1561126708984375, -0.15116119384765625, -0.146209716796875, -0.14125823974609375, -0.1363067626953125, -0.13135528564453125, -0.12640380859375, -0.12145233154296875, -0.1165008544921875, -0.11154937744140625, -0.106597900390625, -0.10164642333984375, -0.0966949462890625, -0.09174346923828125, -0.0867919921875, -0.08184051513671875, -0.0768890380859375, -0.07193756103515625, -0.066986083984375, -0.06203460693359375, -0.0570831298828125, -0.05213165283203125, -0.04718017578125, -0.04222869873046875, -0.0372772216796875, -0.03232574462890625, -0.027374267578125, -0.02242279052734375, -0.0174713134765625, -0.01251983642578125, -0.007568359375, -0.00261688232421875, 0.0023345947265625, 0.00728607177734375, 0.012237548828125, 0.01718902587890625, 0.0221405029296875, 0.02709197998046875, 0.03204345703125, 0.03699493408203125, 0.0419464111328125, 0.04689788818359375, 0.051849365234375, 0.05680084228515625, 0.0617523193359375, 0.06670379638671875, 0.0716552734375, 0.07660675048828125, 0.0815582275390625, 0.08650970458984375, 0.091461181640625, 0.09641265869140625, 0.1013641357421875, 0.10631561279296875, 0.11126708984375, 0.11621856689453125, 0.1211700439453125, 0.12612152099609375, 0.131072998046875, 0.13602447509765625, 0.1409759521484375, 0.14592742919921875, 0.15087890625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 8.0, 16.0, 27.0, 63.0, 134.0, 203.0, 211.0, 184.0, 95.0, 35.0, 15.0, 9.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7088701725006104, -2.5702273845672607, -2.431584596633911, -2.2929418087005615, -2.154299259185791, -2.0156564712524414, -1.8770136833190918, -1.7383708953857422, -1.5997281074523926, -1.461085319519043, -1.3224425315856934, -1.1837998628616333, -1.0451570749282837, -0.9065142869949341, -0.7678715586662292, -0.6292288303375244, -0.4905860424041748, -0.3519432842731476, -0.21330052614212036, -0.07465776801109314, 0.06398499011993408, 0.2026277780532837, 0.3412705063819885, 0.47991323471069336, 0.618556022644043, 0.7571988105773926, 0.8958415389060974, 1.0344842672348022, 1.1731270551681519, 1.3117698431015015, 1.4504125118255615, 1.5890552997589111, 1.7276978492736816, 1.8663406372070312, 2.004983425140381, 2.1436262130737305, 2.28226900100708, 2.4209117889404297, 2.5595543384552, 2.69819712638855, 2.8368399143218994, 2.975482702255249, 3.1141254901885986, 3.2527682781219482, 3.3914108276367188, 3.5300536155700684, 3.668696403503418, 3.8073391914367676, 3.945981979370117, 4.084624767303467, 4.223267555236816, 4.361910343170166, 4.500553131103516, 4.639195919036865, 4.777838706970215, 4.916481018066406, 5.055124282836914, 5.193767070770264, 5.332409858703613, 5.471052646636963, 5.6096954345703125, 5.748338222503662, 5.886981010437012, 6.025623321533203, 6.164266109466553]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 6.0, 7.0, 7.0, 7.0, 9.0, 5.0, 10.0, 21.0, 17.0, 30.0, 27.0, 37.0, 38.0, 33.0, 43.0, 38.0, 41.0, 49.0, 36.0, 41.0, 41.0, 37.0, 38.0, 34.0, 32.0, 33.0, 26.0, 45.0, 43.0, 30.0, 30.0, 20.0, 17.0, 8.0, 17.0, 9.0, 12.0, 3.0, 4.0, 5.0, 5.0, 3.0, 4.0, 5.0, 0.0, 3.0], "bins": [-2.3717381954193115, -2.308588981628418, -2.2454397678375244, -2.182290554046631, -2.119141101837158, -2.0559918880462646, -1.992842674255371, -1.9296934604644775, -1.866544246673584, -1.8033950328826904, -1.7402458190917969, -1.6770964860916138, -1.6139472723007202, -1.5507980585098267, -1.4876487255096436, -1.42449951171875, -1.3613502979278564, -1.298201084136963, -1.2350518703460693, -1.1719025373458862, -1.1087533235549927, -1.0456041097640991, -0.9824548363685608, -0.9193055629730225, -0.8561563491821289, -0.7930071353912354, -0.729857861995697, -0.6667085886001587, -0.6035593748092651, -0.5404101610183716, -0.47726088762283325, -0.4141116440296173, -0.35096216201782227, -0.2878129184246063, -0.22466367483139038, -0.16151443123817444, -0.0983651876449585, -0.035215944051742554, 0.02793329954147339, 0.09108254313468933, 0.15423178672790527, 0.21738103032112122, 0.28053027391433716, 0.3436795175075531, 0.40682876110076904, 0.469978004693985, 0.5331272482872009, 0.5962765216827393, 0.6594257354736328, 0.7225749492645264, 0.7857242226600647, 0.848873496055603, 0.9120227098464966, 0.9751719236373901, 1.0383212566375732, 1.1014704704284668, 1.1646196842193604, 1.227768898010254, 1.2909181118011475, 1.3540674448013306, 1.4172166585922241, 1.4803658723831177, 1.5435152053833008, 1.6066644191741943, 1.669813632965088]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 8.0, 6.0, 1.0, 6.0, 6.0, 8.0, 25.0, 21.0, 30.0, 43.0, 67.0, 89.0, 146.0, 208.0, 268.0, 409.0, 701.0, 1026.0, 1703.0, 2970.0, 5238.0, 10299.0, 22603.0, 63638.0, 261151.0, 1068990.0, 1780980.0, 729123.0, 161576.0, 45311.0, 17820.0, 8433.0, 4447.0, 2628.0, 1496.0, 967.0, 581.0, 395.0, 283.0, 169.0, 131.0, 78.0, 69.0, 45.0, 26.0, 22.0, 17.0, 12.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.368408203125, -0.3566551208496094, -0.34490203857421875, -0.3331489562988281, -0.3213958740234375, -0.3096427917480469, -0.29788970947265625, -0.2861366271972656, -0.274383544921875, -0.2626304626464844, -0.25087738037109375, -0.23912429809570312, -0.2273712158203125, -0.21561813354492188, -0.20386505126953125, -0.19211196899414062, -0.18035888671875, -0.16860580444335938, -0.15685272216796875, -0.14509963989257812, -0.1333465576171875, -0.12159347534179688, -0.10984039306640625, -0.09808731079101562, -0.086334228515625, -0.07458114624023438, -0.06282806396484375, -0.051074981689453125, -0.0393218994140625, -0.027568817138671875, -0.01581573486328125, -0.004062652587890625, 0.0076904296875, 0.019443511962890625, 0.03119659423828125, 0.042949676513671875, 0.0547027587890625, 0.06645584106445312, 0.07820892333984375, 0.08996200561523438, 0.101715087890625, 0.11346817016601562, 0.12522125244140625, 0.13697433471679688, 0.1487274169921875, 0.16048049926757812, 0.17223358154296875, 0.18398666381835938, 0.19573974609375, 0.20749282836914062, 0.21924591064453125, 0.23099899291992188, 0.2427520751953125, 0.2545051574707031, 0.26625823974609375, 0.2780113220214844, 0.289764404296875, 0.3015174865722656, 0.31327056884765625, 0.3250236511230469, 0.3367767333984375, 0.3485298156738281, 0.36028289794921875, 0.3720359802246094, 0.3837890625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 11.0, 5.0, 12.0, 12.0, 12.0, 20.0, 20.0, 20.0, 33.0, 26.0, 31.0, 39.0, 30.0, 45.0, 36.0, 34.0, 35.0, 46.0, 56.0, 34.0, 47.0, 39.0, 37.0, 49.0, 42.0, 31.0, 31.0, 26.0, 21.0, 21.0, 20.0, 14.0, 9.0, 15.0, 11.0, 8.0, 7.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.3369140625, -0.3276634216308594, -0.31841278076171875, -0.3091621398925781, -0.2999114990234375, -0.2906608581542969, -0.28141021728515625, -0.2721595764160156, -0.262908935546875, -0.2536582946777344, -0.24440765380859375, -0.23515701293945312, -0.2259063720703125, -0.21665573120117188, -0.20740509033203125, -0.19815444946289062, -0.18890380859375, -0.17965316772460938, -0.17040252685546875, -0.16115188598632812, -0.1519012451171875, -0.14265060424804688, -0.13339996337890625, -0.12414932250976562, -0.114898681640625, -0.10564804077148438, -0.09639739990234375, -0.08714675903320312, -0.0778961181640625, -0.06864547729492188, -0.05939483642578125, -0.050144195556640625, -0.0408935546875, -0.031642913818359375, -0.02239227294921875, -0.013141632080078125, -0.0038909912109375, 0.005359649658203125, 0.01461029052734375, 0.023860931396484375, 0.033111572265625, 0.042362213134765625, 0.05161285400390625, 0.060863494873046875, 0.0701141357421875, 0.07936477661132812, 0.08861541748046875, 0.09786605834960938, 0.10711669921875, 0.11636734008789062, 0.12561798095703125, 0.13486862182617188, 0.1441192626953125, 0.15336990356445312, 0.16262054443359375, 0.17187118530273438, 0.181121826171875, 0.19037246704101562, 0.19962310791015625, 0.20887374877929688, 0.2181243896484375, 0.22737503051757812, 0.23662567138671875, 0.24587631225585938, 0.255126953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 12.0, 15.0, 21.0, 32.0, 58.0, 69.0, 138.0, 203.0, 415.0, 987.0, 2473.0, 8124.0, 34527.0, 258108.0, 3275956.0, 540105.0, 55632.0, 11605.0, 3381.0, 1268.0, 506.0, 233.0, 121.0, 91.0, 53.0, 40.0, 28.0, 15.0, 11.0, 14.0, 11.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0537109375, -1.024139404296875, -0.99456787109375, -0.964996337890625, -0.9354248046875, -0.905853271484375, -0.87628173828125, -0.846710205078125, -0.817138671875, -0.787567138671875, -0.75799560546875, -0.728424072265625, -0.6988525390625, -0.669281005859375, -0.63970947265625, -0.610137939453125, -0.58056640625, -0.550994873046875, -0.52142333984375, -0.491851806640625, -0.4622802734375, -0.432708740234375, -0.40313720703125, -0.373565673828125, -0.343994140625, -0.314422607421875, -0.28485107421875, -0.255279541015625, -0.2257080078125, -0.196136474609375, -0.16656494140625, -0.136993408203125, -0.107421875, -0.077850341796875, -0.04827880859375, -0.018707275390625, 0.0108642578125, 0.040435791015625, 0.07000732421875, 0.099578857421875, 0.129150390625, 0.158721923828125, 0.18829345703125, 0.217864990234375, 0.2474365234375, 0.277008056640625, 0.30657958984375, 0.336151123046875, 0.36572265625, 0.395294189453125, 0.42486572265625, 0.454437255859375, 0.4840087890625, 0.513580322265625, 0.54315185546875, 0.572723388671875, 0.602294921875, 0.631866455078125, 0.66143798828125, 0.691009521484375, 0.7205810546875, 0.750152587890625, 0.77972412109375, 0.809295654296875, 0.8388671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 4.0, 5.0, 14.0, 18.0, 36.0, 45.0, 71.0, 150.0, 300.0, 645.0, 1188.0, 827.0, 356.0, 161.0, 96.0, 47.0, 36.0, 23.0, 24.0, 8.0, 7.0, 2.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86767578125, -0.8351211547851562, -0.8025665283203125, -0.7700119018554688, -0.737457275390625, -0.7049026489257812, -0.6723480224609375, -0.6397933959960938, -0.60723876953125, -0.5746841430664062, -0.5421295166015625, -0.5095748901367188, -0.477020263671875, -0.44446563720703125, -0.4119110107421875, -0.37935638427734375, -0.3468017578125, -0.31424713134765625, -0.2816925048828125, -0.24913787841796875, -0.216583251953125, -0.18402862548828125, -0.1514739990234375, -0.11891937255859375, -0.08636474609375, -0.05381011962890625, -0.0212554931640625, 0.01129913330078125, 0.043853759765625, 0.07640838623046875, 0.1089630126953125, 0.14151763916015625, 0.174072265625, 0.20662689208984375, 0.2391815185546875, 0.27173614501953125, 0.304290771484375, 0.33684539794921875, 0.3694000244140625, 0.40195465087890625, 0.43450927734375, 0.46706390380859375, 0.4996185302734375, 0.5321731567382812, 0.564727783203125, 0.5972824096679688, 0.6298370361328125, 0.6623916625976562, 0.6949462890625, 0.7275009155273438, 0.7600555419921875, 0.7926101684570312, 0.825164794921875, 0.8577194213867188, 0.8902740478515625, 0.9228286743164062, 0.95538330078125, 0.9879379272460938, 1.0204925537109375, 1.0530471801757812, 1.085601806640625, 1.1181564331054688, 1.1507110595703125, 1.1832656860351562, 1.2158203125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 15.0, 19.0, 59.0, 107.0, 157.0, 207.0, 182.0, 118.0, 60.0, 35.0, 14.0, 13.0, 6.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.482821464538574, -4.320553302764893, -4.158285617828369, -3.9960174560546875, -3.833749532699585, -3.6714816093444824, -3.509213447570801, -3.3469455242156982, -3.1846776008605957, -3.022409677505493, -2.8601417541503906, -2.697873592376709, -2.5356056690216064, -2.373337745666504, -2.2110695838928223, -2.0488016605377197, -1.8865337371826172, -1.7242658138275146, -1.5619977712631226, -1.3997297286987305, -1.237461805343628, -1.0751938819885254, -0.9129258394241333, -0.7506577968597412, -0.5883898735046387, -0.42612189054489136, -0.26385390758514404, -0.10158592462539673, 0.060682058334350586, 0.2229500412940979, 0.3852180242538452, 0.5474860668182373, 0.7097539901733398, 0.8720219731330872, 1.0342899560928345, 1.1965579986572266, 1.358825922012329, 1.5210938453674316, 1.6833618879318237, 1.8456299304962158, 2.0078978538513184, 2.170165777206421, 2.3324337005615234, 2.494701862335205, 2.6569697856903076, 2.81923770904541, 2.981505870819092, 3.1437737941741943, 3.306041717529297, 3.4683096408843994, 3.630577564239502, 3.7928457260131836, 3.955113649368286, 4.117381572723389, 4.27964973449707, 4.441917419433594, 4.604185581207275, 4.766453742980957, 4.9287214279174805, 5.090989589691162, 5.253257751464844, 5.415525436401367, 5.577793598175049, 5.7400617599487305, 5.902329444885254]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 5.0, 10.0, 6.0, 7.0, 15.0, 17.0, 12.0, 13.0, 22.0, 20.0, 25.0, 28.0, 31.0, 26.0, 34.0, 46.0, 38.0, 42.0, 32.0, 36.0, 41.0, 41.0, 47.0, 37.0, 34.0, 28.0, 38.0, 34.0, 27.0, 25.0, 32.0, 21.0, 20.0, 25.0, 16.0, 12.0, 16.0, 8.0, 6.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0], "bins": [-1.791930079460144, -1.741934895515442, -1.6919398307800293, -1.6419446468353271, -1.591949462890625, -1.5419542789459229, -1.4919590950012207, -1.441964030265808, -1.391968846321106, -1.3419736623764038, -1.2919785976409912, -1.241983413696289, -1.191988229751587, -1.1419930458068848, -1.0919978618621826, -1.04200279712677, -0.9920076131820679, -0.9420124292373657, -0.8920173048973083, -0.842022180557251, -0.7920269966125488, -0.7420318126678467, -0.6920366883277893, -0.6420415639877319, -0.5920463800430298, -0.5420511960983276, -0.49205607175827026, -0.4420609176158905, -0.39206576347351074, -0.342070609331131, -0.2920754551887512, -0.24208030104637146, -0.1920851469039917, -0.14208999276161194, -0.09209483861923218, -0.04209968447685242, 0.007895469665527344, 0.057890623807907104, 0.10788577795028687, 0.15788093209266663, 0.2078760862350464, 0.25787124037742615, 0.3078663945198059, 0.35786154866218567, 0.40785670280456543, 0.4578518569469452, 0.507847011089325, 0.5578421354293823, 0.6078373193740845, 0.6578325033187866, 0.707827627658844, 0.7578227519989014, 0.8078179359436035, 0.8578131198883057, 0.907808244228363, 0.9578033685684204, 1.0077985525131226, 1.0577937364578247, 1.1077888011932373, 1.1577839851379395, 1.2077791690826416, 1.2577743530273438, 1.307769536972046, 1.3577646017074585, 1.4077597856521606]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 9.0, 13.0, 5.0, 16.0, 21.0, 34.0, 53.0, 72.0, 121.0, 169.0, 215.0, 373.0, 628.0, 942.0, 1625.0, 2571.0, 4487.0, 7714.0, 13643.0, 24648.0, 46155.0, 88509.0, 161081.0, 230709.0, 202649.0, 120598.0, 64529.0, 33811.0, 18067.0, 10230.0, 5869.0, 3510.0, 2022.0, 1193.0, 800.0, 486.0, 320.0, 209.0, 156.0, 99.0, 61.0, 30.0, 30.0, 20.0, 16.0, 9.0, 5.0, 8.0, 4.0, 2.0, 1.0, 5.0, 0.0, 2.0, 3.0, 2.0], "bins": [-0.360595703125, -0.3492393493652344, -0.33788299560546875, -0.3265266418457031, -0.3151702880859375, -0.3038139343261719, -0.29245758056640625, -0.2811012268066406, -0.269744873046875, -0.2583885192871094, -0.24703216552734375, -0.23567581176757812, -0.2243194580078125, -0.21296310424804688, -0.20160675048828125, -0.19025039672851562, -0.17889404296875, -0.16753768920898438, -0.15618133544921875, -0.14482498168945312, -0.1334686279296875, -0.12211227416992188, -0.11075592041015625, -0.09939956665039062, -0.088043212890625, -0.07668685913085938, -0.06533050537109375, -0.053974151611328125, -0.0426177978515625, -0.031261444091796875, -0.01990509033203125, -0.008548736572265625, 0.0028076171875, 0.014163970947265625, 0.02552032470703125, 0.036876678466796875, 0.0482330322265625, 0.059589385986328125, 0.07094573974609375, 0.08230209350585938, 0.093658447265625, 0.10501480102539062, 0.11637115478515625, 0.12772750854492188, 0.1390838623046875, 0.15044021606445312, 0.16179656982421875, 0.17315292358398438, 0.18450927734375, 0.19586563110351562, 0.20722198486328125, 0.21857833862304688, 0.2299346923828125, 0.24129104614257812, 0.25264739990234375, 0.2640037536621094, 0.275360107421875, 0.2867164611816406, 0.29807281494140625, 0.3094291687011719, 0.3207855224609375, 0.3321418762207031, 0.34349822998046875, 0.3548545837402344, 0.3662109375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 3.0, 9.0, 11.0, 7.0, 13.0, 13.0, 17.0, 32.0, 28.0, 30.0, 35.0, 31.0, 37.0, 40.0, 30.0, 48.0, 44.0, 41.0, 43.0, 54.0, 55.0, 45.0, 44.0, 33.0, 36.0, 42.0, 25.0, 30.0, 23.0, 24.0, 15.0, 9.0, 10.0, 7.0, 10.0, 7.0, 4.0, 5.0, 5.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3505859375, -0.3406524658203125, -0.330718994140625, -0.3207855224609375, -0.31085205078125, -0.3009185791015625, -0.290985107421875, -0.2810516357421875, -0.2711181640625, -0.2611846923828125, -0.251251220703125, -0.2413177490234375, -0.23138427734375, -0.2214508056640625, -0.211517333984375, -0.2015838623046875, -0.191650390625, -0.1817169189453125, -0.171783447265625, -0.1618499755859375, -0.15191650390625, -0.1419830322265625, -0.132049560546875, -0.1221160888671875, -0.1121826171875, -0.1022491455078125, -0.092315673828125, -0.0823822021484375, -0.07244873046875, -0.0625152587890625, -0.052581787109375, -0.0426483154296875, -0.03271484375, -0.0227813720703125, -0.012847900390625, -0.0029144287109375, 0.00701904296875, 0.0169525146484375, 0.026885986328125, 0.0368194580078125, 0.0467529296875, 0.0566864013671875, 0.066619873046875, 0.0765533447265625, 0.08648681640625, 0.0964202880859375, 0.106353759765625, 0.1162872314453125, 0.126220703125, 0.1361541748046875, 0.146087646484375, 0.1560211181640625, 0.16595458984375, 0.1758880615234375, 0.185821533203125, 0.1957550048828125, 0.2056884765625, 0.2156219482421875, 0.225555419921875, 0.2354888916015625, 0.24542236328125, 0.2553558349609375, 0.265289306640625, 0.2752227783203125, 0.28515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 2.0, 4.0, 8.0, 10.0, 11.0, 18.0, 31.0, 39.0, 75.0, 105.0, 143.0, 239.0, 360.0, 624.0, 1130.0, 2159.0, 4139.0, 8295.0, 18229.0, 41964.0, 109888.0, 282984.0, 336760.0, 143916.0, 53653.0, 22663.0, 10379.0, 4881.0, 2522.0, 1302.0, 758.0, 444.0, 298.0, 180.0, 125.0, 70.0, 37.0, 28.0, 19.0, 17.0, 15.0, 13.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.607421875, -0.5879135131835938, -0.5684051513671875, -0.5488967895507812, -0.529388427734375, -0.5098800659179688, -0.4903717041015625, -0.47086334228515625, -0.45135498046875, -0.43184661865234375, -0.4123382568359375, -0.39282989501953125, -0.373321533203125, -0.35381317138671875, -0.3343048095703125, -0.31479644775390625, -0.2952880859375, -0.27577972412109375, -0.2562713623046875, -0.23676300048828125, -0.217254638671875, -0.19774627685546875, -0.1782379150390625, -0.15872955322265625, -0.13922119140625, -0.11971282958984375, -0.1002044677734375, -0.08069610595703125, -0.061187744140625, -0.04167938232421875, -0.0221710205078125, -0.00266265869140625, 0.016845703125, 0.03635406494140625, 0.0558624267578125, 0.07537078857421875, 0.094879150390625, 0.11438751220703125, 0.1338958740234375, 0.15340423583984375, 0.17291259765625, 0.19242095947265625, 0.2119293212890625, 0.23143768310546875, 0.250946044921875, 0.27045440673828125, 0.2899627685546875, 0.30947113037109375, 0.3289794921875, 0.34848785400390625, 0.3679962158203125, 0.38750457763671875, 0.407012939453125, 0.42652130126953125, 0.4460296630859375, 0.46553802490234375, 0.48504638671875, 0.5045547485351562, 0.5240631103515625, 0.5435714721679688, 0.563079833984375, 0.5825881958007812, 0.6020965576171875, 0.6216049194335938, 0.64111328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 5.0, 9.0, 9.0, 11.0, 3.0, 11.0, 8.0, 14.0, 19.0, 18.0, 20.0, 23.0, 25.0, 31.0, 23.0, 34.0, 39.0, 50.0, 54.0, 40.0, 45.0, 51.0, 50.0, 36.0, 36.0, 50.0, 44.0, 36.0, 37.0, 24.0, 22.0, 25.0, 11.0, 18.0, 10.0, 12.0, 12.0, 6.0, 6.0, 4.0, 4.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.083984375, -1.0531997680664062, -1.0224151611328125, -0.9916305541992188, -0.960845947265625, -0.9300613403320312, -0.8992767333984375, -0.8684921264648438, -0.83770751953125, -0.8069229125976562, -0.7761383056640625, -0.7453536987304688, -0.714569091796875, -0.6837844848632812, -0.6529998779296875, -0.6222152709960938, -0.5914306640625, -0.5606460571289062, -0.5298614501953125, -0.49907684326171875, -0.468292236328125, -0.43750762939453125, -0.4067230224609375, -0.37593841552734375, -0.34515380859375, -0.31436920166015625, -0.2835845947265625, -0.25279998779296875, -0.222015380859375, -0.19123077392578125, -0.1604461669921875, -0.12966156005859375, -0.098876953125, -0.06809234619140625, -0.0373077392578125, -0.00652313232421875, 0.024261474609375, 0.05504608154296875, 0.0858306884765625, 0.11661529541015625, 0.14739990234375, 0.17818450927734375, 0.2089691162109375, 0.23975372314453125, 0.270538330078125, 0.30132293701171875, 0.3321075439453125, 0.36289215087890625, 0.3936767578125, 0.42446136474609375, 0.4552459716796875, 0.48603057861328125, 0.516815185546875, 0.5475997924804688, 0.5783843994140625, 0.6091690063476562, 0.63995361328125, 0.6707382202148438, 0.7015228271484375, 0.7323074340820312, 0.763092041015625, 0.7938766479492188, 0.8246612548828125, 0.8554458618164062, 0.88623046875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 9.0, 14.0, 9.0, 20.0, 27.0, 37.0, 61.0, 67.0, 118.0, 177.0, 235.0, 345.0, 491.0, 796.0, 1255.0, 2191.0, 4016.0, 7939.0, 17320.0, 44466.0, 127406.0, 305916.0, 316078.0, 135437.0, 47337.0, 18164.0, 8202.0, 4219.0, 2404.0, 1347.0, 865.0, 488.0, 346.0, 227.0, 159.0, 107.0, 70.0, 54.0, 34.0, 35.0, 17.0, 14.0, 10.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.2303466796875, -0.22292327880859375, -0.2154998779296875, -0.20807647705078125, -0.200653076171875, -0.19322967529296875, -0.1858062744140625, -0.17838287353515625, -0.17095947265625, -0.16353607177734375, -0.1561126708984375, -0.14868927001953125, -0.141265869140625, -0.13384246826171875, -0.1264190673828125, -0.11899566650390625, -0.111572265625, -0.10414886474609375, -0.0967254638671875, -0.08930206298828125, -0.081878662109375, -0.07445526123046875, -0.0670318603515625, -0.05960845947265625, -0.05218505859375, -0.04476165771484375, -0.0373382568359375, -0.02991485595703125, -0.022491455078125, -0.01506805419921875, -0.0076446533203125, -0.00022125244140625, 0.0072021484375, 0.01462554931640625, 0.0220489501953125, 0.02947235107421875, 0.036895751953125, 0.04431915283203125, 0.0517425537109375, 0.05916595458984375, 0.06658935546875, 0.07401275634765625, 0.0814361572265625, 0.08885955810546875, 0.096282958984375, 0.10370635986328125, 0.1111297607421875, 0.11855316162109375, 0.1259765625, 0.13339996337890625, 0.1408233642578125, 0.14824676513671875, 0.155670166015625, 0.16309356689453125, 0.1705169677734375, 0.17794036865234375, 0.18536376953125, 0.19278717041015625, 0.2002105712890625, 0.20763397216796875, 0.215057373046875, 0.22248077392578125, 0.2299041748046875, 0.23732757568359375, 0.2447509765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 13.0, 11.0, 16.0, 26.0, 39.0, 58.0, 80.0, 104.0, 115.0, 112.0, 120.0, 77.0, 65.0, 42.0, 38.0, 24.0, 14.0, 9.0, 4.0, 8.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.85264778137207e-05, -9.529106318950653e-05, -9.205564856529236e-05, -8.882023394107819e-05, -8.558481931686401e-05, -8.234940469264984e-05, -7.911399006843567e-05, -7.58785754442215e-05, -7.264316082000732e-05, -6.940774619579315e-05, -6.617233157157898e-05, -6.293691694736481e-05, -5.9701502323150635e-05, -5.646608769893646e-05, -5.323067307472229e-05, -4.999525845050812e-05, -4.6759843826293945e-05, -4.352442920207977e-05, -4.02890145778656e-05, -3.705359995365143e-05, -3.3818185329437256e-05, -3.0582770705223083e-05, -2.734735608100891e-05, -2.411194145679474e-05, -2.0876526832580566e-05, -1.7641112208366394e-05, -1.4405697584152222e-05, -1.117028295993805e-05, -7.934868335723877e-06, -4.699453711509705e-06, -1.4640390872955322e-06, 1.7713755369186401e-06, 5.0067901611328125e-06, 8.242204785346985e-06, 1.1477619409561157e-05, 1.471303403377533e-05, 1.7948448657989502e-05, 2.1183863282203674e-05, 2.4419277906417847e-05, 2.765469253063202e-05, 3.089010715484619e-05, 3.4125521779060364e-05, 3.7360936403274536e-05, 4.059635102748871e-05, 4.383176565170288e-05, 4.706718027591705e-05, 5.0302594900131226e-05, 5.35380095243454e-05, 5.677342414855957e-05, 6.000883877277374e-05, 6.324425339698792e-05, 6.647966802120209e-05, 6.971508264541626e-05, 7.295049726963043e-05, 7.61859118938446e-05, 7.942132651805878e-05, 8.265674114227295e-05, 8.589215576648712e-05, 8.91275703907013e-05, 9.236298501491547e-05, 9.559839963912964e-05, 9.883381426334381e-05, 0.00010206922888755798, 0.00010530464351177216, 0.00010854005813598633]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 8.0, 4.0, 7.0, 8.0, 11.0, 22.0, 42.0, 54.0, 94.0, 156.0, 233.0, 444.0, 805.0, 1571.0, 3192.0, 7022.0, 17660.0, 49144.0, 139472.0, 309749.0, 304537.0, 135665.0, 48120.0, 17289.0, 6747.0, 3077.0, 1531.0, 789.0, 466.0, 233.0, 154.0, 102.0, 53.0, 25.0, 28.0, 14.0, 8.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.267822265625, -0.2603797912597656, -0.25293731689453125, -0.24549484252929688, -0.2380523681640625, -0.23060989379882812, -0.22316741943359375, -0.21572494506835938, -0.208282470703125, -0.20083999633789062, -0.19339752197265625, -0.18595504760742188, -0.1785125732421875, -0.17107009887695312, -0.16362762451171875, -0.15618515014648438, -0.14874267578125, -0.14130020141601562, -0.13385772705078125, -0.12641525268554688, -0.1189727783203125, -0.11153030395507812, -0.10408782958984375, -0.09664535522460938, -0.089202880859375, -0.08176040649414062, -0.07431793212890625, -0.06687545776367188, -0.0594329833984375, -0.051990509033203125, -0.04454803466796875, -0.037105560302734375, -0.0296630859375, -0.022220611572265625, -0.01477813720703125, -0.007335662841796875, 0.0001068115234375, 0.007549285888671875, 0.01499176025390625, 0.022434234619140625, 0.029876708984375, 0.037319183349609375, 0.04476165771484375, 0.052204132080078125, 0.0596466064453125, 0.06708908081054688, 0.07453155517578125, 0.08197402954101562, 0.08941650390625, 0.09685897827148438, 0.10430145263671875, 0.11174392700195312, 0.1191864013671875, 0.12662887573242188, 0.13407135009765625, 0.14151382446289062, 0.148956298828125, 0.15639877319335938, 0.16384124755859375, 0.17128372192382812, 0.1787261962890625, 0.18616867065429688, 0.19361114501953125, 0.20105361938476562, 0.20849609375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 1.0, 6.0, 4.0, 7.0, 9.0, 10.0, 21.0, 38.0, 33.0, 52.0, 53.0, 58.0, 72.0, 89.0, 97.0, 83.0, 82.0, 66.0, 45.0, 39.0, 27.0, 20.0, 18.0, 11.0, 11.0, 10.0, 10.0, 0.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.30517578125, -0.29670143127441406, -0.2882270812988281, -0.2797527313232422, -0.27127838134765625, -0.2628040313720703, -0.2543296813964844, -0.24585533142089844, -0.2373809814453125, -0.22890663146972656, -0.22043228149414062, -0.2119579315185547, -0.20348358154296875, -0.1950092315673828, -0.18653488159179688, -0.17806053161621094, -0.169586181640625, -0.16111183166503906, -0.15263748168945312, -0.1441631317138672, -0.13568878173828125, -0.1272144317626953, -0.11874008178710938, -0.11026573181152344, -0.1017913818359375, -0.09331703186035156, -0.08484268188476562, -0.07636833190917969, -0.06789398193359375, -0.05941963195800781, -0.050945281982421875, -0.04247093200683594, -0.03399658203125, -0.025522232055664062, -0.017047882080078125, -0.008573532104492188, -9.918212890625e-05, 0.008375167846679688, 0.016849517822265625, 0.025323867797851562, 0.0337982177734375, 0.04227256774902344, 0.050746917724609375, 0.05922126770019531, 0.06769561767578125, 0.07616996765136719, 0.08464431762695312, 0.09311866760253906, 0.101593017578125, 0.11006736755371094, 0.11854171752929688, 0.1270160675048828, 0.13549041748046875, 0.1439647674560547, 0.15243911743164062, 0.16091346740722656, 0.1693878173828125, 0.17786216735839844, 0.18633651733398438, 0.1948108673095703, 0.20328521728515625, 0.2117595672607422, 0.22023391723632812, 0.22870826721191406, 0.2371826171875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 6.0, 11.0, 29.0, 66.0, 108.0, 207.0, 204.0, 168.0, 109.0, 42.0, 28.0, 20.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.675130844116211, -4.51101016998291, -4.346889495849609, -4.182768821716309, -4.018648147583008, -3.854527473449707, -3.690406560897827, -3.5262858867645264, -3.3621652126312256, -3.198044538497925, -3.033923864364624, -2.8698031902313232, -2.7056822776794434, -2.5415616035461426, -2.377440929412842, -2.213320255279541, -2.0491995811462402, -1.8850789070129395, -1.7209582328796387, -1.5568374395370483, -1.3927167654037476, -1.2285960912704468, -1.0644752979278564, -0.9003546237945557, -0.7362339496612549, -0.5721132755279541, -0.40799254179000854, -0.24387183785438538, -0.07975113391876221, 0.08436954021453857, 0.24849027395248413, 0.4126110076904297, 0.5767312049865723, 0.740851879119873, 0.9049726128578186, 1.0690933465957642, 1.233214020729065, 1.3973346948623657, 1.561455488204956, 1.7255761623382568, 1.8896968364715576, 2.0538175106048584, 2.217938184738159, 2.38205885887146, 2.54617977142334, 2.7103004455566406, 2.8744211196899414, 3.038541793823242, 3.202662467956543, 3.3667831420898438, 3.5309038162231445, 3.6950244903564453, 3.859145164489746, 4.023265838623047, 4.187386512756348, 4.351507186889648, 4.515627861022949, 4.67974853515625, 4.843869209289551, 5.007989883422852, 5.172110557556152, 5.336231231689453, 5.500351905822754, 5.664472579956055, 5.828593730926514]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 9.0, 11.0, 8.0, 9.0, 21.0, 18.0, 23.0, 23.0, 25.0, 34.0, 39.0, 27.0, 35.0, 36.0, 35.0, 41.0, 45.0, 34.0, 43.0, 43.0, 45.0, 44.0, 39.0, 35.0, 34.0, 25.0, 27.0, 29.0, 18.0, 19.0, 26.0, 17.0, 15.0, 12.0, 13.0, 13.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2096409797668457, -2.138277530670166, -2.0669138431549072, -1.995550274848938, -1.9241867065429688, -1.852823257446289, -1.7814596891403198, -1.7100961208343506, -1.6387325525283813, -1.567368984222412, -1.4960054159164429, -1.4246418476104736, -1.353278398513794, -1.2819147109985352, -1.2105512619018555, -1.1391876935958862, -1.067824125289917, -0.9964605569839478, -0.9250969886779785, -0.853733479976654, -0.7823699116706848, -0.7110063433647156, -0.6396428346633911, -0.5682792663574219, -0.49691569805145264, -0.4255521297454834, -0.35418859124183655, -0.2828250527381897, -0.21146148443222046, -0.14009791612625122, -0.06873437762260437, 0.0026291608810424805, 0.07399249076843262, 0.14535604417324066, 0.2167195975780487, 0.28808313608169556, 0.3594467043876648, 0.43081027269363403, 0.5021737813949585, 0.5735373497009277, 0.644900918006897, 0.7162644863128662, 0.7876280546188354, 0.8589915633201599, 0.9303551316261292, 1.0017187595367432, 1.0730822086334229, 1.144445776939392, 1.2158093452453613, 1.2871729135513306, 1.3585364818572998, 1.429900050163269, 1.5012636184692383, 1.572627067565918, 1.6439906358718872, 1.7153542041778564, 1.7867177724838257, 1.858081340789795, 1.9294449090957642, 2.0008084774017334, 2.072171926498413, 2.143535614013672, 2.2148990631103516, 2.2862625122070312, 2.35762619972229]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 15.0, 16.0, 16.0, 29.0, 39.0, 57.0, 69.0, 121.0, 165.0, 226.0, 346.0, 553.0, 898.0, 1527.0, 2673.0, 4879.0, 9531.0, 21341.0, 59244.0, 202658.0, 663553.0, 1363660.0, 1165566.0, 472490.0, 144286.0, 44755.0, 17214.0, 8021.0, 4247.0, 2300.0, 1373.0, 821.0, 533.0, 316.0, 220.0, 148.0, 108.0, 70.0, 54.0, 43.0, 29.0, 19.0, 12.0, 12.0, 9.0, 5.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.3515625, -0.3405265808105469, -0.32949066162109375, -0.3184547424316406, -0.3074188232421875, -0.2963829040527344, -0.28534698486328125, -0.2743110656738281, -0.263275146484375, -0.2522392272949219, -0.24120330810546875, -0.23016738891601562, -0.2191314697265625, -0.20809555053710938, -0.19705963134765625, -0.18602371215820312, -0.17498779296875, -0.16395187377929688, -0.15291595458984375, -0.14188003540039062, -0.1308441162109375, -0.11980819702148438, -0.10877227783203125, -0.09773635864257812, -0.086700439453125, -0.07566452026367188, -0.06462860107421875, -0.053592681884765625, -0.0425567626953125, -0.031520843505859375, -0.02048492431640625, -0.009449005126953125, 0.0015869140625, 0.012622833251953125, 0.02365875244140625, 0.034694671630859375, 0.0457305908203125, 0.056766510009765625, 0.06780242919921875, 0.07883834838867188, 0.089874267578125, 0.10091018676757812, 0.11194610595703125, 0.12298202514648438, 0.1340179443359375, 0.14505386352539062, 0.15608978271484375, 0.16712570190429688, 0.17816162109375, 0.18919754028320312, 0.20023345947265625, 0.21126937866210938, 0.2223052978515625, 0.23334121704101562, 0.24437713623046875, 0.2554130554199219, 0.266448974609375, 0.2774848937988281, 0.28852081298828125, 0.2995567321777344, 0.3105926513671875, 0.3216285705566406, 0.33266448974609375, 0.3437004089355469, 0.354736328125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 3.0, 7.0, 10.0, 13.0, 11.0, 16.0, 15.0, 24.0, 19.0, 25.0, 22.0, 24.0, 34.0, 38.0, 35.0, 37.0, 53.0, 50.0, 40.0, 45.0, 47.0, 36.0, 41.0, 31.0, 37.0, 36.0, 31.0, 30.0, 29.0, 38.0, 15.0, 22.0, 11.0, 12.0, 14.0, 11.0, 7.0, 8.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.329345703125, -0.3184700012207031, -0.30759429931640625, -0.2967185974121094, -0.2858428955078125, -0.2749671936035156, -0.26409149169921875, -0.2532157897949219, -0.242340087890625, -0.23146438598632812, -0.22058868408203125, -0.20971298217773438, -0.1988372802734375, -0.18796157836914062, -0.17708587646484375, -0.16621017456054688, -0.15533447265625, -0.14445877075195312, -0.13358306884765625, -0.12270736694335938, -0.1118316650390625, -0.10095596313476562, -0.09008026123046875, -0.07920455932617188, -0.068328857421875, -0.057453155517578125, -0.04657745361328125, -0.035701751708984375, -0.0248260498046875, -0.013950347900390625, -0.00307464599609375, 0.007801055908203125, 0.0186767578125, 0.029552459716796875, 0.04042816162109375, 0.051303863525390625, 0.0621795654296875, 0.07305526733398438, 0.08393096923828125, 0.09480667114257812, 0.105682373046875, 0.11655807495117188, 0.12743377685546875, 0.13830947875976562, 0.1491851806640625, 0.16006088256835938, 0.17093658447265625, 0.18181228637695312, 0.19268798828125, 0.20356369018554688, 0.21443939208984375, 0.22531509399414062, 0.2361907958984375, 0.24706649780273438, 0.25794219970703125, 0.2688179016113281, 0.279693603515625, 0.2905693054199219, 0.30144500732421875, 0.3123207092285156, 0.3231964111328125, 0.3340721130371094, 0.34494781494140625, 0.3558235168457031, 0.36669921875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 12.0, 13.0, 14.0, 32.0, 27.0, 45.0, 74.0, 113.0, 188.0, 385.0, 877.0, 2494.0, 9294.0, 48179.0, 520554.0, 3313508.0, 257427.0, 30967.0, 6609.0, 1941.0, 689.0, 301.0, 186.0, 115.0, 63.0, 42.0, 34.0, 18.0, 18.0, 12.0, 10.0, 4.0, 9.0, 7.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0859375, -1.05133056640625, -1.0167236328125, -0.98211669921875, -0.947509765625, -0.91290283203125, -0.8782958984375, -0.84368896484375, -0.80908203125, -0.77447509765625, -0.7398681640625, -0.70526123046875, -0.670654296875, -0.63604736328125, -0.6014404296875, -0.56683349609375, -0.5322265625, -0.49761962890625, -0.4630126953125, -0.42840576171875, -0.393798828125, -0.35919189453125, -0.3245849609375, -0.28997802734375, -0.25537109375, -0.22076416015625, -0.1861572265625, -0.15155029296875, -0.116943359375, -0.08233642578125, -0.0477294921875, -0.01312255859375, 0.021484375, 0.05609130859375, 0.0906982421875, 0.12530517578125, 0.159912109375, 0.19451904296875, 0.2291259765625, 0.26373291015625, 0.29833984375, 0.33294677734375, 0.3675537109375, 0.40216064453125, 0.436767578125, 0.47137451171875, 0.5059814453125, 0.54058837890625, 0.5751953125, 0.60980224609375, 0.6444091796875, 0.67901611328125, 0.713623046875, 0.74822998046875, 0.7828369140625, 0.81744384765625, 0.85205078125, 0.88665771484375, 0.9212646484375, 0.95587158203125, 0.990478515625, 1.02508544921875, 1.0596923828125, 1.09429931640625, 1.12890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 7.0, 8.0, 10.0, 11.0, 18.0, 34.0, 56.0, 87.0, 194.0, 331.0, 764.0, 1042.0, 736.0, 342.0, 189.0, 87.0, 60.0, 36.0, 23.0, 10.0, 11.0, 11.0, 7.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77392578125, -0.7379226684570312, -0.7019195556640625, -0.6659164428710938, -0.629913330078125, -0.5939102172851562, -0.5579071044921875, -0.5219039916992188, -0.48590087890625, -0.44989776611328125, -0.4138946533203125, -0.37789154052734375, -0.341888427734375, -0.30588531494140625, -0.2698822021484375, -0.23387908935546875, -0.1978759765625, -0.16187286376953125, -0.1258697509765625, -0.08986663818359375, -0.053863525390625, -0.01786041259765625, 0.0181427001953125, 0.05414581298828125, 0.09014892578125, 0.12615203857421875, 0.1621551513671875, 0.19815826416015625, 0.234161376953125, 0.27016448974609375, 0.3061676025390625, 0.34217071533203125, 0.378173828125, 0.41417694091796875, 0.4501800537109375, 0.48618316650390625, 0.522186279296875, 0.5581893920898438, 0.5941925048828125, 0.6301956176757812, 0.66619873046875, 0.7022018432617188, 0.7382049560546875, 0.7742080688476562, 0.810211181640625, 0.8462142944335938, 0.8822174072265625, 0.9182205200195312, 0.9542236328125, 0.9902267456054688, 1.0262298583984375, 1.0622329711914062, 1.098236083984375, 1.1342391967773438, 1.1702423095703125, 1.2062454223632812, 1.24224853515625, 1.2782516479492188, 1.3142547607421875, 1.3502578735351562, 1.386260986328125, 1.4222640991210938, 1.4582672119140625, 1.4942703247070312, 1.5302734375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 7.0, 9.0, 9.0, 24.0, 41.0, 59.0, 109.0, 119.0, 140.0, 130.0, 106.0, 93.0, 54.0, 38.0, 22.0, 16.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.293895721435547, -4.162692070007324, -4.03148889541626, -3.900285482406616, -3.7690820693969727, -3.637878656387329, -3.5066752433776855, -3.375471830368042, -3.2442684173583984, -3.113065004348755, -2.9818615913391113, -2.8506581783294678, -2.719454765319824, -2.5882513523101807, -2.457047939300537, -2.3258445262908936, -2.19464111328125, -2.0634377002716064, -1.932234287261963, -1.8010308742523193, -1.6698274612426758, -1.5386240482330322, -1.4074206352233887, -1.2762172222137451, -1.1450138092041016, -1.013810396194458, -0.8826069831848145, -0.7514035701751709, -0.6202001571655273, -0.4889967441558838, -0.35779333114624023, -0.22658991813659668, -0.09538698196411133, 0.03581643104553223, 0.16701984405517578, 0.29822325706481934, 0.4294266700744629, 0.5606300830841064, 0.69183349609375, 0.8230369091033936, 0.9542403221130371, 1.0854437351226807, 1.2166471481323242, 1.3478505611419678, 1.4790539741516113, 1.6102573871612549, 1.7414608001708984, 1.872664213180542, 2.0038676261901855, 2.135071039199829, 2.2662744522094727, 2.397477865219116, 2.5286812782287598, 2.6598846912384033, 2.791088104248047, 2.9222915172576904, 3.053494930267334, 3.1846983432769775, 3.315901756286621, 3.4471051692962646, 3.578308582305908, 3.7095119953155518, 3.8407154083251953, 3.971918821334839, 4.103122234344482]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 7.0, 10.0, 13.0, 14.0, 11.0, 13.0, 21.0, 18.0, 24.0, 35.0, 35.0, 31.0, 37.0, 39.0, 42.0, 49.0, 46.0, 48.0, 40.0, 44.0, 39.0, 28.0, 34.0, 40.0, 36.0, 30.0, 32.0, 23.0, 27.0, 16.0, 15.0, 12.0, 17.0, 7.0, 12.0, 6.0, 11.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.9300289154052734, -1.8679583072662354, -1.8058876991271973, -1.7438170909881592, -1.681746482849121, -1.619675874710083, -1.557605266571045, -1.4955346584320068, -1.4334640502929688, -1.3713934421539307, -1.3093228340148926, -1.2472522258758545, -1.1851816177368164, -1.1231110095977783, -1.0610404014587402, -0.9989697933197021, -0.9368991851806641, -0.874828577041626, -0.8127579689025879, -0.7506873607635498, -0.6886167526245117, -0.6265461444854736, -0.5644755363464355, -0.5024049282073975, -0.4403343200683594, -0.3782637119293213, -0.3161931037902832, -0.2541224956512451, -0.19205188751220703, -0.12998127937316895, -0.06791067123413086, -0.0058400630950927734, 0.05623054504394531, 0.1183011531829834, 0.18037176132202148, 0.24244236946105957, 0.30451297760009766, 0.36658358573913574, 0.42865419387817383, 0.4907248020172119, 0.55279541015625, 0.6148660182952881, 0.6769366264343262, 0.7390072345733643, 0.8010778427124023, 0.8631484508514404, 0.9252190589904785, 0.9872896671295166, 1.0493602752685547, 1.1114308834075928, 1.1735014915466309, 1.235572099685669, 1.297642707824707, 1.3597133159637451, 1.4217839241027832, 1.4838545322418213, 1.5459251403808594, 1.6079957485198975, 1.6700663566589355, 1.7321369647979736, 1.7942075729370117, 1.8562781810760498, 1.918348789215088, 1.980419397354126, 2.042490005493164]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 6.0, 8.0, 10.0, 13.0, 22.0, 28.0, 40.0, 45.0, 103.0, 165.0, 215.0, 377.0, 551.0, 977.0, 1529.0, 2509.0, 4296.0, 7267.0, 13035.0, 23398.0, 44424.0, 86515.0, 162183.0, 235535.0, 206567.0, 122303.0, 62281.0, 32492.0, 17538.0, 9790.0, 5681.0, 3305.0, 1991.0, 1218.0, 798.0, 495.0, 296.0, 181.0, 129.0, 87.0, 48.0, 35.0, 21.0, 20.0, 7.0, 8.0, 8.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.452880859375, -0.439056396484375, -0.42523193359375, -0.411407470703125, -0.3975830078125, -0.383758544921875, -0.36993408203125, -0.356109619140625, -0.34228515625, -0.328460693359375, -0.31463623046875, -0.300811767578125, -0.2869873046875, -0.273162841796875, -0.25933837890625, -0.245513916015625, -0.231689453125, -0.217864990234375, -0.20404052734375, -0.190216064453125, -0.1763916015625, -0.162567138671875, -0.14874267578125, -0.134918212890625, -0.12109375, -0.107269287109375, -0.09344482421875, -0.079620361328125, -0.0657958984375, -0.051971435546875, -0.03814697265625, -0.024322509765625, -0.010498046875, 0.003326416015625, 0.01715087890625, 0.030975341796875, 0.0447998046875, 0.058624267578125, 0.07244873046875, 0.086273193359375, 0.10009765625, 0.113922119140625, 0.12774658203125, 0.141571044921875, 0.1553955078125, 0.169219970703125, 0.18304443359375, 0.196868896484375, 0.210693359375, 0.224517822265625, 0.23834228515625, 0.252166748046875, 0.2659912109375, 0.279815673828125, 0.29364013671875, 0.307464599609375, 0.3212890625, 0.335113525390625, 0.34893798828125, 0.362762451171875, 0.3765869140625, 0.390411376953125, 0.40423583984375, 0.418060302734375, 0.431884765625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 10.0, 10.0, 7.0, 16.0, 14.0, 10.0, 13.0, 19.0, 23.0, 26.0, 26.0, 37.0, 29.0, 35.0, 36.0, 34.0, 51.0, 43.0, 48.0, 42.0, 49.0, 46.0, 38.0, 48.0, 36.0, 38.0, 31.0, 27.0, 31.0, 21.0, 14.0, 17.0, 11.0, 13.0, 13.0, 6.0, 11.0, 5.0, 5.0, 8.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.38525390625, -0.3739166259765625, -0.362579345703125, -0.3512420654296875, -0.33990478515625, -0.3285675048828125, -0.317230224609375, -0.3058929443359375, -0.2945556640625, -0.2832183837890625, -0.271881103515625, -0.2605438232421875, -0.24920654296875, -0.2378692626953125, -0.226531982421875, -0.2151947021484375, -0.203857421875, -0.1925201416015625, -0.181182861328125, -0.1698455810546875, -0.15850830078125, -0.1471710205078125, -0.135833740234375, -0.1244964599609375, -0.1131591796875, -0.1018218994140625, -0.090484619140625, -0.0791473388671875, -0.06781005859375, -0.0564727783203125, -0.045135498046875, -0.0337982177734375, -0.0224609375, -0.0111236572265625, 0.000213623046875, 0.0115509033203125, 0.02288818359375, 0.0342254638671875, 0.045562744140625, 0.0569000244140625, 0.0682373046875, 0.0795745849609375, 0.090911865234375, 0.1022491455078125, 0.11358642578125, 0.1249237060546875, 0.136260986328125, 0.1475982666015625, 0.158935546875, 0.1702728271484375, 0.181610107421875, 0.1929473876953125, 0.20428466796875, 0.2156219482421875, 0.226959228515625, 0.2382965087890625, 0.2496337890625, 0.2609710693359375, 0.272308349609375, 0.2836456298828125, 0.29498291015625, 0.3063201904296875, 0.317657470703125, 0.3289947509765625, 0.34033203125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 8.0, 7.0, 8.0, 5.0, 18.0, 22.0, 29.0, 39.0, 56.0, 67.0, 114.0, 191.0, 293.0, 398.0, 693.0, 1216.0, 2099.0, 3742.0, 7126.0, 14002.0, 29023.0, 65204.0, 156160.0, 309172.0, 254886.0, 111413.0, 47223.0, 21838.0, 10687.0, 5513.0, 3005.0, 1648.0, 961.0, 604.0, 359.0, 214.0, 164.0, 110.0, 69.0, 52.0, 31.0, 29.0, 19.0, 10.0, 5.0, 6.0, 9.0, 5.0, 5.0, 1.0, 5.0], "bins": [-0.7177734375, -0.698272705078125, -0.67877197265625, -0.659271240234375, -0.6397705078125, -0.620269775390625, -0.60076904296875, -0.581268310546875, -0.561767578125, -0.542266845703125, -0.52276611328125, -0.503265380859375, -0.4837646484375, -0.464263916015625, -0.44476318359375, -0.425262451171875, -0.40576171875, -0.386260986328125, -0.36676025390625, -0.347259521484375, -0.3277587890625, -0.308258056640625, -0.28875732421875, -0.269256591796875, -0.249755859375, -0.230255126953125, -0.21075439453125, -0.191253662109375, -0.1717529296875, -0.152252197265625, -0.13275146484375, -0.113250732421875, -0.09375, -0.074249267578125, -0.05474853515625, -0.035247802734375, -0.0157470703125, 0.003753662109375, 0.02325439453125, 0.042755126953125, 0.062255859375, 0.081756591796875, 0.10125732421875, 0.120758056640625, 0.1402587890625, 0.159759521484375, 0.17926025390625, 0.198760986328125, 0.21826171875, 0.237762451171875, 0.25726318359375, 0.276763916015625, 0.2962646484375, 0.315765380859375, 0.33526611328125, 0.354766845703125, 0.374267578125, 0.393768310546875, 0.41326904296875, 0.432769775390625, 0.4522705078125, 0.471771240234375, 0.49127197265625, 0.510772705078125, 0.5302734375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 6.0, 8.0, 11.0, 14.0, 18.0, 11.0, 18.0, 13.0, 25.0, 20.0, 28.0, 38.0, 41.0, 39.0, 42.0, 42.0, 62.0, 49.0, 47.0, 64.0, 51.0, 42.0, 35.0, 39.0, 29.0, 33.0, 28.0, 24.0, 24.0, 16.0, 15.0, 22.0, 13.0, 9.0, 6.0, 7.0, 3.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4248046875, -1.386077880859375, -1.34735107421875, -1.308624267578125, -1.2698974609375, -1.231170654296875, -1.19244384765625, -1.153717041015625, -1.114990234375, -1.076263427734375, -1.03753662109375, -0.998809814453125, -0.9600830078125, -0.921356201171875, -0.88262939453125, -0.843902587890625, -0.80517578125, -0.766448974609375, -0.72772216796875, -0.688995361328125, -0.6502685546875, -0.611541748046875, -0.57281494140625, -0.534088134765625, -0.495361328125, -0.456634521484375, -0.41790771484375, -0.379180908203125, -0.3404541015625, -0.301727294921875, -0.26300048828125, -0.224273681640625, -0.185546875, -0.146820068359375, -0.10809326171875, -0.069366455078125, -0.0306396484375, 0.008087158203125, 0.04681396484375, 0.085540771484375, 0.124267578125, 0.162994384765625, 0.20172119140625, 0.240447998046875, 0.2791748046875, 0.317901611328125, 0.35662841796875, 0.395355224609375, 0.43408203125, 0.472808837890625, 0.51153564453125, 0.550262451171875, 0.5889892578125, 0.627716064453125, 0.66644287109375, 0.705169677734375, 0.743896484375, 0.782623291015625, 0.82135009765625, 0.860076904296875, 0.8988037109375, 0.937530517578125, 0.97625732421875, 1.014984130859375, 1.0537109375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 3.0, 2.0, 6.0, 7.0, 19.0, 13.0, 23.0, 30.0, 28.0, 40.0, 79.0, 91.0, 115.0, 198.0, 241.0, 424.0, 607.0, 981.0, 1693.0, 3042.0, 6032.0, 13217.0, 33453.0, 95497.0, 274770.0, 367313.0, 159080.0, 53438.0, 19821.0, 8413.0, 4072.0, 2247.0, 1225.0, 765.0, 486.0, 330.0, 205.0, 161.0, 109.0, 74.0, 62.0, 26.0, 24.0, 22.0, 13.0, 17.0, 9.0, 9.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.26171875, -0.2533378601074219, -0.24495697021484375, -0.23657608032226562, -0.2281951904296875, -0.21981430053710938, -0.21143341064453125, -0.20305252075195312, -0.194671630859375, -0.18629074096679688, -0.17790985107421875, -0.16952896118164062, -0.1611480712890625, -0.15276718139648438, -0.14438629150390625, -0.13600540161132812, -0.12762451171875, -0.11924362182617188, -0.11086273193359375, -0.10248184204101562, -0.0941009521484375, -0.08572006225585938, -0.07733917236328125, -0.06895828247070312, -0.060577392578125, -0.052196502685546875, -0.04381561279296875, -0.035434722900390625, -0.0270538330078125, -0.018672943115234375, -0.01029205322265625, -0.001911163330078125, 0.0064697265625, 0.014850616455078125, 0.02323150634765625, 0.031612396240234375, 0.0399932861328125, 0.048374176025390625, 0.05675506591796875, 0.06513595581054688, 0.073516845703125, 0.08189773559570312, 0.09027862548828125, 0.09865951538085938, 0.1070404052734375, 0.11542129516601562, 0.12380218505859375, 0.13218307495117188, 0.14056396484375, 0.14894485473632812, 0.15732574462890625, 0.16570663452148438, 0.1740875244140625, 0.18246841430664062, 0.19084930419921875, 0.19923019409179688, 0.207611083984375, 0.21599197387695312, 0.22437286376953125, 0.23275375366210938, 0.2411346435546875, 0.24951553344726562, 0.25789642333984375, 0.2662773132324219, 0.274658203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 1.0, 3.0, 4.0, 11.0, 5.0, 14.0, 15.0, 20.0, 29.0, 45.0, 42.0, 88.0, 105.0, 138.0, 144.0, 97.0, 79.0, 39.0, 33.0, 26.0, 18.0, 11.0, 9.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010985136032104492, -0.00010639242827892303, -0.00010293349623680115, -9.947456419467926e-05, -9.601563215255737e-05, -9.255670011043549e-05, -8.90977680683136e-05, -8.563883602619171e-05, -8.217990398406982e-05, -7.872097194194794e-05, -7.526203989982605e-05, -7.180310785770416e-05, -6.834417581558228e-05, -6.488524377346039e-05, -6.14263117313385e-05, -5.7967379689216614e-05, -5.4508447647094727e-05, -5.104951560497284e-05, -4.759058356285095e-05, -4.4131651520729065e-05, -4.067271947860718e-05, -3.721378743648529e-05, -3.37548553943634e-05, -3.0295923352241516e-05, -2.683699131011963e-05, -2.3378059267997742e-05, -1.9919127225875854e-05, -1.6460195183753967e-05, -1.300126314163208e-05, -9.542331099510193e-06, -6.083399057388306e-06, -2.6244670152664185e-06, 8.344650268554688e-07, 4.293397068977356e-06, 7.752329111099243e-06, 1.121126115322113e-05, 1.4670193195343018e-05, 1.8129125237464905e-05, 2.1588057279586792e-05, 2.504698932170868e-05, 2.8505921363830566e-05, 3.1964853405952454e-05, 3.542378544807434e-05, 3.888271749019623e-05, 4.2341649532318115e-05, 4.580058157444e-05, 4.925951361656189e-05, 5.271844565868378e-05, 5.6177377700805664e-05, 5.963630974292755e-05, 6.309524178504944e-05, 6.655417382717133e-05, 7.001310586929321e-05, 7.34720379114151e-05, 7.693096995353699e-05, 8.038990199565887e-05, 8.384883403778076e-05, 8.730776607990265e-05, 9.076669812202454e-05, 9.422563016414642e-05, 9.768456220626831e-05, 0.0001011434942483902, 0.00010460242629051208, 0.00010806135833263397, 0.00011152029037475586]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 9.0, 10.0, 17.0, 26.0, 30.0, 60.0, 95.0, 166.0, 227.0, 413.0, 658.0, 1395.0, 2927.0, 7210.0, 22385.0, 83187.0, 303959.0, 421066.0, 147549.0, 37720.0, 11161.0, 4221.0, 1885.0, 922.0, 483.0, 297.0, 164.0, 111.0, 73.0, 37.0, 36.0, 17.0, 10.0, 5.0, 6.0, 7.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.332763671875, -0.32303619384765625, -0.3133087158203125, -0.30358123779296875, -0.293853759765625, -0.28412628173828125, -0.2743988037109375, -0.26467132568359375, -0.25494384765625, -0.24521636962890625, -0.2354888916015625, -0.22576141357421875, -0.216033935546875, -0.20630645751953125, -0.1965789794921875, -0.18685150146484375, -0.1771240234375, -0.16739654541015625, -0.1576690673828125, -0.14794158935546875, -0.138214111328125, -0.12848663330078125, -0.1187591552734375, -0.10903167724609375, -0.09930419921875, -0.08957672119140625, -0.0798492431640625, -0.07012176513671875, -0.060394287109375, -0.05066680908203125, -0.0409393310546875, -0.03121185302734375, -0.021484375, -0.01175689697265625, -0.0020294189453125, 0.00769805908203125, 0.017425537109375, 0.02715301513671875, 0.0368804931640625, 0.04660797119140625, 0.05633544921875, 0.06606292724609375, 0.0757904052734375, 0.08551788330078125, 0.095245361328125, 0.10497283935546875, 0.1147003173828125, 0.12442779541015625, 0.1341552734375, 0.14388275146484375, 0.1536102294921875, 0.16333770751953125, 0.173065185546875, 0.18279266357421875, 0.1925201416015625, 0.20224761962890625, 0.21197509765625, 0.22170257568359375, 0.2314300537109375, 0.24115753173828125, 0.250885009765625, 0.26061248779296875, 0.2703399658203125, 0.28006744384765625, 0.289794921875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 6.0, 4.0, 3.0, 8.0, 10.0, 12.0, 19.0, 17.0, 25.0, 40.0, 45.0, 47.0, 53.0, 80.0, 81.0, 89.0, 77.0, 58.0, 64.0, 62.0, 50.0, 35.0, 33.0, 17.0, 13.0, 8.0, 15.0, 5.0, 9.0, 3.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.267578125, -0.25887298583984375, -0.2501678466796875, -0.24146270751953125, -0.232757568359375, -0.22405242919921875, -0.2153472900390625, -0.20664215087890625, -0.19793701171875, -0.18923187255859375, -0.1805267333984375, -0.17182159423828125, -0.163116455078125, -0.15441131591796875, -0.1457061767578125, -0.13700103759765625, -0.1282958984375, -0.11959075927734375, -0.1108856201171875, -0.10218048095703125, -0.093475341796875, -0.08477020263671875, -0.0760650634765625, -0.06735992431640625, -0.05865478515625, -0.04994964599609375, -0.0412445068359375, -0.03253936767578125, -0.023834228515625, -0.01512908935546875, -0.0064239501953125, 0.00228118896484375, 0.010986328125, 0.01969146728515625, 0.0283966064453125, 0.03710174560546875, 0.045806884765625, 0.05451202392578125, 0.0632171630859375, 0.07192230224609375, 0.08062744140625, 0.08933258056640625, 0.0980377197265625, 0.10674285888671875, 0.115447998046875, 0.12415313720703125, 0.1328582763671875, 0.14156341552734375, 0.1502685546875, 0.15897369384765625, 0.1676788330078125, 0.17638397216796875, 0.185089111328125, 0.19379425048828125, 0.2024993896484375, 0.21120452880859375, 0.21990966796875, 0.22861480712890625, 0.2373199462890625, 0.24602508544921875, 0.254730224609375, 0.26343536376953125, 0.2721405029296875, 0.28084564208984375, 0.28955078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 2.0, 4.0, 9.0, 14.0, 40.0, 64.0, 131.0, 144.0, 169.0, 168.0, 120.0, 70.0, 29.0, 17.0, 10.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.973979949951172, -6.8146467208862305, -6.655313014984131, -6.4959797859191895, -6.33664608001709, -6.177312850952148, -6.017979621887207, -5.858645915985107, -5.699312686920166, -5.539979457855225, -5.380645751953125, -5.221312522888184, -5.061978816986084, -4.902645587921143, -4.743311882019043, -4.583978652954102, -4.42464542388916, -4.265312194824219, -4.105978488922119, -3.9466452598571777, -3.7873117923736572, -3.6279783248901367, -3.468644857406616, -3.3093113899230957, -3.149977684020996, -2.9906442165374756, -2.831310749053955, -2.6719775199890137, -2.512644052505493, -2.3533105850219727, -2.193977117538452, -2.0346436500549316, -1.8753106594085693, -1.7159771919250488, -1.5566438436508179, -1.3973103761672974, -1.2379770278930664, -1.078643560409546, -0.9193100929260254, -0.7599767446517944, -0.6006432771682739, -0.4413098692893982, -0.2819764316082001, -0.12264299392700195, 0.03669041395187378, 0.1960238218307495, 0.35535728931427, 0.514690637588501, 0.6740241050720215, 0.8333575129508972, 0.992690920829773, 1.1520243883132935, 1.3113577365875244, 1.470691204071045, 1.6300246715545654, 1.7893580198287964, 1.948691487312317, 2.108024835586548, 2.2673583030700684, 2.426691770553589, 2.5860252380371094, 2.745358467102051, 2.9046921730041504, 3.064025402069092, 3.2233588695526123]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 8.0, 12.0, 12.0, 13.0, 7.0, 13.0, 12.0, 27.0, 22.0, 17.0, 27.0, 19.0, 40.0, 52.0, 56.0, 54.0, 39.0, 40.0, 45.0, 44.0, 42.0, 32.0, 37.0, 44.0, 50.0, 32.0, 41.0, 28.0, 21.0, 17.0, 19.0, 18.0, 18.0, 14.0, 7.0, 11.0, 3.0, 6.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8086347579956055, -2.7263264656066895, -2.6440181732177734, -2.5617098808288574, -2.4794013500213623, -2.3970930576324463, -2.3147847652435303, -2.2324764728546143, -2.1501681804656982, -2.0678598880767822, -1.9855514764785767, -1.9032431840896606, -1.8209348917007446, -1.738626480102539, -1.656318187713623, -1.574009895324707, -1.4917014837265015, -1.4093931913375854, -1.3270847797393799, -1.2447764873504639, -1.1624681949615479, -1.0801599025726318, -0.9978514909744263, -0.9155431985855103, -0.8332348465919495, -0.7509264945983887, -0.6686182022094727, -0.5863098502159119, -0.5040014982223511, -0.42169320583343506, -0.33938485383987427, -0.25707656145095825, -0.17476820945739746, -0.09245987981557846, -0.01015155017375946, 0.07215678691864014, 0.15446510910987854, 0.23677343130111694, 0.31908178329467773, 0.40139007568359375, 0.48369842767715454, 0.5660067796707153, 0.6483150720596313, 0.7306234240531921, 0.8129317760467529, 0.895240068435669, 0.9775484204292297, 1.059856653213501, 1.1421650648117065, 1.2244733572006226, 1.3067817687988281, 1.3890900611877441, 1.4713983535766602, 1.5537066459655762, 1.6360150575637817, 1.7183233499526978, 1.8006317615509033, 1.8829400539398193, 1.965248465538025, 2.0475568771362305, 2.1298651695251465, 2.2121734619140625, 2.2944817543029785, 2.3767900466918945, 2.4590983390808105]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 5.0, 3.0, 4.0, 2.0, 13.0, 14.0, 17.0, 16.0, 29.0, 47.0, 53.0, 75.0, 129.0, 208.0, 312.0, 522.0, 852.0, 1422.0, 2599.0, 4897.0, 9767.0, 22283.0, 65962.0, 223098.0, 709610.0, 1341593.0, 1110108.0, 476591.0, 148339.0, 44400.0, 16031.0, 7017.0, 3566.0, 1872.0, 1075.0, 658.0, 379.0, 229.0, 166.0, 112.0, 61.0, 58.0, 25.0, 25.0, 22.0, 13.0, 2.0, 6.0, 2.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33251953125, -0.320556640625, -0.30859375, -0.296630859375, -0.28466796875, -0.272705078125, -0.2607421875, -0.248779296875, -0.23681640625, -0.224853515625, -0.212890625, -0.200927734375, -0.18896484375, -0.177001953125, -0.1650390625, -0.153076171875, -0.14111328125, -0.129150390625, -0.1171875, -0.105224609375, -0.09326171875, -0.081298828125, -0.0693359375, -0.057373046875, -0.04541015625, -0.033447265625, -0.021484375, -0.009521484375, 0.00244140625, 0.014404296875, 0.0263671875, 0.038330078125, 0.05029296875, 0.062255859375, 0.07421875, 0.086181640625, 0.09814453125, 0.110107421875, 0.1220703125, 0.134033203125, 0.14599609375, 0.157958984375, 0.169921875, 0.181884765625, 0.19384765625, 0.205810546875, 0.2177734375, 0.229736328125, 0.24169921875, 0.253662109375, 0.265625, 0.277587890625, 0.28955078125, 0.301513671875, 0.3134765625, 0.325439453125, 0.33740234375, 0.349365234375, 0.361328125, 0.373291015625, 0.38525390625, 0.397216796875, 0.4091796875, 0.421142578125, 0.43310546875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 4.0, 8.0, 2.0, 7.0, 13.0, 11.0, 12.0, 11.0, 19.0, 16.0, 19.0, 27.0, 29.0, 21.0, 25.0, 24.0, 27.0, 36.0, 44.0, 42.0, 33.0, 49.0, 35.0, 49.0, 32.0, 33.0, 35.0, 42.0, 36.0, 35.0, 24.0, 31.0, 26.0, 27.0, 14.0, 18.0, 15.0, 14.0, 9.0, 11.0, 5.0, 7.0, 6.0, 3.0, 2.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.339599609375, -0.32944488525390625, -0.3192901611328125, -0.30913543701171875, -0.298980712890625, -0.28882598876953125, -0.2786712646484375, -0.26851654052734375, -0.25836181640625, -0.24820709228515625, -0.2380523681640625, -0.22789764404296875, -0.217742919921875, -0.20758819580078125, -0.1974334716796875, -0.18727874755859375, -0.1771240234375, -0.16696929931640625, -0.1568145751953125, -0.14665985107421875, -0.136505126953125, -0.12635040283203125, -0.1161956787109375, -0.10604095458984375, -0.09588623046875, -0.08573150634765625, -0.0755767822265625, -0.06542205810546875, -0.055267333984375, -0.04511260986328125, -0.0349578857421875, -0.02480316162109375, -0.0146484375, -0.00449371337890625, 0.0056610107421875, 0.01581573486328125, 0.025970458984375, 0.03612518310546875, 0.0462799072265625, 0.05643463134765625, 0.06658935546875, 0.07674407958984375, 0.0868988037109375, 0.09705352783203125, 0.107208251953125, 0.11736297607421875, 0.1275177001953125, 0.13767242431640625, 0.1478271484375, 0.15798187255859375, 0.1681365966796875, 0.17829132080078125, 0.188446044921875, 0.19860076904296875, 0.2087554931640625, 0.21891021728515625, 0.22906494140625, 0.23921966552734375, 0.2493743896484375, 0.25952911376953125, 0.269683837890625, 0.27983856201171875, 0.2899932861328125, 0.30014801025390625, 0.310302734375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 3.0, 14.0, 20.0, 25.0, 40.0, 67.0, 120.0, 149.0, 240.0, 513.0, 1076.0, 2316.0, 5998.0, 18543.0, 75411.0, 522556.0, 2907239.0, 551871.0, 78589.0, 18742.0, 6078.0, 2353.0, 1080.0, 497.0, 283.0, 140.0, 93.0, 58.0, 54.0, 28.0, 22.0, 17.0, 7.0, 7.0, 7.0, 7.0, 3.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75537109375, -0.7306137084960938, -0.7058563232421875, -0.6810989379882812, -0.656341552734375, -0.6315841674804688, -0.6068267822265625, -0.5820693969726562, -0.55731201171875, -0.5325546264648438, -0.5077972412109375, -0.48303985595703125, -0.458282470703125, -0.43352508544921875, -0.4087677001953125, -0.38401031494140625, -0.3592529296875, -0.33449554443359375, -0.3097381591796875, -0.28498077392578125, -0.260223388671875, -0.23546600341796875, -0.2107086181640625, -0.18595123291015625, -0.16119384765625, -0.13643646240234375, -0.1116790771484375, -0.08692169189453125, -0.062164306640625, -0.03740692138671875, -0.0126495361328125, 0.01210784912109375, 0.036865234375, 0.06162261962890625, 0.0863800048828125, 0.11113739013671875, 0.135894775390625, 0.16065216064453125, 0.1854095458984375, 0.21016693115234375, 0.23492431640625, 0.25968170166015625, 0.2844390869140625, 0.30919647216796875, 0.333953857421875, 0.35871124267578125, 0.3834686279296875, 0.40822601318359375, 0.4329833984375, 0.45774078369140625, 0.4824981689453125, 0.5072555541992188, 0.532012939453125, 0.5567703247070312, 0.5815277099609375, 0.6062850952148438, 0.63104248046875, 0.6557998657226562, 0.6805572509765625, 0.7053146362304688, 0.730072021484375, 0.7548294067382812, 0.7795867919921875, 0.8043441772460938, 0.8291015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 13.0, 15.0, 20.0, 28.0, 51.0, 93.0, 127.0, 178.0, 312.0, 616.0, 845.0, 736.0, 432.0, 246.0, 124.0, 79.0, 47.0, 38.0, 22.0, 13.0, 17.0, 10.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71533203125, -0.6851272583007812, -0.6549224853515625, -0.6247177124023438, -0.594512939453125, -0.5643081665039062, -0.5341033935546875, -0.5038986206054688, -0.47369384765625, -0.44348907470703125, -0.4132843017578125, -0.38307952880859375, -0.352874755859375, -0.32266998291015625, -0.2924652099609375, -0.26226043701171875, -0.2320556640625, -0.20185089111328125, -0.1716461181640625, -0.14144134521484375, -0.111236572265625, -0.08103179931640625, -0.0508270263671875, -0.02062225341796875, 0.00958251953125, 0.03978729248046875, 0.0699920654296875, 0.10019683837890625, 0.130401611328125, 0.16060638427734375, 0.1908111572265625, 0.22101593017578125, 0.251220703125, 0.28142547607421875, 0.3116302490234375, 0.34183502197265625, 0.372039794921875, 0.40224456787109375, 0.4324493408203125, 0.46265411376953125, 0.49285888671875, 0.5230636596679688, 0.5532684326171875, 0.5834732055664062, 0.613677978515625, 0.6438827514648438, 0.6740875244140625, 0.7042922973632812, 0.7344970703125, 0.7647018432617188, 0.7949066162109375, 0.8251113891601562, 0.855316162109375, 0.8855209350585938, 0.9157257080078125, 0.9459304809570312, 0.97613525390625, 1.0063400268554688, 1.0365447998046875, 1.0667495727539062, 1.096954345703125, 1.1271591186523438, 1.1573638916015625, 1.1875686645507812, 1.2177734375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 16.0, 36.0, 74.0, 142.0, 202.0, 229.0, 156.0, 77.0, 35.0, 17.0, 8.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.867579936981201, -7.648634910583496, -7.429689884185791, -7.210744857788086, -6.991799831390381, -6.772854804992676, -6.553910255432129, -6.334965229034424, -6.116020202636719, -5.897075176239014, -5.678130149841309, -5.4591851234436035, -5.240240097045898, -5.021295547485352, -4.802350044250488, -4.583405494689941, -4.364459991455078, -4.145514965057373, -3.926569938659668, -3.707624912261963, -3.488680124282837, -3.269735097885132, -3.0507900714874268, -2.831845283508301, -2.6129002571105957, -2.3939552307128906, -2.1750102043151855, -1.95606529712677, -1.7371203899383545, -1.5181753635406494, -1.2992303371429443, -1.0802854299545288, -0.8613405227661133, -0.642395555973053, -0.4234505593776703, -0.2045055627822876, 0.014439404010772705, 0.233384370803833, 0.4523293972015381, 0.6712743043899536, 0.8902193307876587, 1.1091643571853638, 1.3281092643737793, 1.5470542907714844, 1.7659993171691895, 1.984944224357605, 2.2038893699645996, 2.4228341579437256, 2.6417791843414307, 2.8607242107391357, 3.079669237136841, 3.298614025115967, 3.517559051513672, 3.736504077911377, 3.955449104309082, 4.174394130706787, 4.393339157104492, 4.612284183502197, 4.831229209899902, 5.050174236297607, 5.2691192626953125, 5.488063812255859, 5.707009315490723, 5.9259538650512695, 6.144898891448975]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 10.0, 3.0, 8.0, 13.0, 13.0, 11.0, 21.0, 21.0, 14.0, 30.0, 20.0, 23.0, 30.0, 32.0, 36.0, 35.0, 42.0, 46.0, 43.0, 37.0, 44.0, 44.0, 37.0, 33.0, 34.0, 36.0, 33.0, 33.0, 26.0, 30.0, 32.0, 19.0, 19.0, 16.0, 9.0, 12.0, 5.0, 12.0, 10.0, 6.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.038085699081421, -1.9768325090408325, -1.9155793190002441, -1.8543261289596558, -1.7930729389190674, -1.7318198680877686, -1.6705666780471802, -1.6093134880065918, -1.5480602979660034, -1.486807107925415, -1.4255539178848267, -1.3643007278442383, -1.3030476570129395, -1.2417943477630615, -1.1805412769317627, -1.1192880868911743, -1.058034896850586, -0.9967817068099976, -0.9355285167694092, -0.8742753863334656, -0.8130221962928772, -0.7517690062522888, -0.6905158758163452, -0.6292626857757568, -0.5680094957351685, -0.5067563056945801, -0.4455031454563141, -0.3842499852180481, -0.3229967951774597, -0.26174360513687134, -0.20049044489860535, -0.13923728466033936, -0.07798397541046143, -0.01673080027103424, 0.044522374868392944, 0.10577555000782013, 0.16702872514724731, 0.2282819151878357, 0.2895350754261017, 0.3507882356643677, 0.41204142570495605, 0.47329461574554443, 0.5345478057861328, 0.5958009362220764, 0.6570541262626648, 0.7183073163032532, 0.7795604467391968, 0.8408136367797852, 0.9020668268203735, 0.9633200168609619, 1.0245732069015503, 1.0858263969421387, 1.1470794677734375, 1.2083327770233154, 1.2695858478546143, 1.3308390378952026, 1.392092227935791, 1.4533454179763794, 1.5145986080169678, 1.5758517980575562, 1.6371049880981445, 1.6983580589294434, 1.7596112489700317, 1.8208644390106201, 1.8821176290512085]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 11.0, 9.0, 17.0, 19.0, 32.0, 51.0, 69.0, 112.0, 146.0, 219.0, 372.0, 578.0, 931.0, 1639.0, 3021.0, 5561.0, 10840.0, 22182.0, 49773.0, 122999.0, 270586.0, 298414.0, 149021.0, 59304.0, 25792.0, 12364.0, 6352.0, 3465.0, 1837.0, 1023.0, 668.0, 390.0, 256.0, 146.0, 101.0, 66.0, 58.0, 40.0, 22.0, 15.0, 8.0, 5.0, 8.0, 5.0, 6.0, 8.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.463134765625, -0.4477500915527344, -0.43236541748046875, -0.4169807434082031, -0.4015960693359375, -0.3862113952636719, -0.37082672119140625, -0.3554420471191406, -0.340057373046875, -0.3246726989746094, -0.30928802490234375, -0.2939033508300781, -0.2785186767578125, -0.2631340026855469, -0.24774932861328125, -0.23236465454101562, -0.21697998046875, -0.20159530639648438, -0.18621063232421875, -0.17082595825195312, -0.1554412841796875, -0.14005661010742188, -0.12467193603515625, -0.10928726196289062, -0.093902587890625, -0.07851791381835938, -0.06313323974609375, -0.047748565673828125, -0.0323638916015625, -0.016979217529296875, -0.00159454345703125, 0.013790130615234375, 0.0291748046875, 0.044559478759765625, 0.05994415283203125, 0.07532882690429688, 0.0907135009765625, 0.10609817504882812, 0.12148284912109375, 0.13686752319335938, 0.152252197265625, 0.16763687133789062, 0.18302154541015625, 0.19840621948242188, 0.2137908935546875, 0.22917556762695312, 0.24456024169921875, 0.2599449157714844, 0.27532958984375, 0.2907142639160156, 0.30609893798828125, 0.3214836120605469, 0.3368682861328125, 0.3522529602050781, 0.36763763427734375, 0.3830223083496094, 0.398406982421875, 0.4137916564941406, 0.42917633056640625, 0.4445610046386719, 0.4599456787109375, 0.4753303527832031, 0.49071502685546875, 0.5060997009277344, 0.521484375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 3.0, 4.0, 8.0, 2.0, 10.0, 12.0, 10.0, 15.0, 10.0, 19.0, 23.0, 23.0, 22.0, 28.0, 42.0, 35.0, 38.0, 30.0, 45.0, 49.0, 39.0, 36.0, 32.0, 58.0, 41.0, 37.0, 42.0, 36.0, 31.0, 36.0, 24.0, 27.0, 27.0, 21.0, 12.0, 17.0, 8.0, 11.0, 6.0, 11.0, 6.0, 9.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.42822265625, -0.4158515930175781, -0.40348052978515625, -0.3911094665527344, -0.3787384033203125, -0.3663673400878906, -0.35399627685546875, -0.3416252136230469, -0.329254150390625, -0.3168830871582031, -0.30451202392578125, -0.2921409606933594, -0.2797698974609375, -0.2673988342285156, -0.25502777099609375, -0.24265670776367188, -0.23028564453125, -0.21791458129882812, -0.20554351806640625, -0.19317245483398438, -0.1808013916015625, -0.16843032836914062, -0.15605926513671875, -0.14368820190429688, -0.131317138671875, -0.11894607543945312, -0.10657501220703125, -0.09420394897460938, -0.0818328857421875, -0.06946182250976562, -0.05709075927734375, -0.044719696044921875, -0.0323486328125, -0.019977569580078125, -0.00760650634765625, 0.004764556884765625, 0.0171356201171875, 0.029506683349609375, 0.04187774658203125, 0.054248809814453125, 0.066619873046875, 0.07899093627929688, 0.09136199951171875, 0.10373306274414062, 0.1161041259765625, 0.12847518920898438, 0.14084625244140625, 0.15321731567382812, 0.16558837890625, 0.17795944213867188, 0.19033050537109375, 0.20270156860351562, 0.2150726318359375, 0.22744369506835938, 0.23981475830078125, 0.2521858215332031, 0.264556884765625, 0.2769279479980469, 0.28929901123046875, 0.3016700744628906, 0.3140411376953125, 0.3264122009277344, 0.33878326416015625, 0.3511543273925781, 0.363525390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 7.0, 8.0, 17.0, 17.0, 45.0, 45.0, 68.0, 74.0, 137.0, 236.0, 366.0, 692.0, 1223.0, 2380.0, 4806.0, 10306.0, 23257.0, 58475.0, 173309.0, 400913.0, 238913.0, 77928.0, 30168.0, 12906.0, 5899.0, 2854.0, 1471.0, 778.0, 449.0, 293.0, 150.0, 123.0, 68.0, 56.0, 36.0, 13.0, 25.0, 10.0, 8.0, 7.0, 1.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.79736328125, -0.7743453979492188, -0.7513275146484375, -0.7283096313476562, -0.705291748046875, -0.6822738647460938, -0.6592559814453125, -0.6362380981445312, -0.61322021484375, -0.5902023315429688, -0.5671844482421875, -0.5441665649414062, -0.521148681640625, -0.49813079833984375, -0.4751129150390625, -0.45209503173828125, -0.4290771484375, -0.40605926513671875, -0.3830413818359375, -0.36002349853515625, -0.337005615234375, -0.31398773193359375, -0.2909698486328125, -0.26795196533203125, -0.24493408203125, -0.22191619873046875, -0.1988983154296875, -0.17588043212890625, -0.152862548828125, -0.12984466552734375, -0.1068267822265625, -0.08380889892578125, -0.060791015625, -0.03777313232421875, -0.0147552490234375, 0.00826263427734375, 0.031280517578125, 0.05429840087890625, 0.0773162841796875, 0.10033416748046875, 0.12335205078125, 0.14636993408203125, 0.1693878173828125, 0.19240570068359375, 0.215423583984375, 0.23844146728515625, 0.2614593505859375, 0.28447723388671875, 0.3074951171875, 0.33051300048828125, 0.3535308837890625, 0.37654876708984375, 0.399566650390625, 0.42258453369140625, 0.4456024169921875, 0.46862030029296875, 0.49163818359375, 0.5146560668945312, 0.5376739501953125, 0.5606918334960938, 0.583709716796875, 0.6067276000976562, 0.6297454833984375, 0.6527633666992188, 0.67578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 8.0, 7.0, 9.0, 14.0, 18.0, 13.0, 17.0, 28.0, 19.0, 21.0, 36.0, 35.0, 35.0, 21.0, 37.0, 47.0, 51.0, 41.0, 54.0, 31.0, 40.0, 37.0, 40.0, 39.0, 31.0, 29.0, 37.0, 25.0, 29.0, 20.0, 20.0, 14.0, 12.0, 15.0, 15.0, 8.0, 7.0, 8.0, 6.0, 7.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9599609375, -0.925384521484375, -0.89080810546875, -0.856231689453125, -0.8216552734375, -0.787078857421875, -0.75250244140625, -0.717926025390625, -0.683349609375, -0.648773193359375, -0.61419677734375, -0.579620361328125, -0.5450439453125, -0.510467529296875, -0.47589111328125, -0.441314697265625, -0.40673828125, -0.372161865234375, -0.33758544921875, -0.303009033203125, -0.2684326171875, -0.233856201171875, -0.19927978515625, -0.164703369140625, -0.130126953125, -0.095550537109375, -0.06097412109375, -0.026397705078125, 0.0081787109375, 0.042755126953125, 0.07733154296875, 0.111907958984375, 0.146484375, 0.181060791015625, 0.21563720703125, 0.250213623046875, 0.2847900390625, 0.319366455078125, 0.35394287109375, 0.388519287109375, 0.423095703125, 0.457672119140625, 0.49224853515625, 0.526824951171875, 0.5614013671875, 0.595977783203125, 0.63055419921875, 0.665130615234375, 0.69970703125, 0.734283447265625, 0.76885986328125, 0.803436279296875, 0.8380126953125, 0.872589111328125, 0.90716552734375, 0.941741943359375, 0.976318359375, 1.010894775390625, 1.04547119140625, 1.080047607421875, 1.1146240234375, 1.149200439453125, 1.18377685546875, 1.218353271484375, 1.2529296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 1.0, 6.0, 7.0, 7.0, 11.0, 17.0, 21.0, 42.0, 36.0, 55.0, 109.0, 140.0, 161.0, 276.0, 484.0, 775.0, 1208.0, 2224.0, 4509.0, 10951.0, 34774.0, 150464.0, 507516.0, 252202.0, 54343.0, 15647.0, 5889.0, 2688.0, 1468.0, 908.0, 494.0, 371.0, 230.0, 151.0, 116.0, 83.0, 44.0, 42.0, 24.0, 15.0, 11.0, 13.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.297119140625, -0.2885475158691406, -0.27997589111328125, -0.2714042663574219, -0.2628326416015625, -0.2542610168457031, -0.24568939208984375, -0.23711776733398438, -0.228546142578125, -0.21997451782226562, -0.21140289306640625, -0.20283126831054688, -0.1942596435546875, -0.18568801879882812, -0.17711639404296875, -0.16854476928710938, -0.15997314453125, -0.15140151977539062, -0.14282989501953125, -0.13425827026367188, -0.1256866455078125, -0.11711502075195312, -0.10854339599609375, -0.09997177124023438, -0.091400146484375, -0.08282852172851562, -0.07425689697265625, -0.06568527221679688, -0.0571136474609375, -0.048542022705078125, -0.03997039794921875, -0.031398773193359375, -0.0228271484375, -0.014255523681640625, -0.00568389892578125, 0.002887725830078125, 0.0114593505859375, 0.020030975341796875, 0.02860260009765625, 0.037174224853515625, 0.045745849609375, 0.054317474365234375, 0.06288909912109375, 0.07146072387695312, 0.0800323486328125, 0.08860397338867188, 0.09717559814453125, 0.10574722290039062, 0.11431884765625, 0.12289047241210938, 0.13146209716796875, 0.14003372192382812, 0.1486053466796875, 0.15717697143554688, 0.16574859619140625, 0.17432022094726562, 0.182891845703125, 0.19146347045898438, 0.20003509521484375, 0.20860671997070312, 0.2171783447265625, 0.22574996948242188, 0.23432159423828125, 0.24289321899414062, 0.25146484375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 13.0, 15.0, 27.0, 43.0, 64.0, 83.0, 132.0, 164.0, 143.0, 102.0, 68.0, 58.0, 28.0, 21.0, 3.0, 6.0, 9.0, 6.0, 7.0, 1.0, 0.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00014519691467285156, -0.00014172587543725967, -0.00013825483620166779, -0.0001347837969660759, -0.000131312757730484, -0.00012784171849489212, -0.00012437067925930023, -0.00012089964002370834, -0.00011742860078811646, -0.00011395756155252457, -0.00011048652231693268, -0.00010701548308134079, -0.0001035444438457489, -0.00010007340461015701, -9.660236537456512e-05, -9.313132613897324e-05, -8.966028690338135e-05, -8.618924766778946e-05, -8.271820843219757e-05, -7.924716919660568e-05, -7.57761299610138e-05, -7.23050907254219e-05, -6.883405148983002e-05, -6.536301225423813e-05, -6.189197301864624e-05, -5.842093378305435e-05, -5.494989454746246e-05, -5.1478855311870575e-05, -4.8007816076278687e-05, -4.45367768406868e-05, -4.106573760509491e-05, -3.759469836950302e-05, -3.412365913391113e-05, -3.0652619898319244e-05, -2.7181580662727356e-05, -2.3710541427135468e-05, -2.023950219154358e-05, -1.676846295595169e-05, -1.3297423720359802e-05, -9.826384484767914e-06, -6.355345249176025e-06, -2.884306013584137e-06, 5.867332220077515e-07, 4.05777245759964e-06, 7.528811693191528e-06, 1.0999850928783417e-05, 1.4470890164375305e-05, 1.7941929399967194e-05, 2.1412968635559082e-05, 2.488400787115097e-05, 2.835504710674286e-05, 3.182608634233475e-05, 3.5297125577926636e-05, 3.8768164813518524e-05, 4.223920404911041e-05, 4.57102432847023e-05, 4.918128252029419e-05, 5.265232175588608e-05, 5.6123360991477966e-05, 5.9594400227069855e-05, 6.306543946266174e-05, 6.653647869825363e-05, 7.000751793384552e-05, 7.347855716943741e-05, 7.69495964050293e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 21.0, 25.0, 24.0, 24.0, 63.0, 74.0, 119.0, 170.0, 231.0, 352.0, 559.0, 881.0, 1285.0, 2104.0, 3527.0, 6705.0, 13358.0, 30350.0, 79740.0, 212871.0, 346575.0, 211364.0, 78450.0, 30072.0, 13415.0, 6634.0, 3536.0, 2082.0, 1303.0, 843.0, 625.0, 374.0, 257.0, 144.0, 126.0, 81.0, 56.0, 34.0, 26.0, 13.0, 16.0, 12.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1864013671875, -0.1809978485107422, -0.17559432983398438, -0.17019081115722656, -0.16478729248046875, -0.15938377380371094, -0.15398025512695312, -0.1485767364501953, -0.1431732177734375, -0.1377696990966797, -0.13236618041992188, -0.12696266174316406, -0.12155914306640625, -0.11615562438964844, -0.11075210571289062, -0.10534858703613281, -0.099945068359375, -0.09454154968261719, -0.08913803100585938, -0.08373451232910156, -0.07833099365234375, -0.07292747497558594, -0.06752395629882812, -0.06212043762207031, -0.0567169189453125, -0.05131340026855469, -0.045909881591796875, -0.04050636291503906, -0.03510284423828125, -0.029699325561523438, -0.024295806884765625, -0.018892288208007812, -0.01348876953125, -0.008085250854492188, -0.002681732177734375, 0.0027217864990234375, 0.00812530517578125, 0.013528823852539062, 0.018932342529296875, 0.024335861206054688, 0.0297393798828125, 0.03514289855957031, 0.040546417236328125, 0.04594993591308594, 0.05135345458984375, 0.05675697326660156, 0.062160491943359375, 0.06756401062011719, 0.072967529296875, 0.07837104797363281, 0.08377456665039062, 0.08917808532714844, 0.09458160400390625, 0.09998512268066406, 0.10538864135742188, 0.11079216003417969, 0.1161956787109375, 0.12159919738769531, 0.12700271606445312, 0.13240623474121094, 0.13780975341796875, 0.14321327209472656, 0.14861679077148438, 0.1540203094482422, 0.159423828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 11.0, 7.0, 11.0, 16.0, 15.0, 20.0, 15.0, 24.0, 55.0, 66.0, 73.0, 91.0, 98.0, 120.0, 81.0, 67.0, 54.0, 29.0, 31.0, 19.0, 14.0, 10.0, 14.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.250244140625, -0.24211883544921875, -0.2339935302734375, -0.22586822509765625, -0.217742919921875, -0.20961761474609375, -0.2014923095703125, -0.19336700439453125, -0.18524169921875, -0.17711639404296875, -0.1689910888671875, -0.16086578369140625, -0.152740478515625, -0.14461517333984375, -0.1364898681640625, -0.12836456298828125, -0.1202392578125, -0.11211395263671875, -0.1039886474609375, -0.09586334228515625, -0.087738037109375, -0.07961273193359375, -0.0714874267578125, -0.06336212158203125, -0.05523681640625, -0.04711151123046875, -0.0389862060546875, -0.03086090087890625, -0.022735595703125, -0.01461029052734375, -0.0064849853515625, 0.00164031982421875, 0.009765625, 0.01789093017578125, 0.0260162353515625, 0.03414154052734375, 0.042266845703125, 0.05039215087890625, 0.0585174560546875, 0.06664276123046875, 0.07476806640625, 0.08289337158203125, 0.0910186767578125, 0.09914398193359375, 0.107269287109375, 0.11539459228515625, 0.1235198974609375, 0.13164520263671875, 0.1397705078125, 0.14789581298828125, 0.1560211181640625, 0.16414642333984375, 0.172271728515625, 0.18039703369140625, 0.1885223388671875, 0.19664764404296875, 0.20477294921875, 0.21289825439453125, 0.2210235595703125, 0.22914886474609375, 0.237274169921875, 0.24539947509765625, 0.2535247802734375, 0.26165008544921875, 0.269775390625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 1.0, 1.0, 9.0, 10.0, 14.0, 28.0, 64.0, 107.0, 200.0, 237.0, 158.0, 83.0, 46.0, 18.0, 9.0, 9.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.646662712097168, -6.449023723602295, -6.251384735107422, -6.053746223449707, -5.856107234954834, -5.658468246459961, -5.460829257965088, -5.263190269470215, -5.0655517578125, -4.867912769317627, -4.670273780822754, -4.472635269165039, -4.274996280670166, -4.077357292175293, -3.87971830368042, -3.682079553604126, -3.484440565109253, -3.28680157661438, -3.089162826538086, -2.891523838043213, -2.693885087966919, -2.496246099472046, -2.298607349395752, -2.100968360900879, -1.9033294916152954, -1.705690622329712, -1.5080517530441284, -1.310412883758545, -1.1127738952636719, -0.9151350855827332, -0.7174961566925049, -0.5198572874069214, -0.3222184181213379, -0.1245795339345932, 0.07305935025215149, 0.2706982493400574, 0.46833711862564087, 0.6659759879112244, 0.8636149168014526, 1.0612537860870361, 1.2588926553726196, 1.4565315246582031, 1.6541703939437866, 1.8518092632293701, 2.049448251724243, 2.247087001800537, 2.44472599029541, 2.642364978790283, 2.840003728866577, 3.03764271736145, 3.235281467437744, 3.432920455932617, 3.630559206008911, 3.828198194503784, 4.025836944580078, 4.223475933074951, 4.421114921569824, 4.618753910064697, 4.81639289855957, 5.014031410217285, 5.211670398712158, 5.409309387207031, 5.606948375701904, 5.804587364196777, 6.002225875854492]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 6.0, 6.0, 9.0, 14.0, 11.0, 19.0, 18.0, 27.0, 31.0, 24.0, 31.0, 42.0, 36.0, 39.0, 35.0, 39.0, 46.0, 32.0, 51.0, 42.0, 29.0, 45.0, 38.0, 36.0, 37.0, 45.0, 30.0, 35.0, 27.0, 18.0, 17.0, 9.0, 8.0, 11.0, 6.0, 5.0, 6.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.6855623722076416, -2.6018378734588623, -2.518113136291504, -2.4343886375427246, -2.3506641387939453, -2.266939401626587, -2.1832149028778076, -2.099490165710449, -2.01576566696167, -1.932041049003601, -1.8483164310455322, -1.764591932296753, -1.680867314338684, -1.5971426963806152, -1.513418197631836, -1.429693579673767, -1.3459689617156982, -1.2622443437576294, -1.1785197257995605, -1.0947952270507812, -1.0110706090927124, -0.9273459911346436, -0.8436214327812195, -0.7598968744277954, -0.6761722564697266, -0.5924476385116577, -0.5087230801582336, -0.4249984920024872, -0.3412739038467407, -0.25754931569099426, -0.1738247275352478, -0.09010016918182373, -0.006375312805175781, 0.07734927535057068, 0.16107386350631714, 0.2447984516620636, 0.32852303981781006, 0.4122476279735565, 0.495972216129303, 0.579696774482727, 0.6634213924407959, 0.7471460103988647, 0.8308705687522888, 0.9145951271057129, 0.9983197450637817, 1.0820443630218506, 1.1657688617706299, 1.2494934797286987, 1.3332180976867676, 1.4169427156448364, 1.5006673336029053, 1.5843918323516846, 1.6681164503097534, 1.7518410682678223, 1.8355655670166016, 1.9192901849746704, 2.0030148029327393, 2.0867393016815186, 2.170464038848877, 2.2541885375976562, 2.3379130363464355, 2.421637773513794, 2.5053622722625732, 2.5890870094299316, 2.672811508178711]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 13.0, 9.0, 21.0, 34.0, 39.0, 67.0, 91.0, 127.0, 168.0, 214.0, 353.0, 555.0, 875.0, 1467.0, 2558.0, 5085.0, 11288.0, 32850.0, 135032.0, 547482.0, 1470048.0, 1363491.0, 463378.0, 108192.0, 29116.0, 10486.0, 4698.0, 2427.0, 1382.0, 870.0, 575.0, 370.0, 245.0, 176.0, 129.0, 94.0, 81.0, 52.0, 45.0, 23.0, 18.0, 17.0, 8.0, 12.0, 2.0, 8.0, 6.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.52294921875, -0.5075416564941406, -0.49213409423828125, -0.4767265319824219, -0.4613189697265625, -0.4459114074707031, -0.43050384521484375, -0.4150962829589844, -0.399688720703125, -0.3842811584472656, -0.36887359619140625, -0.3534660339355469, -0.3380584716796875, -0.3226509094238281, -0.30724334716796875, -0.2918357849121094, -0.27642822265625, -0.2610206604003906, -0.24561309814453125, -0.23020553588867188, -0.2147979736328125, -0.19939041137695312, -0.18398284912109375, -0.16857528686523438, -0.153167724609375, -0.13776016235351562, -0.12235260009765625, -0.10694503784179688, -0.0915374755859375, -0.07612991333007812, -0.06072235107421875, -0.045314788818359375, -0.0299072265625, -0.014499664306640625, 0.00090789794921875, 0.016315460205078125, 0.0317230224609375, 0.047130584716796875, 0.06253814697265625, 0.07794570922851562, 0.093353271484375, 0.10876083374023438, 0.12416839599609375, 0.13957595825195312, 0.1549835205078125, 0.17039108276367188, 0.18579864501953125, 0.20120620727539062, 0.21661376953125, 0.23202133178710938, 0.24742889404296875, 0.2628364562988281, 0.2782440185546875, 0.2936515808105469, 0.30905914306640625, 0.3244667053222656, 0.339874267578125, 0.3552818298339844, 0.37068939208984375, 0.3860969543457031, 0.4015045166015625, 0.4169120788574219, 0.43231964111328125, 0.4477272033691406, 0.463134765625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 9.0, 6.0, 5.0, 11.0, 5.0, 14.0, 14.0, 12.0, 19.0, 26.0, 31.0, 20.0, 28.0, 34.0, 38.0, 31.0, 47.0, 46.0, 52.0, 54.0, 53.0, 56.0, 32.0, 47.0, 36.0, 42.0, 29.0, 30.0, 27.0, 22.0, 22.0, 20.0, 15.0, 16.0, 9.0, 14.0, 9.0, 7.0, 4.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.443359375, -0.43099212646484375, -0.4186248779296875, -0.40625762939453125, -0.393890380859375, -0.38152313232421875, -0.3691558837890625, -0.35678863525390625, -0.34442138671875, -0.33205413818359375, -0.3196868896484375, -0.30731964111328125, -0.294952392578125, -0.28258514404296875, -0.2702178955078125, -0.25785064697265625, -0.2454833984375, -0.23311614990234375, -0.2207489013671875, -0.20838165283203125, -0.196014404296875, -0.18364715576171875, -0.1712799072265625, -0.15891265869140625, -0.14654541015625, -0.13417816162109375, -0.1218109130859375, -0.10944366455078125, -0.097076416015625, -0.08470916748046875, -0.0723419189453125, -0.05997467041015625, -0.047607421875, -0.03524017333984375, -0.0228729248046875, -0.01050567626953125, 0.001861572265625, 0.01422882080078125, 0.0265960693359375, 0.03896331787109375, 0.05133056640625, 0.06369781494140625, 0.0760650634765625, 0.08843231201171875, 0.100799560546875, 0.11316680908203125, 0.1255340576171875, 0.13790130615234375, 0.1502685546875, 0.16263580322265625, 0.1750030517578125, 0.18737030029296875, 0.199737548828125, 0.21210479736328125, 0.2244720458984375, 0.23683929443359375, 0.24920654296875, 0.26157379150390625, 0.2739410400390625, 0.28630828857421875, 0.298675537109375, 0.31104278564453125, 0.3234100341796875, 0.33577728271484375, 0.34814453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 8.0, 8.0, 17.0, 16.0, 27.0, 50.0, 63.0, 80.0, 145.0, 200.0, 362.0, 567.0, 930.0, 1655.0, 3142.0, 6614.0, 15538.0, 40771.0, 136183.0, 736936.0, 2525497.0, 551613.0, 112844.0, 34864.0, 13553.0, 5850.0, 2972.0, 1524.0, 813.0, 507.0, 342.0, 198.0, 125.0, 95.0, 57.0, 34.0, 25.0, 21.0, 13.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.55322265625, -0.5350418090820312, -0.5168609619140625, -0.49868011474609375, -0.480499267578125, -0.46231842041015625, -0.4441375732421875, -0.42595672607421875, -0.40777587890625, -0.38959503173828125, -0.3714141845703125, -0.35323333740234375, -0.335052490234375, -0.31687164306640625, -0.2986907958984375, -0.28050994873046875, -0.2623291015625, -0.24414825439453125, -0.2259674072265625, -0.20778656005859375, -0.189605712890625, -0.17142486572265625, -0.1532440185546875, -0.13506317138671875, -0.11688232421875, -0.09870147705078125, -0.0805206298828125, -0.06233978271484375, -0.044158935546875, -0.02597808837890625, -0.0077972412109375, 0.01038360595703125, 0.028564453125, 0.04674530029296875, 0.0649261474609375, 0.08310699462890625, 0.101287841796875, 0.11946868896484375, 0.1376495361328125, 0.15583038330078125, 0.17401123046875, 0.19219207763671875, 0.2103729248046875, 0.22855377197265625, 0.246734619140625, 0.26491546630859375, 0.2830963134765625, 0.30127716064453125, 0.3194580078125, 0.33763885498046875, 0.3558197021484375, 0.37400054931640625, 0.392181396484375, 0.41036224365234375, 0.4285430908203125, 0.44672393798828125, 0.46490478515625, 0.48308563232421875, 0.5012664794921875, 0.5194473266601562, 0.537628173828125, 0.5558090209960938, 0.5739898681640625, 0.5921707153320312, 0.6103515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 11.0, 10.0, 14.0, 12.0, 25.0, 41.0, 56.0, 100.0, 143.0, 243.0, 454.0, 631.0, 830.0, 592.0, 364.0, 208.0, 104.0, 76.0, 39.0, 39.0, 22.0, 18.0, 11.0, 12.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80859375, -0.7790374755859375, -0.749481201171875, -0.7199249267578125, -0.69036865234375, -0.6608123779296875, -0.631256103515625, -0.6016998291015625, -0.5721435546875, -0.5425872802734375, -0.513031005859375, -0.4834747314453125, -0.45391845703125, -0.4243621826171875, -0.394805908203125, -0.3652496337890625, -0.335693359375, -0.3061370849609375, -0.276580810546875, -0.2470245361328125, -0.21746826171875, -0.1879119873046875, -0.158355712890625, -0.1287994384765625, -0.0992431640625, -0.0696868896484375, -0.040130615234375, -0.0105743408203125, 0.01898193359375, 0.0485382080078125, 0.078094482421875, 0.1076507568359375, 0.13720703125, 0.1667633056640625, 0.196319580078125, 0.2258758544921875, 0.25543212890625, 0.2849884033203125, 0.314544677734375, 0.3441009521484375, 0.3736572265625, 0.4032135009765625, 0.432769775390625, 0.4623260498046875, 0.49188232421875, 0.5214385986328125, 0.550994873046875, 0.5805511474609375, 0.610107421875, 0.6396636962890625, 0.669219970703125, 0.6987762451171875, 0.72833251953125, 0.7578887939453125, 0.787445068359375, 0.8170013427734375, 0.8465576171875, 0.8761138916015625, 0.905670166015625, 0.9352264404296875, 0.96478271484375, 0.9943389892578125, 1.023895263671875, 1.0534515380859375, 1.0830078125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 8.0, 11.0, 27.0, 53.0, 87.0, 198.0, 259.0, 163.0, 106.0, 49.0, 22.0, 10.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.604303359985352, -9.361337661743164, -9.11837100982666, -8.875405311584473, -8.632438659667969, -8.389472961425781, -8.146507263183594, -7.90354061126709, -7.660574913024902, -7.417608737945557, -7.174642562866211, -6.931676864624023, -6.688710689544678, -6.445744514465332, -6.202778339385986, -5.959812164306641, -5.716845989227295, -5.473879814147949, -5.2309136390686035, -4.987947463989258, -4.74498176574707, -4.502015590667725, -4.259049415588379, -4.016083240509033, -3.7731173038482666, -3.530151128768921, -3.2871851921081543, -3.0442190170288086, -2.801252841949463, -2.5582869052886963, -2.3153207302093506, -2.072354793548584, -1.8293886184692383, -1.5864225625991821, -1.343456506729126, -1.1004903316497803, -0.8575242757797241, -0.614558219909668, -0.37159204483032227, -0.1286259889602661, 0.11434006690979004, 0.3573061525821686, 0.6002722382545471, 0.843238353729248, 1.0862044095993042, 1.3291704654693604, 1.572136640548706, 1.8151026964187622, 2.0580687522888184, 2.301034927368164, 2.5440008640289307, 2.7869670391082764, 3.029932975769043, 3.2728991508483887, 3.5158653259277344, 3.75883150100708, 4.001797676086426, 4.2447638511657715, 4.487730026245117, 4.730695724487305, 4.97366189956665, 5.216628074645996, 5.459594249725342, 5.7025604248046875, 5.945526123046875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 5.0, 7.0, 11.0, 8.0, 14.0, 21.0, 18.0, 18.0, 22.0, 23.0, 23.0, 26.0, 26.0, 31.0, 31.0, 37.0, 33.0, 44.0, 38.0, 53.0, 41.0, 30.0, 49.0, 40.0, 35.0, 32.0, 33.0, 31.0, 30.0, 25.0, 31.0, 21.0, 23.0, 16.0, 15.0, 10.0, 6.0, 7.0, 8.0, 3.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9542481899261475, -1.8868615627288818, -1.8194748163223267, -1.7520880699157715, -1.6847014427185059, -1.6173148155212402, -1.549928069114685, -1.4825413227081299, -1.4151546955108643, -1.3477680683135986, -1.2803813219070435, -1.2129945755004883, -1.1456079483032227, -1.078221321105957, -1.0108345746994019, -0.9434478878974915, -0.876061201095581, -0.8086745142936707, -0.7412878274917603, -0.6739011406898499, -0.6065144538879395, -0.539127767086029, -0.47174108028411865, -0.40435439348220825, -0.33696770668029785, -0.26958101987838745, -0.20219433307647705, -0.13480764627456665, -0.06742095947265625, -3.427267074584961e-05, 0.06735241413116455, 0.13473910093307495, 0.20212578773498535, 0.26951247453689575, 0.33689916133880615, 0.40428584814071655, 0.47167253494262695, 0.5390592217445374, 0.6064459085464478, 0.6738325953483582, 0.7412192821502686, 0.808605968952179, 0.8759926557540894, 0.9433793425559998, 1.0107660293579102, 1.0781526565551758, 1.145539402961731, 1.2129261493682861, 1.2803127765655518, 1.3476994037628174, 1.4150861501693726, 1.4824728965759277, 1.5498595237731934, 1.617246150970459, 1.6846328973770142, 1.7520196437835693, 1.819406270980835, 1.8867928981781006, 1.9541796445846558, 2.021566390991211, 2.0889530181884766, 2.156339645385742, 2.223726272583008, 2.2911131381988525, 2.358499765396118]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 13.0, 11.0, 18.0, 21.0, 47.0, 81.0, 104.0, 149.0, 232.0, 346.0, 572.0, 877.0, 1307.0, 2050.0, 3259.0, 5296.0, 8682.0, 14263.0, 24208.0, 41344.0, 71206.0, 116744.0, 172561.0, 193054.0, 152527.0, 97027.0, 57893.0, 33601.0, 20012.0, 11835.0, 7038.0, 4305.0, 2872.0, 1760.0, 1081.0, 764.0, 461.0, 325.0, 186.0, 140.0, 90.0, 50.0, 35.0, 39.0, 14.0, 11.0, 15.0, 4.0, 9.0, 3.0, 2.0, 3.0, 0.0, 3.0], "bins": [-0.32568359375, -0.3159065246582031, -0.30612945556640625, -0.2963523864746094, -0.2865753173828125, -0.2767982482910156, -0.26702117919921875, -0.2572441101074219, -0.247467041015625, -0.23768997192382812, -0.22791290283203125, -0.21813583374023438, -0.2083587646484375, -0.19858169555664062, -0.18880462646484375, -0.17902755737304688, -0.16925048828125, -0.15947341918945312, -0.14969635009765625, -0.13991928100585938, -0.1301422119140625, -0.12036514282226562, -0.11058807373046875, -0.10081100463867188, -0.091033935546875, -0.08125686645507812, -0.07147979736328125, -0.061702728271484375, -0.0519256591796875, -0.042148590087890625, -0.03237152099609375, -0.022594451904296875, -0.0128173828125, -0.003040313720703125, 0.00673675537109375, 0.016513824462890625, 0.0262908935546875, 0.036067962646484375, 0.04584503173828125, 0.055622100830078125, 0.065399169921875, 0.07517623901367188, 0.08495330810546875, 0.09473037719726562, 0.1045074462890625, 0.11428451538085938, 0.12406158447265625, 0.13383865356445312, 0.14361572265625, 0.15339279174804688, 0.16316986083984375, 0.17294692993164062, 0.1827239990234375, 0.19250106811523438, 0.20227813720703125, 0.21205520629882812, 0.221832275390625, 0.23160934448242188, 0.24138641357421875, 0.2511634826660156, 0.2609405517578125, 0.2707176208496094, 0.28049468994140625, 0.2902717590332031, 0.300048828125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 0.0, 8.0, 5.0, 6.0, 5.0, 14.0, 15.0, 18.0, 13.0, 22.0, 22.0, 22.0, 14.0, 35.0, 31.0, 41.0, 27.0, 40.0, 44.0, 39.0, 35.0, 38.0, 38.0, 39.0, 47.0, 42.0, 31.0, 32.0, 40.0, 25.0, 34.0, 35.0, 22.0, 22.0, 17.0, 10.0, 16.0, 8.0, 6.0, 7.0, 9.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.37060546875, -0.35857391357421875, -0.3465423583984375, -0.33451080322265625, -0.322479248046875, -0.31044769287109375, -0.2984161376953125, -0.28638458251953125, -0.27435302734375, -0.26232147216796875, -0.2502899169921875, -0.23825836181640625, -0.226226806640625, -0.21419525146484375, -0.2021636962890625, -0.19013214111328125, -0.1781005859375, -0.16606903076171875, -0.1540374755859375, -0.14200592041015625, -0.129974365234375, -0.11794281005859375, -0.1059112548828125, -0.09387969970703125, -0.08184814453125, -0.06981658935546875, -0.0577850341796875, -0.04575347900390625, -0.033721923828125, -0.02169036865234375, -0.0096588134765625, 0.00237274169921875, 0.014404296875, 0.02643585205078125, 0.0384674072265625, 0.05049896240234375, 0.062530517578125, 0.07456207275390625, 0.0865936279296875, 0.09862518310546875, 0.11065673828125, 0.12268829345703125, 0.1347198486328125, 0.14675140380859375, 0.158782958984375, 0.17081451416015625, 0.1828460693359375, 0.19487762451171875, 0.2069091796875, 0.21894073486328125, 0.2309722900390625, 0.24300384521484375, 0.255035400390625, 0.26706695556640625, 0.2790985107421875, 0.29113006591796875, 0.30316162109375, 0.31519317626953125, 0.3272247314453125, 0.33925628662109375, 0.351287841796875, 0.36331939697265625, 0.3753509521484375, 0.38738250732421875, 0.3994140625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 8.0, 12.0, 15.0, 28.0, 37.0, 53.0, 59.0, 93.0, 146.0, 246.0, 328.0, 576.0, 966.0, 1506.0, 2635.0, 4535.0, 8127.0, 15269.0, 29220.0, 58745.0, 118396.0, 214085.0, 270471.0, 158020.0, 80174.0, 39633.0, 20269.0, 10673.0, 5731.0, 3387.0, 1907.0, 1221.0, 682.0, 419.0, 290.0, 171.0, 143.0, 96.0, 46.0, 46.0, 26.0, 21.0, 8.0, 8.0, 6.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.40966796875, -0.3969535827636719, -0.38423919677734375, -0.3715248107910156, -0.3588104248046875, -0.3460960388183594, -0.33338165283203125, -0.3206672668457031, -0.307952880859375, -0.2952384948730469, -0.28252410888671875, -0.2698097229003906, -0.2570953369140625, -0.24438095092773438, -0.23166656494140625, -0.21895217895507812, -0.20623779296875, -0.19352340698242188, -0.18080902099609375, -0.16809463500976562, -0.1553802490234375, -0.14266586303710938, -0.12995147705078125, -0.11723709106445312, -0.104522705078125, -0.09180831909179688, -0.07909393310546875, -0.06637954711914062, -0.0536651611328125, -0.040950775146484375, -0.02823638916015625, -0.015522003173828125, -0.0028076171875, 0.009906768798828125, 0.02262115478515625, 0.035335540771484375, 0.0480499267578125, 0.060764312744140625, 0.07347869873046875, 0.08619308471679688, 0.098907470703125, 0.11162185668945312, 0.12433624267578125, 0.13705062866210938, 0.1497650146484375, 0.16247940063476562, 0.17519378662109375, 0.18790817260742188, 0.20062255859375, 0.21333694458007812, 0.22605133056640625, 0.23876571655273438, 0.2514801025390625, 0.2641944885253906, 0.27690887451171875, 0.2896232604980469, 0.302337646484375, 0.3150520324707031, 0.32776641845703125, 0.3404808044433594, 0.3531951904296875, 0.3659095764160156, 0.37862396240234375, 0.3913383483886719, 0.404052734375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 5.0, 7.0, 5.0, 9.0, 11.0, 19.0, 13.0, 31.0, 15.0, 32.0, 33.0, 28.0, 38.0, 31.0, 40.0, 42.0, 43.0, 42.0, 47.0, 51.0, 38.0, 46.0, 41.0, 49.0, 34.0, 34.0, 27.0, 33.0, 19.0, 30.0, 21.0, 28.0, 12.0, 8.0, 11.0, 5.0, 2.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.001953125, -0.9674224853515625, -0.932891845703125, -0.8983612060546875, -0.86383056640625, -0.8292999267578125, -0.794769287109375, -0.7602386474609375, -0.7257080078125, -0.6911773681640625, -0.656646728515625, -0.6221160888671875, -0.58758544921875, -0.5530548095703125, -0.518524169921875, -0.4839935302734375, -0.449462890625, -0.4149322509765625, -0.380401611328125, -0.3458709716796875, -0.31134033203125, -0.2768096923828125, -0.242279052734375, -0.2077484130859375, -0.1732177734375, -0.1386871337890625, -0.104156494140625, -0.0696258544921875, -0.03509521484375, -0.0005645751953125, 0.033966064453125, 0.0684967041015625, 0.10302734375, 0.1375579833984375, 0.172088623046875, 0.2066192626953125, 0.24114990234375, 0.2756805419921875, 0.310211181640625, 0.3447418212890625, 0.3792724609375, 0.4138031005859375, 0.448333740234375, 0.4828643798828125, 0.51739501953125, 0.5519256591796875, 0.586456298828125, 0.6209869384765625, 0.655517578125, 0.6900482177734375, 0.724578857421875, 0.7591094970703125, 0.79364013671875, 0.8281707763671875, 0.862701416015625, 0.8972320556640625, 0.9317626953125, 0.9662933349609375, 1.000823974609375, 1.0353546142578125, 1.06988525390625, 1.1044158935546875, 1.138946533203125, 1.1734771728515625, 1.2080078125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 6.0, 15.0, 18.0, 20.0, 37.0, 45.0, 61.0, 83.0, 122.0, 164.0, 249.0, 374.0, 580.0, 833.0, 1335.0, 2189.0, 3525.0, 5998.0, 10695.0, 19107.0, 35797.0, 68764.0, 127624.0, 209285.0, 243844.0, 145278.0, 79432.0, 41373.0, 21901.0, 12077.0, 6893.0, 3906.0, 2445.0, 1523.0, 967.0, 640.0, 407.0, 255.0, 188.0, 181.0, 95.0, 60.0, 43.0, 39.0, 27.0, 17.0, 17.0, 8.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.08135986328125, -0.07874488830566406, -0.07612991333007812, -0.07351493835449219, -0.07089996337890625, -0.06828498840332031, -0.06567001342773438, -0.06305503845214844, -0.0604400634765625, -0.05782508850097656, -0.055210113525390625, -0.05259513854980469, -0.04998016357421875, -0.04736518859863281, -0.044750213623046875, -0.04213523864746094, -0.039520263671875, -0.03690528869628906, -0.034290313720703125, -0.03167533874511719, -0.02906036376953125, -0.026445388793945312, -0.023830413818359375, -0.021215438842773438, -0.0186004638671875, -0.015985488891601562, -0.013370513916015625, -0.010755538940429688, -0.00814056396484375, -0.0055255889892578125, -0.002910614013671875, -0.0002956390380859375, 0.0023193359375, 0.0049343109130859375, 0.007549285888671875, 0.010164260864257812, 0.01277923583984375, 0.015394210815429688, 0.018009185791015625, 0.020624160766601562, 0.0232391357421875, 0.025854110717773438, 0.028469085693359375, 0.031084060668945312, 0.03369903564453125, 0.03631401062011719, 0.038928985595703125, 0.04154396057128906, 0.044158935546875, 0.04677391052246094, 0.049388885498046875, 0.05200386047363281, 0.05461883544921875, 0.05723381042480469, 0.059848785400390625, 0.06246376037597656, 0.0650787353515625, 0.06769371032714844, 0.07030868530273438, 0.07292366027832031, 0.07553863525390625, 0.07815361022949219, 0.08076858520507812, 0.08338356018066406, 0.08599853515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 6.0, 2.0, 6.0, 9.0, 8.0, 7.0, 8.0, 10.0, 9.0, 15.0, 16.0, 21.0, 43.0, 38.0, 39.0, 57.0, 63.0, 77.0, 75.0, 86.0, 68.0, 58.0, 46.0, 49.0, 23.0, 28.0, 27.0, 20.0, 16.0, 19.0, 12.0, 12.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.6372413635253906e-05, -4.49158251285553e-05, -4.345923662185669e-05, -4.200264811515808e-05, -4.054605960845947e-05, -3.9089471101760864e-05, -3.7632882595062256e-05, -3.617629408836365e-05, -3.471970558166504e-05, -3.326311707496643e-05, -3.180652856826782e-05, -3.0349940061569214e-05, -2.8893351554870605e-05, -2.7436763048171997e-05, -2.598017454147339e-05, -2.452358603477478e-05, -2.3066997528076172e-05, -2.1610409021377563e-05, -2.0153820514678955e-05, -1.8697232007980347e-05, -1.7240643501281738e-05, -1.578405499458313e-05, -1.4327466487884521e-05, -1.2870877981185913e-05, -1.1414289474487305e-05, -9.957700967788696e-06, -8.501112461090088e-06, -7.0445239543914795e-06, -5.587935447692871e-06, -4.131346940994263e-06, -2.6747584342956543e-06, -1.218169927597046e-06, 2.384185791015625e-07, 1.695007085800171e-06, 3.1515955924987793e-06, 4.608184099197388e-06, 6.064772605895996e-06, 7.5213611125946045e-06, 8.977949619293213e-06, 1.0434538125991821e-05, 1.189112663269043e-05, 1.3347715139389038e-05, 1.4804303646087646e-05, 1.6260892152786255e-05, 1.7717480659484863e-05, 1.917406916618347e-05, 2.063065767288208e-05, 2.208724617958069e-05, 2.3543834686279297e-05, 2.5000423192977905e-05, 2.6457011699676514e-05, 2.7913600206375122e-05, 2.937018871307373e-05, 3.082677721977234e-05, 3.228336572647095e-05, 3.3739954233169556e-05, 3.5196542739868164e-05, 3.665313124656677e-05, 3.810971975326538e-05, 3.956630825996399e-05, 4.10228967666626e-05, 4.2479485273361206e-05, 4.3936073780059814e-05, 4.539266228675842e-05, 4.684925079345703e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 21.0, 31.0, 38.0, 57.0, 78.0, 101.0, 152.0, 207.0, 336.0, 537.0, 748.0, 1201.0, 1850.0, 2902.0, 4945.0, 8331.0, 14975.0, 26776.0, 49894.0, 90577.0, 152841.0, 232997.0, 186896.0, 119764.0, 67644.0, 36376.0, 20137.0, 11134.0, 6337.0, 3758.0, 2442.0, 1503.0, 966.0, 638.0, 468.0, 261.0, 187.0, 132.0, 85.0, 72.0, 46.0, 33.0, 24.0, 13.0, 8.0, 13.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.07232666015625, -0.06997489929199219, -0.06762313842773438, -0.06527137756347656, -0.06291961669921875, -0.06056785583496094, -0.058216094970703125, -0.05586433410644531, -0.0535125732421875, -0.05116081237792969, -0.048809051513671875, -0.04645729064941406, -0.04410552978515625, -0.04175376892089844, -0.039402008056640625, -0.03705024719238281, -0.034698486328125, -0.03234672546386719, -0.029994964599609375, -0.027643203735351562, -0.02529144287109375, -0.022939682006835938, -0.020587921142578125, -0.018236160278320312, -0.0158843994140625, -0.013532638549804688, -0.011180877685546875, -0.008829116821289062, -0.00647735595703125, -0.0041255950927734375, -0.001773834228515625, 0.0005779266357421875, 0.0029296875, 0.0052814483642578125, 0.007633209228515625, 0.009984970092773438, 0.01233673095703125, 0.014688491821289062, 0.017040252685546875, 0.019392013549804688, 0.0217437744140625, 0.024095535278320312, 0.026447296142578125, 0.028799057006835938, 0.03115081787109375, 0.03350257873535156, 0.035854339599609375, 0.03820610046386719, 0.040557861328125, 0.04290962219238281, 0.045261383056640625, 0.04761314392089844, 0.04996490478515625, 0.05231666564941406, 0.054668426513671875, 0.05702018737792969, 0.0593719482421875, 0.06172370910644531, 0.06407546997070312, 0.06642723083496094, 0.06877899169921875, 0.07113075256347656, 0.07348251342773438, 0.07583427429199219, 0.07818603515625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 7.0, 10.0, 11.0, 12.0, 17.0, 24.0, 26.0, 17.0, 33.0, 40.0, 41.0, 59.0, 61.0, 54.0, 83.0, 54.0, 72.0, 55.0, 64.0, 44.0, 33.0, 25.0, 31.0, 24.0, 17.0, 22.0, 16.0, 10.0, 4.0, 9.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1380615234375, -0.13360595703125, -0.129150390625, -0.12469482421875, -0.1202392578125, -0.11578369140625, -0.111328125, -0.10687255859375, -0.1024169921875, -0.09796142578125, -0.093505859375, -0.08905029296875, -0.0845947265625, -0.08013916015625, -0.07568359375, -0.07122802734375, -0.0667724609375, -0.06231689453125, -0.057861328125, -0.05340576171875, -0.0489501953125, -0.04449462890625, -0.0400390625, -0.03558349609375, -0.0311279296875, -0.02667236328125, -0.022216796875, -0.01776123046875, -0.0133056640625, -0.00885009765625, -0.00439453125, 6.103515625e-05, 0.0045166015625, 0.00897216796875, 0.013427734375, 0.01788330078125, 0.0223388671875, 0.02679443359375, 0.03125, 0.03570556640625, 0.0401611328125, 0.04461669921875, 0.049072265625, 0.05352783203125, 0.0579833984375, 0.06243896484375, 0.06689453125, 0.07135009765625, 0.0758056640625, 0.08026123046875, 0.084716796875, 0.08917236328125, 0.0936279296875, 0.09808349609375, 0.1025390625, 0.10699462890625, 0.1114501953125, 0.11590576171875, 0.120361328125, 0.12481689453125, 0.1292724609375, 0.13372802734375, 0.13818359375, 0.14263916015625, 0.1470947265625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 14.0, 28.0, 47.0, 72.0, 106.0, 146.0, 182.0, 141.0, 104.0, 62.0, 44.0, 18.0, 10.0, 5.0, 1.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.143479824066162, -4.026763439178467, -3.9100470542907715, -3.793330669403076, -3.676614284515381, -3.5598978996276855, -3.4431815147399902, -3.326465129852295, -3.2097487449645996, -3.0930323600769043, -2.976315975189209, -2.8595995903015137, -2.7428832054138184, -2.626166820526123, -2.5094504356384277, -2.3927340507507324, -2.276017665863037, -2.159301280975342, -2.0425848960876465, -1.9258685111999512, -1.8091521263122559, -1.6924357414245605, -1.5757193565368652, -1.45900297164917, -1.3422863483428955, -1.2255699634552002, -1.1088535785675049, -0.9921371936798096, -0.8754208087921143, -0.7587043642997742, -0.6419879794120789, -0.5252715945243835, -0.408555269241333, -0.2918388843536377, -0.1751224845647812, -0.05840608477592468, 0.05831030011177063, 0.17502671480178833, 0.29174309968948364, 0.40845948457717896, 0.5251758694648743, 0.6418922543525696, 0.7586086392402649, 0.875325083732605, 0.9920414686203003, 1.1087578535079956, 1.225474238395691, 1.3421906232833862, 1.4589070081710815, 1.5756233930587769, 1.6923397779464722, 1.8090561628341675, 1.9257725477218628, 2.0424890518188477, 2.159205436706543, 2.2759218215942383, 2.3926382064819336, 2.509354591369629, 2.626070976257324, 2.7427873611450195, 2.859503746032715, 2.97622013092041, 3.0929365158081055, 3.209652900695801, 3.326369285583496]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 7.0, 6.0, 6.0, 12.0, 11.0, 15.0, 13.0, 24.0, 20.0, 28.0, 38.0, 29.0, 40.0, 49.0, 46.0, 47.0, 37.0, 44.0, 48.0, 50.0, 47.0, 33.0, 42.0, 43.0, 40.0, 32.0, 33.0, 18.0, 14.0, 20.0, 18.0, 14.0, 19.0, 11.0, 8.0, 10.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.652841567993164, -2.5749683380126953, -2.4970951080322266, -2.419222116470337, -2.341348886489868, -2.2634756565093994, -2.1856026649475098, -2.107729434967041, -2.0298562049865723, -1.9519829750061035, -1.8741098642349243, -1.7962367534637451, -1.7183635234832764, -1.6404902935028076, -1.5626171827316284, -1.4847440719604492, -1.4068708419799805, -1.3289976119995117, -1.2511245012283325, -1.1732513904571533, -1.0953781604766846, -1.0175049304962158, -0.9396318197250366, -0.8617586493492126, -0.7838854789733887, -0.7060123085975647, -0.6281391382217407, -0.5502659678459167, -0.4723927974700928, -0.3945196270942688, -0.3166464567184448, -0.23877328634262085, -0.16090011596679688, -0.0830269455909729, -0.005153775215148926, 0.07271939516067505, 0.15059256553649902, 0.228465735912323, 0.306338906288147, 0.38421207666397095, 0.4620852470397949, 0.5399584174156189, 0.6178315877914429, 0.6957047581672668, 0.7735779285430908, 0.8514510989189148, 0.9293242692947388, 1.007197380065918, 1.0850706100463867, 1.1629438400268555, 1.2408169507980347, 1.3186900615692139, 1.3965632915496826, 1.4744365215301514, 1.5523096323013306, 1.6301827430725098, 1.7080559730529785, 1.7859292030334473, 1.8638023138046265, 1.9416754245758057, 2.0195486545562744, 2.097421884536743, 2.175294876098633, 2.2531681060791016, 2.3310413360595703]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 0.0, 8.0, 3.0, 4.0, 8.0, 16.0, 9.0, 14.0, 22.0, 34.0, 31.0, 45.0, 74.0, 80.0, 89.0, 103.0, 113.0, 123.0, 177.0, 278.0, 395.0, 810.0, 2064.0, 7785.0, 56690.0, 921016.0, 2630000.0, 529144.0, 35690.0, 5610.0, 1561.0, 729.0, 342.0, 263.0, 152.0, 162.0, 133.0, 101.0, 82.0, 68.0, 59.0, 52.0, 33.0, 33.0, 16.0, 14.0, 11.0, 11.0, 11.0, 8.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.9794921875, -0.947265625, -0.9150390625, -0.8828125, -0.8505859375, -0.818359375, -0.7861328125, -0.75390625, -0.7216796875, -0.689453125, -0.6572265625, -0.625, -0.5927734375, -0.560546875, -0.5283203125, -0.49609375, -0.4638671875, -0.431640625, -0.3994140625, -0.3671875, -0.3349609375, -0.302734375, -0.2705078125, -0.23828125, -0.2060546875, -0.173828125, -0.1416015625, -0.109375, -0.0771484375, -0.044921875, -0.0126953125, 0.01953125, 0.0517578125, 0.083984375, 0.1162109375, 0.1484375, 0.1806640625, 0.212890625, 0.2451171875, 0.27734375, 0.3095703125, 0.341796875, 0.3740234375, 0.40625, 0.4384765625, 0.470703125, 0.5029296875, 0.53515625, 0.5673828125, 0.599609375, 0.6318359375, 0.6640625, 0.6962890625, 0.728515625, 0.7607421875, 0.79296875, 0.8251953125, 0.857421875, 0.8896484375, 0.921875, 0.9541015625, 0.986328125, 1.0185546875, 1.05078125, 1.0830078125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 2.0, 8.0, 9.0, 8.0, 10.0, 12.0, 10.0, 8.0, 16.0, 18.0, 14.0, 19.0, 24.0, 35.0, 28.0, 30.0, 32.0, 37.0, 32.0, 35.0, 31.0, 31.0, 36.0, 63.0, 30.0, 30.0, 39.0, 30.0, 36.0, 30.0, 28.0, 28.0, 31.0, 23.0, 27.0, 15.0, 12.0, 21.0, 19.0, 11.0, 12.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.34375, -0.3335762023925781, -0.32340240478515625, -0.3132286071777344, -0.3030548095703125, -0.2928810119628906, -0.28270721435546875, -0.2725334167480469, -0.262359619140625, -0.2521858215332031, -0.24201202392578125, -0.23183822631835938, -0.2216644287109375, -0.21149063110351562, -0.20131683349609375, -0.19114303588867188, -0.18096923828125, -0.17079544067382812, -0.16062164306640625, -0.15044784545898438, -0.1402740478515625, -0.13010025024414062, -0.11992645263671875, -0.10975265502929688, -0.099578857421875, -0.08940505981445312, -0.07923126220703125, -0.06905746459960938, -0.0588836669921875, -0.048709869384765625, -0.03853607177734375, -0.028362274169921875, -0.0181884765625, -0.008014678955078125, 0.00215911865234375, 0.012332916259765625, 0.0225067138671875, 0.032680511474609375, 0.04285430908203125, 0.053028106689453125, 0.063201904296875, 0.07337570190429688, 0.08354949951171875, 0.09372329711914062, 0.1038970947265625, 0.11407089233398438, 0.12424468994140625, 0.13441848754882812, 0.14459228515625, 0.15476608276367188, 0.16493988037109375, 0.17511367797851562, 0.1852874755859375, 0.19546127319335938, 0.20563507080078125, 0.21580886840820312, 0.225982666015625, 0.23615646362304688, 0.24633026123046875, 0.2565040588378906, 0.2666778564453125, 0.2768516540527344, 0.28702545166015625, 0.2971992492675781, 0.307373046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 9.0, 8.0, 9.0, 14.0, 30.0, 32.0, 45.0, 50.0, 85.0, 109.0, 188.0, 244.0, 427.0, 717.0, 1286.0, 2700.0, 6124.0, 17454.0, 64879.0, 339620.0, 2346547.0, 1185661.0, 169962.0, 37382.0, 11384.0, 4445.0, 2017.0, 1055.0, 607.0, 356.0, 263.0, 174.0, 118.0, 81.0, 50.0, 36.0, 36.0, 21.0, 16.0, 5.0, 5.0, 11.0, 4.0, 7.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.57275390625, -0.552154541015625, -0.53155517578125, -0.510955810546875, -0.4903564453125, -0.469757080078125, -0.44915771484375, -0.428558349609375, -0.407958984375, -0.387359619140625, -0.36676025390625, -0.346160888671875, -0.3255615234375, -0.304962158203125, -0.28436279296875, -0.263763427734375, -0.2431640625, -0.222564697265625, -0.20196533203125, -0.181365966796875, -0.1607666015625, -0.140167236328125, -0.11956787109375, -0.098968505859375, -0.078369140625, -0.057769775390625, -0.03717041015625, -0.016571044921875, 0.0040283203125, 0.024627685546875, 0.04522705078125, 0.065826416015625, 0.08642578125, 0.107025146484375, 0.12762451171875, 0.148223876953125, 0.1688232421875, 0.189422607421875, 0.21002197265625, 0.230621337890625, 0.251220703125, 0.271820068359375, 0.29241943359375, 0.313018798828125, 0.3336181640625, 0.354217529296875, 0.37481689453125, 0.395416259765625, 0.416015625, 0.436614990234375, 0.45721435546875, 0.477813720703125, 0.4984130859375, 0.519012451171875, 0.53961181640625, 0.560211181640625, 0.580810546875, 0.601409912109375, 0.62200927734375, 0.642608642578125, 0.6632080078125, 0.683807373046875, 0.70440673828125, 0.725006103515625, 0.74560546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 4.0, 17.0, 9.0, 18.0, 24.0, 35.0, 33.0, 60.0, 67.0, 94.0, 127.0, 151.0, 216.0, 251.0, 290.0, 382.0, 382.0, 352.0, 341.0, 254.0, 213.0, 171.0, 127.0, 104.0, 71.0, 75.0, 47.0, 27.0, 27.0, 24.0, 22.0, 13.0, 9.0, 2.0, 5.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76171875, -0.7391738891601562, -0.7166290283203125, -0.6940841674804688, -0.671539306640625, -0.6489944458007812, -0.6264495849609375, -0.6039047241210938, -0.58135986328125, -0.5588150024414062, -0.5362701416015625, -0.5137252807617188, -0.491180419921875, -0.46863555908203125, -0.4460906982421875, -0.42354583740234375, -0.4010009765625, -0.37845611572265625, -0.3559112548828125, -0.33336639404296875, -0.310821533203125, -0.28827667236328125, -0.2657318115234375, -0.24318695068359375, -0.22064208984375, -0.19809722900390625, -0.1755523681640625, -0.15300750732421875, -0.130462646484375, -0.10791778564453125, -0.0853729248046875, -0.06282806396484375, -0.040283203125, -0.01773834228515625, 0.0048065185546875, 0.02735137939453125, 0.049896240234375, 0.07244110107421875, 0.0949859619140625, 0.11753082275390625, 0.14007568359375, 0.16262054443359375, 0.1851654052734375, 0.20771026611328125, 0.230255126953125, 0.25279998779296875, 0.2753448486328125, 0.29788970947265625, 0.3204345703125, 0.34297943115234375, 0.3655242919921875, 0.38806915283203125, 0.410614013671875, 0.43315887451171875, 0.4557037353515625, 0.47824859619140625, 0.50079345703125, 0.5233383178710938, 0.5458831787109375, 0.5684280395507812, 0.590972900390625, 0.6135177612304688, 0.6360626220703125, 0.6586074829101562, 0.68115234375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 5.0, 6.0, 3.0, 9.0, 25.0, 25.0, 34.0, 60.0, 75.0, 99.0, 112.0, 115.0, 106.0, 99.0, 75.0, 42.0, 27.0, 26.0, 23.0, 9.0, 8.0, 5.0, 7.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.27735710144043, -9.046242713928223, -8.815128326416016, -8.584013938903809, -8.352899551391602, -8.121786117553711, -7.890671253204346, -7.659556865692139, -7.42844295501709, -7.197328567504883, -6.966214179992676, -6.735099792480469, -6.50398588180542, -6.272871494293213, -6.041757106781006, -5.810642719268799, -5.579528331756592, -5.348413944244385, -5.117299556732178, -4.886185646057129, -4.655071258544922, -4.423956871032715, -4.192842483520508, -3.961728096008301, -3.730613946914673, -3.499499559402466, -3.268385410308838, -3.037271022796631, -2.806156635284424, -2.575042486190796, -2.343928098678589, -2.112813949584961, -1.881700038909912, -1.6505857706069946, -1.4194715023040771, -1.1883571147918701, -0.9572428464889526, -0.7261285781860352, -0.4950141906738281, -0.26389992237091064, -0.032785654067993164, 0.1983286440372467, 0.4294429421424866, 0.6605572700500488, 0.8916715383529663, 1.1227858066558838, 1.3539001941680908, 1.5850144624710083, 1.8161287307739258, 2.047243118286133, 2.2783572673797607, 2.5094716548919678, 2.7405858039855957, 2.9717001914978027, 3.2028145790100098, 3.433928966522217, 3.6650431156158447, 3.8961575031280518, 4.12727165222168, 4.358386039733887, 4.589500427246094, 4.820614814758301, 5.051729202270508, 5.282843112945557, 5.513957500457764]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 5.0, 9.0, 8.0, 14.0, 10.0, 25.0, 23.0, 37.0, 24.0, 38.0, 38.0, 39.0, 45.0, 42.0, 49.0, 52.0, 42.0, 43.0, 38.0, 36.0, 36.0, 42.0, 44.0, 42.0, 21.0, 31.0, 31.0, 21.0, 28.0, 14.0, 16.0, 9.0, 7.0, 8.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.5183959007263184, -3.4006423950195312, -3.282888889312744, -3.165135383605957, -3.04738187789917, -2.929628372192383, -2.8118748664855957, -2.6941213607788086, -2.5763678550720215, -2.4586143493652344, -2.3408608436584473, -2.22310733795166, -2.105353832244873, -1.987600326538086, -1.8698468208312988, -1.7520933151245117, -1.6343399286270142, -1.516586422920227, -1.39883291721344, -1.2810794115066528, -1.1633259057998657, -1.0455725193023682, -0.9278189539909363, -0.8100654482841492, -0.6923119425773621, -0.574558436870575, -0.45680493116378784, -0.3390514552593231, -0.221297949552536, -0.10354447364807129, 0.01420903205871582, 0.13196253776550293, 0.24971604347229004, 0.36746954917907715, 0.48522305488586426, 0.6029765605926514, 0.7207300662994385, 0.8384835124015808, 0.9562370181083679, 1.0739905834197998, 1.191744089126587, 1.309497594833374, 1.4272511005401611, 1.5450046062469482, 1.6627581119537354, 1.7805116176605225, 1.8982651233673096, 2.0160186290740967, 2.1337718963623047, 2.251525402069092, 2.369278907775879, 2.487032413482666, 2.604785919189453, 2.7225394248962402, 2.8402929306030273, 2.9580464363098145, 3.0757999420166016, 3.1935534477233887, 3.311306953430176, 3.429060459136963, 3.54681396484375, 3.664567470550537, 3.782320976257324, 3.9000744819641113, 4.017827987670898]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 5.0, 8.0, 8.0, 9.0, 14.0, 24.0, 31.0, 31.0, 56.0, 62.0, 104.0, 120.0, 170.0, 219.0, 341.0, 569.0, 1022.0, 2208.0, 6048.0, 22960.0, 150330.0, 691957.0, 139895.0, 21707.0, 5767.0, 2099.0, 1064.0, 552.0, 352.0, 213.0, 154.0, 125.0, 85.0, 59.0, 44.0, 31.0, 16.0, 24.0, 18.0, 7.0, 12.0, 12.0, 7.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9716796875, -0.9398040771484375, -0.907928466796875, -0.8760528564453125, -0.84417724609375, -0.8123016357421875, -0.780426025390625, -0.7485504150390625, -0.7166748046875, -0.6847991943359375, -0.652923583984375, -0.6210479736328125, -0.58917236328125, -0.5572967529296875, -0.525421142578125, -0.4935455322265625, -0.461669921875, -0.4297943115234375, -0.397918701171875, -0.3660430908203125, -0.33416748046875, -0.3022918701171875, -0.270416259765625, -0.2385406494140625, -0.2066650390625, -0.1747894287109375, -0.142913818359375, -0.1110382080078125, -0.07916259765625, -0.0472869873046875, -0.015411376953125, 0.0164642333984375, 0.04833984375, 0.0802154541015625, 0.112091064453125, 0.1439666748046875, 0.17584228515625, 0.2077178955078125, 0.239593505859375, 0.2714691162109375, 0.3033447265625, 0.3352203369140625, 0.367095947265625, 0.3989715576171875, 0.43084716796875, 0.4627227783203125, 0.494598388671875, 0.5264739990234375, 0.558349609375, 0.5902252197265625, 0.622100830078125, 0.6539764404296875, 0.68585205078125, 0.7177276611328125, 0.749603271484375, 0.7814788818359375, 0.8133544921875, 0.8452301025390625, 0.877105712890625, 0.9089813232421875, 0.94085693359375, 0.9727325439453125, 1.004608154296875, 1.0364837646484375, 1.068359375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 2.0, 6.0, 8.0, 9.0, 11.0, 18.0, 28.0, 24.0, 33.0, 22.0, 32.0, 41.0, 39.0, 25.0, 44.0, 45.0, 37.0, 55.0, 61.0, 40.0, 50.0, 46.0, 39.0, 34.0, 47.0, 33.0, 31.0, 22.0, 23.0, 26.0, 13.0, 8.0, 10.0, 2.0, 5.0, 6.0, 2.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.537109375, -0.5203094482421875, -0.503509521484375, -0.4867095947265625, -0.46990966796875, -0.4531097412109375, -0.436309814453125, -0.4195098876953125, -0.4027099609375, -0.3859100341796875, -0.369110107421875, -0.3523101806640625, -0.33551025390625, -0.3187103271484375, -0.301910400390625, -0.2851104736328125, -0.268310546875, -0.2515106201171875, -0.234710693359375, -0.2179107666015625, -0.20111083984375, -0.1843109130859375, -0.167510986328125, -0.1507110595703125, -0.1339111328125, -0.1171112060546875, -0.100311279296875, -0.0835113525390625, -0.06671142578125, -0.0499114990234375, -0.033111572265625, -0.0163116455078125, 0.00048828125, 0.0172882080078125, 0.034088134765625, 0.0508880615234375, 0.06768798828125, 0.0844879150390625, 0.101287841796875, 0.1180877685546875, 0.1348876953125, 0.1516876220703125, 0.168487548828125, 0.1852874755859375, 0.20208740234375, 0.2188873291015625, 0.235687255859375, 0.2524871826171875, 0.269287109375, 0.2860870361328125, 0.302886962890625, 0.3196868896484375, 0.33648681640625, 0.3532867431640625, 0.370086669921875, 0.3868865966796875, 0.4036865234375, 0.4204864501953125, 0.437286376953125, 0.4540863037109375, 0.47088623046875, 0.4876861572265625, 0.504486083984375, 0.5212860107421875, 0.5380859375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 10.0, 11.0, 16.0, 18.0, 22.0, 26.0, 28.0, 47.0, 60.0, 102.0, 151.0, 255.0, 686.0, 2586.0, 25736.0, 916503.0, 94923.0, 5346.0, 1107.0, 382.0, 186.0, 105.0, 75.0, 45.0, 29.0, 25.0, 22.0, 13.0, 10.0, 8.0, 3.0, 9.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.57421875, -1.5301055908203125, -1.485992431640625, -1.4418792724609375, -1.39776611328125, -1.3536529541015625, -1.309539794921875, -1.2654266357421875, -1.2213134765625, -1.1772003173828125, -1.133087158203125, -1.0889739990234375, -1.04486083984375, -1.0007476806640625, -0.956634521484375, -0.9125213623046875, -0.868408203125, -0.8242950439453125, -0.780181884765625, -0.7360687255859375, -0.69195556640625, -0.6478424072265625, -0.603729248046875, -0.5596160888671875, -0.5155029296875, -0.4713897705078125, -0.427276611328125, -0.3831634521484375, -0.33905029296875, -0.2949371337890625, -0.250823974609375, -0.2067108154296875, -0.16259765625, -0.1184844970703125, -0.074371337890625, -0.0302581787109375, 0.01385498046875, 0.0579681396484375, 0.102081298828125, 0.1461944580078125, 0.1903076171875, 0.2344207763671875, 0.278533935546875, 0.3226470947265625, 0.36676025390625, 0.4108734130859375, 0.454986572265625, 0.4990997314453125, 0.543212890625, 0.5873260498046875, 0.631439208984375, 0.6755523681640625, 0.71966552734375, 0.7637786865234375, 0.807891845703125, 0.8520050048828125, 0.8961181640625, 0.9402313232421875, 0.984344482421875, 1.0284576416015625, 1.07257080078125, 1.1166839599609375, 1.160797119140625, 1.2049102783203125, 1.2490234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 7.0, 5.0, 11.0, 13.0, 12.0, 8.0, 18.0, 19.0, 31.0, 30.0, 35.0, 34.0, 50.0, 54.0, 49.0, 67.0, 55.0, 60.0, 66.0, 59.0, 52.0, 38.0, 45.0, 26.0, 25.0, 23.0, 16.0, 16.0, 17.0, 14.0, 11.0, 9.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2705078125, -1.2351150512695312, -1.1997222900390625, -1.1643295288085938, -1.128936767578125, -1.0935440063476562, -1.0581512451171875, -1.0227584838867188, -0.98736572265625, -0.9519729614257812, -0.9165802001953125, -0.8811874389648438, -0.845794677734375, -0.8104019165039062, -0.7750091552734375, -0.7396163940429688, -0.7042236328125, -0.6688308715820312, -0.6334381103515625, -0.5980453491210938, -0.562652587890625, -0.5272598266601562, -0.4918670654296875, -0.45647430419921875, -0.42108154296875, -0.38568878173828125, -0.3502960205078125, -0.31490325927734375, -0.279510498046875, -0.24411773681640625, -0.2087249755859375, -0.17333221435546875, -0.137939453125, -0.10254669189453125, -0.0671539306640625, -0.03176116943359375, 0.003631591796875, 0.03902435302734375, 0.0744171142578125, 0.10980987548828125, 0.14520263671875, 0.18059539794921875, 0.2159881591796875, 0.25138092041015625, 0.286773681640625, 0.32216644287109375, 0.3575592041015625, 0.39295196533203125, 0.4283447265625, 0.46373748779296875, 0.4991302490234375, 0.5345230102539062, 0.569915771484375, 0.6053085327148438, 0.6407012939453125, 0.6760940551757812, 0.71148681640625, 0.7468795776367188, 0.7822723388671875, 0.8176651000976562, 0.853057861328125, 0.8884506225585938, 0.9238433837890625, 0.9592361450195312, 0.99462890625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 14.0, 14.0, 21.0, 30.0, 51.0, 120.0, 239.0, 543.0, 2264.0, 24105.0, 854039.0, 158885.0, 6473.0, 1040.0, 349.0, 174.0, 69.0, 47.0, 21.0, 21.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.317626953125, -0.30792999267578125, -0.2982330322265625, -0.28853607177734375, -0.278839111328125, -0.26914215087890625, -0.2594451904296875, -0.24974822998046875, -0.24005126953125, -0.23035430908203125, -0.2206573486328125, -0.21096038818359375, -0.201263427734375, -0.19156646728515625, -0.1818695068359375, -0.17217254638671875, -0.1624755859375, -0.15277862548828125, -0.1430816650390625, -0.13338470458984375, -0.123687744140625, -0.11399078369140625, -0.1042938232421875, -0.09459686279296875, -0.08489990234375, -0.07520294189453125, -0.0655059814453125, -0.05580902099609375, -0.046112060546875, -0.03641510009765625, -0.0267181396484375, -0.01702117919921875, -0.00732421875, 0.00237274169921875, 0.0120697021484375, 0.02176666259765625, 0.031463623046875, 0.04116058349609375, 0.0508575439453125, 0.06055450439453125, 0.07025146484375, 0.07994842529296875, 0.0896453857421875, 0.09934234619140625, 0.109039306640625, 0.11873626708984375, 0.1284332275390625, 0.13813018798828125, 0.1478271484375, 0.15752410888671875, 0.1672210693359375, 0.17691802978515625, 0.186614990234375, 0.19631195068359375, 0.2060089111328125, 0.21570587158203125, 0.22540283203125, 0.23509979248046875, 0.2447967529296875, 0.25449371337890625, 0.264190673828125, 0.27388763427734375, 0.2835845947265625, 0.29328155517578125, 0.302978515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 3.0, 9.0, 2.0, 10.0, 10.0, 12.0, 20.0, 22.0, 36.0, 38.0, 48.0, 63.0, 79.0, 88.0, 95.0, 74.0, 79.0, 79.0, 49.0, 41.0, 22.0, 19.0, 22.0, 17.0, 17.0, 7.0, 6.0, 3.0, 1.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.112720489501953e-05, -3.986712545156479e-05, -3.8607046008110046e-05, -3.7346966564655304e-05, -3.608688712120056e-05, -3.482680767774582e-05, -3.356672823429108e-05, -3.2306648790836334e-05, -3.104656934738159e-05, -2.978648990392685e-05, -2.8526410460472107e-05, -2.7266331017017365e-05, -2.6006251573562622e-05, -2.474617213010788e-05, -2.3486092686653137e-05, -2.2226013243198395e-05, -2.0965933799743652e-05, -1.970585435628891e-05, -1.8445774912834167e-05, -1.7185695469379425e-05, -1.5925616025924683e-05, -1.466553658246994e-05, -1.3405457139015198e-05, -1.2145377695560455e-05, -1.0885298252105713e-05, -9.62521880865097e-06, -8.365139365196228e-06, -7.105059921741486e-06, -5.844980478286743e-06, -4.584901034832001e-06, -3.3248215913772583e-06, -2.064742147922516e-06, -8.046627044677734e-07, 4.55416738986969e-07, 1.7154961824417114e-06, 2.975575625896454e-06, 4.235655069351196e-06, 5.495734512805939e-06, 6.755813956260681e-06, 8.015893399715424e-06, 9.275972843170166e-06, 1.0536052286624908e-05, 1.1796131730079651e-05, 1.3056211173534393e-05, 1.4316290616989136e-05, 1.5576370060443878e-05, 1.683644950389862e-05, 1.8096528947353363e-05, 1.9356608390808105e-05, 2.0616687834262848e-05, 2.187676727771759e-05, 2.3136846721172333e-05, 2.4396926164627075e-05, 2.5657005608081818e-05, 2.691708505153656e-05, 2.8177164494991302e-05, 2.9437243938446045e-05, 3.069732338190079e-05, 3.195740282535553e-05, 3.321748226881027e-05, 3.4477561712265015e-05, 3.573764115571976e-05, 3.69977205991745e-05, 3.825780004262924e-05, 3.9517879486083984e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 5.0, 11.0, 9.0, 24.0, 35.0, 74.0, 121.0, 247.0, 953.0, 5586.0, 112460.0, 890548.0, 34751.0, 2718.0, 602.0, 206.0, 89.0, 49.0, 23.0, 14.0, 6.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.42529296875, -0.4150047302246094, -0.40471649169921875, -0.3944282531738281, -0.3841400146484375, -0.3738517761230469, -0.36356353759765625, -0.3532752990722656, -0.342987060546875, -0.3326988220214844, -0.32241058349609375, -0.3121223449707031, -0.3018341064453125, -0.2915458679199219, -0.28125762939453125, -0.2709693908691406, -0.26068115234375, -0.2503929138183594, -0.24010467529296875, -0.22981643676757812, -0.2195281982421875, -0.20923995971679688, -0.19895172119140625, -0.18866348266601562, -0.178375244140625, -0.16808700561523438, -0.15779876708984375, -0.14751052856445312, -0.1372222900390625, -0.12693405151367188, -0.11664581298828125, -0.10635757446289062, -0.0960693359375, -0.08578109741210938, -0.07549285888671875, -0.06520462036132812, -0.0549163818359375, -0.044628143310546875, -0.03433990478515625, -0.024051666259765625, -0.013763427734375, -0.003475189208984375, 0.00681304931640625, 0.017101287841796875, 0.0273895263671875, 0.037677764892578125, 0.04796600341796875, 0.058254241943359375, 0.06854248046875, 0.07883071899414062, 0.08911895751953125, 0.09940719604492188, 0.1096954345703125, 0.11998367309570312, 0.13027191162109375, 0.14056015014648438, 0.150848388671875, 0.16113662719726562, 0.17142486572265625, 0.18171310424804688, 0.1920013427734375, 0.20228958129882812, 0.21257781982421875, 0.22286605834960938, 0.233154296875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 7.0, 15.0, 24.0, 33.0, 43.0, 69.0, 101.0, 131.0, 136.0, 120.0, 101.0, 70.0, 53.0, 28.0, 23.0, 18.0, 16.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.210693359375, -0.20403099060058594, -0.19736862182617188, -0.1907062530517578, -0.18404388427734375, -0.1773815155029297, -0.17071914672851562, -0.16405677795410156, -0.1573944091796875, -0.15073204040527344, -0.14406967163085938, -0.1374073028564453, -0.13074493408203125, -0.12408256530761719, -0.11742019653320312, -0.11075782775878906, -0.104095458984375, -0.09743309020996094, -0.09077072143554688, -0.08410835266113281, -0.07744598388671875, -0.07078361511230469, -0.06412124633789062, -0.05745887756347656, -0.0507965087890625, -0.04413414001464844, -0.037471771240234375, -0.030809402465820312, -0.02414703369140625, -0.017484664916992188, -0.010822296142578125, -0.0041599273681640625, 0.00250244140625, 0.009164810180664062, 0.015827178955078125, 0.022489547729492188, 0.02915191650390625, 0.03581428527832031, 0.042476654052734375, 0.04913902282714844, 0.0558013916015625, 0.06246376037597656, 0.06912612915039062, 0.07578849792480469, 0.08245086669921875, 0.08911323547363281, 0.09577560424804688, 0.10243797302246094, 0.109100341796875, 0.11576271057128906, 0.12242507934570312, 0.1290874481201172, 0.13574981689453125, 0.1424121856689453, 0.14907455444335938, 0.15573692321777344, 0.1623992919921875, 0.16906166076660156, 0.17572402954101562, 0.1823863983154297, 0.18904876708984375, 0.1957111358642578, 0.20237350463867188, 0.20903587341308594, 0.2156982421875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 4.0, 9.0, 7.0, 15.0, 40.0, 87.0, 181.0, 301.0, 194.0, 71.0, 36.0, 25.0, 17.0, 7.0, 3.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.102482795715332, -3.9190473556518555, -3.735611915588379, -3.5521767139434814, -3.368741273880005, -3.1853058338165283, -3.001870632171631, -2.8184351921081543, -2.6349997520446777, -2.451564311981201, -2.2681288719177246, -2.084693670272827, -1.9012582302093506, -1.717822790145874, -1.534387469291687, -1.3509521484375, -1.1675167083740234, -0.9840813279151917, -0.8006459474563599, -0.6172105669975281, -0.4337751865386963, -0.2503398060798645, -0.06690442562103271, 0.1165308952331543, 0.29996633529663086, 0.48340171575546265, 0.6668370962142944, 0.8502724766731262, 1.033707857131958, 1.2171432971954346, 1.4005786180496216, 1.5840139389038086, 1.767448902130127, 1.9508843421936035, 2.13431978225708, 2.3177549839019775, 2.501190423965454, 2.6846258640289307, 2.868061065673828, 3.0514965057373047, 3.2349319458007812, 3.418367385864258, 3.6018028259277344, 3.785238027572632, 3.9686734676361084, 4.152108669281006, 4.335544109344482, 4.518979549407959, 4.7024149894714355, 4.885850429534912, 5.069285869598389, 5.252721309661865, 5.436156272888184, 5.61959171295166, 5.803027153015137, 5.986462593078613, 6.16989803314209, 6.353333473205566, 6.536768913269043, 6.7202043533325195, 6.903639793395996, 7.0870747566223145, 7.270510196685791, 7.453945636749268, 7.637381076812744]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 4.0, 1.0, 6.0, 6.0, 6.0, 7.0, 12.0, 14.0, 20.0, 26.0, 27.0, 33.0, 34.0, 38.0, 44.0, 41.0, 59.0, 68.0, 77.0, 70.0, 65.0, 63.0, 39.0, 42.0, 35.0, 28.0, 18.0, 18.0, 22.0, 14.0, 9.0, 8.0, 11.0, 8.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.240878105163574, -2.1651220321655273, -2.0893659591674805, -2.0136098861694336, -1.9378538131713867, -1.8620977401733398, -1.786341667175293, -1.710585594177246, -1.6348295211791992, -1.5590734481811523, -1.4833173751831055, -1.4075613021850586, -1.3318052291870117, -1.2560491561889648, -1.180293083190918, -1.104537010192871, -1.0287809371948242, -0.9530248641967773, -0.8772687911987305, -0.8015127182006836, -0.7257566452026367, -0.6500005722045898, -0.574244499206543, -0.4984884262084961, -0.4227323532104492, -0.34697628021240234, -0.27122020721435547, -0.1954641342163086, -0.11970806121826172, -0.043951988220214844, 0.03180408477783203, 0.1075601577758789, 0.18331646919250488, 0.25907254219055176, 0.33482861518859863, 0.4105846881866455, 0.4863407611846924, 0.5620968341827393, 0.6378529071807861, 0.713608980178833, 0.7893650531768799, 0.8651211261749268, 0.9408771991729736, 1.0166332721710205, 1.0923893451690674, 1.1681454181671143, 1.2439014911651611, 1.319657564163208, 1.3954136371612549, 1.4711697101593018, 1.5469257831573486, 1.6226818561553955, 1.6984379291534424, 1.7741940021514893, 1.8499500751495361, 1.925706148147583, 2.00146222114563, 2.0772182941436768, 2.1529743671417236, 2.2287304401397705, 2.3044865131378174, 2.3802425861358643, 2.455998659133911, 2.531754732131958, 2.607510805130005]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 1.0, 6.0, 4.0, 4.0, 3.0, 10.0, 7.0, 10.0, 14.0, 19.0, 17.0, 26.0, 26.0, 26.0, 29.0, 42.0, 89.0, 218.0, 151.0, 70.0, 35.0, 24.0, 28.0, 19.0, 19.0, 21.0, 18.0, 11.0, 11.0, 7.0, 4.0, 6.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.70263671875, -0.6840324401855469, -0.6654281616210938, -0.6468238830566406, -0.6282196044921875, -0.6096153259277344, -0.5910110473632812, -0.5724067687988281, -0.553802490234375, -0.5351982116699219, -0.5165939331054688, -0.4979896545410156, -0.4793853759765625, -0.4607810974121094, -0.44217681884765625, -0.4235725402832031, -0.40496826171875, -0.3863639831542969, -0.36775970458984375, -0.3491554260253906, -0.3305511474609375, -0.3119468688964844, -0.29334259033203125, -0.2747383117675781, -0.256134033203125, -0.23752975463867188, -0.21892547607421875, -0.20032119750976562, -0.1817169189453125, -0.16311264038085938, -0.14450836181640625, -0.12590408325195312, -0.1072998046875, -0.08869552612304688, -0.07009124755859375, -0.051486968994140625, -0.0328826904296875, -0.014278411865234375, 0.00432586669921875, 0.022930145263671875, 0.041534423828125, 0.060138702392578125, 0.07874298095703125, 0.09734725952148438, 0.1159515380859375, 0.13455581665039062, 0.15316009521484375, 0.17176437377929688, 0.19036865234375, 0.20897293090820312, 0.22757720947265625, 0.24618148803710938, 0.2647857666015625, 0.2833900451660156, 0.30199432373046875, 0.3205986022949219, 0.339202880859375, 0.3578071594238281, 0.37641143798828125, 0.3950157165527344, 0.4136199951171875, 0.4322242736816406, 0.45082855224609375, 0.4694328308105469, 0.488037109375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 6.0, 13.0, 12.0, 10.0, 26.0, 32.0, 41.0, 48.0, 92.0, 135.0, 217.0, 313.0, 601.0, 1150.0, 2595.0, 7333.0, 35555.0, 8294095.0, 34219.0, 7244.0, 2453.0, 1026.0, 521.0, 300.0, 180.0, 114.0, 67.0, 54.0, 43.0, 20.0, 25.0, 12.0, 5.0, 4.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3404881954193115, -1.2950398921966553, -1.249591588973999, -1.2041432857513428, -1.158695101737976, -1.1132467985153198, -1.0677984952926636, -1.0223501920700073, -0.9769019484519958, -0.9314536452293396, -0.8860054016113281, -0.8405570983886719, -0.7951087951660156, -0.7496605515480042, -0.7042122483253479, -0.6587640047073364, -0.6133157014846802, -0.5678673982620239, -0.5224191546440125, -0.4769708514213562, -0.43152257800102234, -0.3860743045806885, -0.3406260013580322, -0.29517772793769836, -0.2497294545173645, -0.20428118109703064, -0.15883289277553558, -0.11338460445404053, -0.06793633103370667, -0.022488057613372803, 0.022960245609283447, 0.06840851902961731, 0.11385667324066162, 0.15930494666099548, 0.20475323498249054, 0.2502015233039856, 0.29564979672431946, 0.3410980701446533, 0.38654637336730957, 0.43199464678764343, 0.4774429202079773, 0.5228912234306335, 0.568339467048645, 0.6137877702713013, 0.6592360734939575, 0.704684317111969, 0.7501326203346252, 0.7955808639526367, 0.841029167175293, 0.8864774703979492, 0.9319257140159607, 0.9773740172386169, 1.0228222608566284, 1.0682705640792847, 1.113718867301941, 1.1591671705245972, 1.2046153545379639, 1.2500636577606201, 1.2955119609832764, 1.3409602642059326, 1.3864084482192993, 1.4318567514419556, 1.4773050546646118, 1.522753357887268, 1.5682016611099243]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 30.0, 14.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6868336796760559, -0.6426858305931091, -0.5985379815101624, -0.5543901324272156, -0.5102422833442688, -0.466094434261322, -0.42194658517837524, -0.37779873609542847, -0.3336508870124817, -0.2895030379295349, -0.24535518884658813, -0.20120733976364136, -0.15705949068069458, -0.1129116415977478, -0.06876379251480103, -0.024615943431854248, 0.01953190565109253, 0.0636797547340393, 0.10782760381698608, 0.15197545289993286, 0.19612330198287964, 0.24027115106582642, 0.2844190001487732, 0.32856684923171997, 0.37271469831466675, 0.4168625473976135, 0.4610103964805603, 0.5051582455635071, 0.5493060946464539, 0.5934539437294006, 0.6376017928123474, 0.6817496418952942, 0.7258975505828857, 0.7700453996658325, 0.8141932487487793, 0.8583410978317261, 0.9024889469146729, 0.9466367959976196, 0.9907846450805664, 1.0349324941635132, 1.07908034324646, 1.1232281923294067, 1.1673760414123535, 1.2115238904953003, 1.255671739578247, 1.2998195886611938, 1.3439674377441406, 1.3881152868270874, 1.4322631359100342, 1.476410984992981, 1.5205588340759277, 1.5647066831588745, 1.6088545322418213, 1.653002381324768, 1.6971502304077148, 1.7412980794906616, 1.7854459285736084, 1.8295937776565552, 1.873741626739502, 1.9178894758224487, 1.9620373249053955, 2.0061850547790527, 2.050333023071289, 2.0944809913635254, 2.1386287212371826]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 5.0, 7.0, 8.0, 12.0, 16.0, 12.0, 13.0, 19.0, 20.0, 29.0, 32.0, 36.0, 42.0, 39.0, 30.0, 53.0, 57.0, 50.0, 52.0, 44.0, 49.0, 47.0, 41.0, 34.0, 54.0, 23.0, 21.0, 31.0, 22.0, 15.0, 16.0, 10.0, 16.0, 10.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.338623046875, -0.326690673828125, -0.31475830078125, -0.302825927734375, -0.2908935546875, -0.278961181640625, -0.26702880859375, -0.255096435546875, -0.2431640625, -0.231231689453125, -0.21929931640625, -0.207366943359375, -0.1954345703125, -0.183502197265625, -0.17156982421875, -0.159637451171875, -0.147705078125, -0.135772705078125, -0.12384033203125, -0.111907958984375, -0.0999755859375, -0.088043212890625, -0.07611083984375, -0.064178466796875, -0.05224609375, -0.040313720703125, -0.02838134765625, -0.016448974609375, -0.0045166015625, 0.007415771484375, 0.01934814453125, 0.031280517578125, 0.043212890625, 0.055145263671875, 0.06707763671875, 0.079010009765625, 0.0909423828125, 0.102874755859375, 0.11480712890625, 0.126739501953125, 0.138671875, 0.150604248046875, 0.16253662109375, 0.174468994140625, 0.1864013671875, 0.198333740234375, 0.21026611328125, 0.222198486328125, 0.234130859375, 0.246063232421875, 0.25799560546875, 0.269927978515625, 0.2818603515625, 0.293792724609375, 0.30572509765625, 0.317657470703125, 0.32958984375, 0.341522216796875, 0.35345458984375, 0.365386962890625, 0.3773193359375, 0.389251708984375, 0.40118408203125, 0.413116455078125, 0.425048828125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 7.0, 14.0, 24.0, 27.0, 46.0, 43.0, 106.0, 97.0, 162.0, 268.0, 430.0, 719.0, 1432.0, 3120.0, 7424.0, 20017.0, 74718.0, 287652.0, 89929.0, 22713.0, 8081.0, 3355.0, 1614.0, 859.0, 465.0, 292.0, 204.0, 127.0, 66.0, 55.0, 65.0, 29.0, 17.0, 20.0, 14.0, 13.0, 5.0, 9.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.73046875, -5.52978515625, -5.3291015625, -5.12841796875, -4.927734375, -4.72705078125, -4.5263671875, -4.32568359375, -4.125, -3.92431640625, -3.7236328125, -3.52294921875, -3.322265625, -3.12158203125, -2.9208984375, -2.72021484375, -2.51953125, -2.31884765625, -2.1181640625, -1.91748046875, -1.716796875, -1.51611328125, -1.3154296875, -1.11474609375, -0.9140625, -0.71337890625, -0.5126953125, -0.31201171875, -0.111328125, 0.08935546875, 0.2900390625, 0.49072265625, 0.69140625, 0.89208984375, 1.0927734375, 1.29345703125, 1.494140625, 1.69482421875, 1.8955078125, 2.09619140625, 2.296875, 2.49755859375, 2.6982421875, 2.89892578125, 3.099609375, 3.30029296875, 3.5009765625, 3.70166015625, 3.90234375, 4.10302734375, 4.3037109375, 4.50439453125, 4.705078125, 4.90576171875, 5.1064453125, 5.30712890625, 5.5078125, 5.70849609375, 5.9091796875, 6.10986328125, 6.310546875, 6.51123046875, 6.7119140625, 6.91259765625, 7.11328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 9.0, 9.0, 14.0, 6.0, 20.0, 18.0, 30.0, 23.0, 34.0, 51.0, 63.0, 68.0, 80.0, 61.0, 90.0, 75.0, 57.0, 53.0, 52.0, 39.0, 39.0, 30.0, 23.0, 13.0, 14.0, 8.0, 9.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72509765625, -0.7053680419921875, -0.685638427734375, -0.6659088134765625, -0.64617919921875, -0.6264495849609375, -0.606719970703125, -0.5869903564453125, -0.5672607421875, -0.5475311279296875, -0.527801513671875, -0.5080718994140625, -0.48834228515625, -0.4686126708984375, -0.448883056640625, -0.4291534423828125, -0.409423828125, -0.3896942138671875, -0.369964599609375, -0.3502349853515625, -0.33050537109375, -0.3107757568359375, -0.291046142578125, -0.2713165283203125, -0.2515869140625, -0.2318572998046875, -0.212127685546875, -0.1923980712890625, -0.17266845703125, -0.1529388427734375, -0.133209228515625, -0.1134796142578125, -0.09375, -0.0740203857421875, -0.054290771484375, -0.0345611572265625, -0.01483154296875, 0.0048980712890625, 0.024627685546875, 0.0443572998046875, 0.0640869140625, 0.0838165283203125, 0.103546142578125, 0.1232757568359375, 0.14300537109375, 0.1627349853515625, 0.182464599609375, 0.2021942138671875, 0.221923828125, 0.2416534423828125, 0.261383056640625, 0.2811126708984375, 0.30084228515625, 0.3205718994140625, 0.340301513671875, 0.3600311279296875, 0.3797607421875, 0.3994903564453125, 0.419219970703125, 0.4389495849609375, 0.45867919921875, 0.4784088134765625, 0.498138427734375, 0.5178680419921875, 0.53759765625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 2.0, 3.0, 9.0, 5.0, 10.0, 12.0, 12.0, 17.0, 20.0, 45.0, 83.0, 86.0, 61.0, 35.0, 31.0, 11.0, 11.0, 9.0, 5.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9835522174835205, -1.9297783374786377, -1.8760045766830444, -1.8222306966781616, -1.7684569358825684, -1.7146830558776855, -1.6609091758728027, -1.60713529586792, -1.5533615350723267, -1.4995876550674438, -1.4458138942718506, -1.3920400142669678, -1.338266134262085, -1.2844923734664917, -1.2307184934616089, -1.1769447326660156, -1.1231708526611328, -1.06939697265625, -1.0156232118606567, -0.9618493318557739, -0.9080755114555359, -0.8543016910552979, -0.800527811050415, -0.746753990650177, -0.692980170249939, -0.6392063498497009, -0.5854325294494629, -0.5316586494445801, -0.47788482904434204, -0.424111008644104, -0.3703371584415436, -0.31656330823898315, -0.26278936862945557, -0.20901553332805634, -0.1552416980266571, -0.10146786272525787, -0.04769402742385864, 0.0060797929763793945, 0.05985364317893982, 0.11362749338150024, 0.16740131378173828, 0.2211751490831375, 0.27494898438453674, 0.32872283458709717, 0.3824966549873352, 0.43627047538757324, 0.49004432559013367, 0.5438181757926941, 0.5975919961929321, 0.6513658165931702, 0.7051396369934082, 0.758913516998291, 0.812687337398529, 0.8664611577987671, 0.9202350378036499, 0.9740088582038879, 1.027782678604126, 1.0815565586090088, 1.135330319404602, 1.1891041994094849, 1.2428779602050781, 1.296651840209961, 1.3504257202148438, 1.4041996002197266, 1.4579733610153198]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 1.0, 5.0, 6.0, 2.0, 7.0, 7.0, 6.0, 11.0, 12.0, 10.0, 11.0, 27.0, 49.0, 116.0, 85.0, 27.0, 16.0, 9.0, 6.0, 11.0, 10.0, 9.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.2394521236419678, -2.1765334606170654, -2.113614559173584, -2.0506958961486816, -1.9877771139144897, -1.9248583316802979, -1.861939549446106, -1.799020767211914, -1.7361021041870117, -1.6731833219528198, -1.610264539718628, -1.5473458766937256, -1.4844270944595337, -1.4215083122253418, -1.35858952999115, -1.295670747756958, -1.2327519655227661, -1.1698331832885742, -1.1069144010543823, -1.0439956188201904, -0.9810769557952881, -0.9181581735610962, -0.8552393913269043, -0.7923206090927124, -0.7294018864631653, -0.6664831042289734, -0.6035643815994263, -0.5406455993652344, -0.47772684693336487, -0.41480809450149536, -0.35188931226730347, -0.28897055983543396, -0.2260516881942749, -0.1631329357624054, -0.1002141684293747, -0.037295401096343994, 0.025623351335525513, 0.08854210376739502, 0.15146088600158691, 0.21437963843345642, 0.2772983908653259, 0.34021714329719543, 0.40313589572906494, 0.46605467796325684, 0.5289734601974487, 0.5918921828269958, 0.6548109650611877, 0.7177296876907349, 0.7806484699249268, 0.8435672521591187, 0.9064859747886658, 0.9694047570228577, 1.0323234796524048, 1.0952422618865967, 1.1581610441207886, 1.2210798263549805, 1.2839984893798828, 1.3469172716140747, 1.4098360538482666, 1.472754716873169, 1.5356734991073608, 1.5985922813415527, 1.6615110635757446, 1.7244298458099365, 1.7873486280441284]}, "eval/loss": 5.10392951965332, "eval/bleu": 0.0, "eval/runtime": 2560.6032, "eval/samples_per_second": 5.764, "eval/steps_per_second": 0.721} \ No newline at end of file