diff --git "a/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" --- "a/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" +++ "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 1.5259, "train/learning_rate": 2.2961971830985914e-05, "train/epoch": 6.73, "train/global_step": 6000, "_runtime": 35889, "_timestamp": 1648177233, "_step": 6003, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 6.0, 1.0, 1.0, 3.0, 5.0, 5.0, 12.0, 10.0, 24.0, 21.0, 26.0, 34.0, 36.0, 31.0, 33.0, 36.0, 44.0, 44.0, 43.0, 57.0, 59.0, 71.0, 49.0, 54.0, 48.0, 52.0, 43.0, 36.0, 27.0, 27.0, 17.0, 11.0, 11.0, 13.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.5392951965332, -45.22349548339844, -43.90769958496094, -42.59189987182617, -41.276100158691406, -39.96030044555664, -38.644500732421875, -37.328704833984375, -36.01290512084961, -34.697105407714844, -33.381309509277344, -32.06550979614258, -30.749710083007812, -29.433910369873047, -28.118112564086914, -26.80231475830078, -25.486515045166016, -24.17071533203125, -22.854917526245117, -21.539119720458984, -20.22332000732422, -18.907520294189453, -17.59172248840332, -16.275924682617188, -14.960124969482422, -13.644326210021973, -12.328527450561523, -11.012728691101074, -9.696929931640625, -8.381131172180176, -7.065332412719727, -5.749533653259277, -4.4337310791015625, -3.1179323196411133, -1.802133560180664, -0.48633480072021484, 0.8294639587402344, 2.1452627182006836, 3.461061477661133, 4.776860237121582, 6.092658996582031, 7.4084577560424805, 8.72425651550293, 10.040055274963379, 11.355854034423828, 12.671652793884277, 13.987451553344727, 15.303250312805176, 16.619049072265625, 17.93484878540039, 19.250646591186523, 20.566444396972656, 21.882244110107422, 23.198043823242188, 24.51384162902832, 25.829639434814453, 27.14543914794922, 28.461238861083984, 29.777036666870117, 31.09283447265625, 32.408634185791016, 33.72443389892578, 35.04022979736328, 36.35602951049805, 37.67182922363281]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 10.0, 8.0, 9.0, 13.0, 11.0, 13.0, 24.0, 18.0, 18.0, 28.0, 32.0, 24.0, 27.0, 34.0, 29.0, 37.0, 32.0, 31.0, 41.0, 36.0, 35.0, 37.0, 44.0, 35.0, 36.0, 30.0, 24.0, 32.0, 38.0, 27.0, 17.0, 21.0, 15.0, 19.0, 21.0, 17.0, 16.0, 8.0, 14.0, 7.0, 8.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-35.92849349975586, -34.91211700439453, -33.89574432373047, -32.87936782836914, -31.862993240356445, -30.84661865234375, -29.830244064331055, -28.81386947631836, -27.79749298095703, -26.781118392944336, -25.76474380493164, -24.748367309570312, -23.731992721557617, -22.715618133544922, -21.699243545532227, -20.68286895751953, -19.666494369506836, -18.65011978149414, -17.633745193481445, -16.61737060546875, -15.600994110107422, -14.584619522094727, -13.568244934082031, -12.551870346069336, -11.535494804382324, -10.519120216369629, -9.502744674682617, -8.486370086669922, -7.469995021820068, -6.453619956970215, -5.4372453689575195, -4.420870304107666, -3.4044952392578125, -2.388120174407959, -1.3717453479766846, -0.35537052154541016, 0.6610045433044434, 1.6773796081542969, 2.693754196166992, 3.7101292610168457, 4.726504325866699, 5.742879390716553, 6.759254455566406, 7.775629043579102, 8.792003631591797, 9.808379173278809, 10.824753761291504, 11.841129302978516, 12.857503890991211, 13.873878479003906, 14.890254020690918, 15.906628608703613, 16.923004150390625, 17.93937873840332, 18.955753326416016, 19.97212791442871, 20.988502502441406, 22.0048770904541, 23.021251678466797, 24.037628173828125, 25.05400276184082, 26.070377349853516, 27.08675193786621, 28.103126525878906, 29.119503021240234]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 4.0, 13.0, 23.0, 28.0, 39.0, 68.0, 87.0, 151.0, 199.0, 392.0, 600.0, 971.0, 1564.0, 2549.0, 4282.0, 7320.0, 12767.0, 21970.0, 38543.0, 67608.0, 118559.0, 210006.0, 359328.0, 564308.0, 735761.0, 717348.0, 535014.0, 337380.0, 197141.0, 111849.0, 63421.0, 35742.0, 20374.0, 11778.0, 6864.0, 3986.0, 2525.0, 1416.0, 814.0, 528.0, 347.0, 214.0, 123.0, 101.0, 55.0, 36.0, 29.0, 17.0, 10.0, 13.0, 5.0, 8.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-37.28125, -36.076171875, -34.87109375, -33.666015625, -32.4609375, -31.255859375, -30.05078125, -28.845703125, -27.640625, -26.435546875, -25.23046875, -24.025390625, -22.8203125, -21.615234375, -20.41015625, -19.205078125, -18.0, -16.794921875, -15.58984375, -14.384765625, -13.1796875, -11.974609375, -10.76953125, -9.564453125, -8.359375, -7.154296875, -5.94921875, -4.744140625, -3.5390625, -2.333984375, -1.12890625, 0.076171875, 1.28125, 2.486328125, 3.69140625, 4.896484375, 6.1015625, 7.306640625, 8.51171875, 9.716796875, 10.921875, 12.126953125, 13.33203125, 14.537109375, 15.7421875, 16.947265625, 18.15234375, 19.357421875, 20.5625, 21.767578125, 22.97265625, 24.177734375, 25.3828125, 26.587890625, 27.79296875, 28.998046875, 30.203125, 31.408203125, 32.61328125, 33.818359375, 35.0234375, 36.228515625, 37.43359375, 38.638671875, 39.84375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 3.0, 11.0, 8.0, 8.0, 17.0, 15.0, 14.0, 27.0, 33.0, 23.0, 31.0, 29.0, 40.0, 38.0, 31.0, 30.0, 49.0, 48.0, 42.0, 48.0, 42.0, 42.0, 46.0, 38.0, 34.0, 38.0, 31.0, 28.0, 38.0, 24.0, 11.0, 15.0, 13.0, 18.0, 9.0, 6.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.578125, -28.610107421875, -27.64208984375, -26.674072265625, -25.7060546875, -24.738037109375, -23.77001953125, -22.802001953125, -21.833984375, -20.865966796875, -19.89794921875, -18.929931640625, -17.9619140625, -16.993896484375, -16.02587890625, -15.057861328125, -14.08984375, -13.121826171875, -12.15380859375, -11.185791015625, -10.2177734375, -9.249755859375, -8.28173828125, -7.313720703125, -6.345703125, -5.377685546875, -4.40966796875, -3.441650390625, -2.4736328125, -1.505615234375, -0.53759765625, 0.430419921875, 1.3984375, 2.366455078125, 3.33447265625, 4.302490234375, 5.2705078125, 6.238525390625, 7.20654296875, 8.174560546875, 9.142578125, 10.110595703125, 11.07861328125, 12.046630859375, 13.0146484375, 13.982666015625, 14.95068359375, 15.918701171875, 16.88671875, 17.854736328125, 18.82275390625, 19.790771484375, 20.7587890625, 21.726806640625, 22.69482421875, 23.662841796875, 24.630859375, 25.598876953125, 26.56689453125, 27.534912109375, 28.5029296875, 29.470947265625, 30.43896484375, 31.406982421875, 32.375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 16.0, 25.0, 38.0, 54.0, 88.0, 147.0, 237.0, 375.0, 583.0, 858.0, 1350.0, 2068.0, 3396.0, 5438.0, 8509.0, 14069.0, 22561.0, 35748.0, 57695.0, 90357.0, 139314.0, 208792.0, 301956.0, 410187.0, 508323.0, 549811.0, 510077.0, 412971.0, 306665.0, 212500.0, 141608.0, 91777.0, 58671.0, 36714.0, 22986.0, 14406.0, 8989.0, 5503.0, 3438.0, 2149.0, 1416.0, 847.0, 588.0, 345.0, 242.0, 137.0, 108.0, 49.0, 31.0, 16.0, 18.0, 13.0, 9.0, 2.0, 2.0, 6.0], "bins": [-28.59375, -27.74072265625, -26.8876953125, -26.03466796875, -25.181640625, -24.32861328125, -23.4755859375, -22.62255859375, -21.76953125, -20.91650390625, -20.0634765625, -19.21044921875, -18.357421875, -17.50439453125, -16.6513671875, -15.79833984375, -14.9453125, -14.09228515625, -13.2392578125, -12.38623046875, -11.533203125, -10.68017578125, -9.8271484375, -8.97412109375, -8.12109375, -7.26806640625, -6.4150390625, -5.56201171875, -4.708984375, -3.85595703125, -3.0029296875, -2.14990234375, -1.296875, -0.44384765625, 0.4091796875, 1.26220703125, 2.115234375, 2.96826171875, 3.8212890625, 4.67431640625, 5.52734375, 6.38037109375, 7.2333984375, 8.08642578125, 8.939453125, 9.79248046875, 10.6455078125, 11.49853515625, 12.3515625, 13.20458984375, 14.0576171875, 14.91064453125, 15.763671875, 16.61669921875, 17.4697265625, 18.32275390625, 19.17578125, 20.02880859375, 20.8818359375, 21.73486328125, 22.587890625, 23.44091796875, 24.2939453125, 25.14697265625, 26.0]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 5.0, 5.0, 9.0, 17.0, 23.0, 27.0, 22.0, 31.0, 38.0, 68.0, 75.0, 75.0, 89.0, 105.0, 133.0, 168.0, 166.0, 183.0, 215.0, 194.0, 205.0, 232.0, 235.0, 205.0, 182.0, 231.0, 186.0, 146.0, 140.0, 99.0, 93.0, 96.0, 71.0, 38.0, 53.0, 40.0, 37.0, 30.0, 19.0, 18.0, 20.0, 15.0, 10.0, 7.0, 2.0, 7.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.609375, -12.203857421875, -11.79833984375, -11.392822265625, -10.9873046875, -10.581787109375, -10.17626953125, -9.770751953125, -9.365234375, -8.959716796875, -8.55419921875, -8.148681640625, -7.7431640625, -7.337646484375, -6.93212890625, -6.526611328125, -6.12109375, -5.715576171875, -5.31005859375, -4.904541015625, -4.4990234375, -4.093505859375, -3.68798828125, -3.282470703125, -2.876953125, -2.471435546875, -2.06591796875, -1.660400390625, -1.2548828125, -0.849365234375, -0.44384765625, -0.038330078125, 0.3671875, 0.772705078125, 1.17822265625, 1.583740234375, 1.9892578125, 2.394775390625, 2.80029296875, 3.205810546875, 3.611328125, 4.016845703125, 4.42236328125, 4.827880859375, 5.2333984375, 5.638916015625, 6.04443359375, 6.449951171875, 6.85546875, 7.260986328125, 7.66650390625, 8.072021484375, 8.4775390625, 8.883056640625, 9.28857421875, 9.694091796875, 10.099609375, 10.505126953125, 10.91064453125, 11.316162109375, 11.7216796875, 12.127197265625, 12.53271484375, 12.938232421875, 13.34375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 17.0, 5.0, 16.0, 21.0, 10.0, 31.0, 21.0, 28.0, 34.0, 32.0, 52.0, 46.0, 51.0, 55.0, 57.0, 55.0, 46.0, 56.0, 49.0, 46.0, 30.0, 29.0, 47.0, 26.0, 26.0, 21.0, 20.0, 11.0, 8.0, 8.0, 11.0, 4.0, 8.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.374835968017578, -28.21469497680664, -27.054553985595703, -25.894411087036133, -24.734270095825195, -23.574129104614258, -22.413986206054688, -21.25384521484375, -20.093704223632812, -18.933563232421875, -17.773422241210938, -16.613279342651367, -15.45313835144043, -14.292997360229492, -13.132855415344238, -11.972713470458984, -10.812572479248047, -9.65243148803711, -8.492289543151855, -7.33214807510376, -6.172006607055664, -5.011865139007568, -3.8517236709594727, -2.6915817260742188, -1.5314407348632812, -0.37129926681518555, 0.7888422012329102, 1.9489836692810059, 3.1091251373291016, 4.269266605377197, 5.429408073425293, 6.589550018310547, 7.749687194824219, 8.909828186035156, 10.06997013092041, 11.230112075805664, 12.390253067016602, 13.550394058227539, 14.710536003112793, 15.870677947998047, 17.030818939208984, 18.190959930419922, 19.35110092163086, 20.51124382019043, 21.671384811401367, 22.831525802612305, 23.991668701171875, 25.151809692382812, 26.31195068359375, 27.472091674804688, 28.632232666015625, 29.792375564575195, 30.952516555786133, 32.1126594543457, 33.27280044555664, 34.43294143676758, 35.593082427978516, 36.75322341918945, 37.91336441040039, 39.07350540161133, 40.23365020751953, 41.39379119873047, 42.553932189941406, 43.714073181152344, 44.87421417236328]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 11.0, 13.0, 18.0, 11.0, 16.0, 13.0, 16.0, 12.0, 19.0, 33.0, 26.0, 26.0, 23.0, 27.0, 37.0, 37.0, 37.0, 32.0, 32.0, 56.0, 31.0, 32.0, 42.0, 40.0, 34.0, 28.0, 36.0, 31.0, 21.0, 25.0, 20.0, 24.0, 30.0, 12.0, 18.0, 18.0, 5.0, 11.0, 8.0, 5.0, 7.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.3676700592041, -26.449026107788086, -25.530384063720703, -24.611740112304688, -23.693098068237305, -22.77445411682129, -21.855812072753906, -20.93716812133789, -20.018524169921875, -19.09988021850586, -18.181238174438477, -17.26259422302246, -16.343952178955078, -15.425308227539062, -14.506665229797363, -13.588022232055664, -12.669379234313965, -11.750736236572266, -10.832093238830566, -9.913450241088867, -8.994806289672852, -8.076163291931152, -7.157520294189453, -6.238876819610596, -5.3202338218688965, -4.401590824127197, -3.48294734954834, -2.5643043518066406, -1.6456611156463623, -0.727017879486084, 0.19162511825561523, 1.1102685928344727, 2.028911590576172, 2.94755482673645, 3.8661980628967285, 4.784841060638428, 5.703484535217285, 6.622127532958984, 7.540770530700684, 8.459413528442383, 9.378057479858398, 10.296700477600098, 11.215343475341797, 12.133987426757812, 13.052630424499512, 13.971273422241211, 14.88991641998291, 15.80855941772461, 16.727203369140625, 17.64584732055664, 18.564489364624023, 19.48313331604004, 20.401775360107422, 21.320419311523438, 22.239063262939453, 23.157705307006836, 24.07634735107422, 24.994991302490234, 25.913633346557617, 26.832277297973633, 27.750919342041016, 28.66956329345703, 29.588207244873047, 30.50684928894043, 31.425493240356445]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 7.0, 4.0, 1.0, 16.0, 18.0, 30.0, 37.0, 61.0, 95.0, 133.0, 185.0, 319.0, 417.0, 681.0, 1029.0, 1475.0, 2118.0, 3288.0, 5091.0, 7640.0, 11643.0, 16941.0, 25128.0, 36685.0, 53279.0, 74233.0, 98616.0, 119604.0, 128697.0, 120111.0, 98979.0, 74500.0, 53425.0, 37122.0, 25280.0, 17120.0, 11449.0, 7471.0, 5285.0, 3457.0, 2270.0, 1536.0, 1021.0, 668.0, 452.0, 308.0, 208.0, 155.0, 86.0, 64.0, 47.0, 15.0, 27.0, 17.0, 6.0, 9.0, 2.0, 6.0, 0.0, 2.0, 3.0], "bins": [-25.65625, -24.842041015625, -24.02783203125, -23.213623046875, -22.3994140625, -21.585205078125, -20.77099609375, -19.956787109375, -19.142578125, -18.328369140625, -17.51416015625, -16.699951171875, -15.8857421875, -15.071533203125, -14.25732421875, -13.443115234375, -12.62890625, -11.814697265625, -11.00048828125, -10.186279296875, -9.3720703125, -8.557861328125, -7.74365234375, -6.929443359375, -6.115234375, -5.301025390625, -4.48681640625, -3.672607421875, -2.8583984375, -2.044189453125, -1.22998046875, -0.415771484375, 0.3984375, 1.212646484375, 2.02685546875, 2.841064453125, 3.6552734375, 4.469482421875, 5.28369140625, 6.097900390625, 6.912109375, 7.726318359375, 8.54052734375, 9.354736328125, 10.1689453125, 10.983154296875, 11.79736328125, 12.611572265625, 13.42578125, 14.239990234375, 15.05419921875, 15.868408203125, 16.6826171875, 17.496826171875, 18.31103515625, 19.125244140625, 19.939453125, 20.753662109375, 21.56787109375, 22.382080078125, 23.1962890625, 24.010498046875, 24.82470703125, 25.638916015625, 26.453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 6.0, 8.0, 5.0, 9.0, 11.0, 15.0, 16.0, 12.0, 16.0, 14.0, 27.0, 33.0, 23.0, 26.0, 29.0, 33.0, 29.0, 34.0, 42.0, 38.0, 49.0, 31.0, 45.0, 32.0, 34.0, 36.0, 38.0, 24.0, 31.0, 36.0, 30.0, 24.0, 24.0, 19.0, 14.0, 18.0, 15.0, 19.0, 16.0, 11.0, 7.0, 5.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.0625, -27.177978515625, -26.29345703125, -25.408935546875, -24.5244140625, -23.639892578125, -22.75537109375, -21.870849609375, -20.986328125, -20.101806640625, -19.21728515625, -18.332763671875, -17.4482421875, -16.563720703125, -15.67919921875, -14.794677734375, -13.91015625, -13.025634765625, -12.14111328125, -11.256591796875, -10.3720703125, -9.487548828125, -8.60302734375, -7.718505859375, -6.833984375, -5.949462890625, -5.06494140625, -4.180419921875, -3.2958984375, -2.411376953125, -1.52685546875, -0.642333984375, 0.2421875, 1.126708984375, 2.01123046875, 2.895751953125, 3.7802734375, 4.664794921875, 5.54931640625, 6.433837890625, 7.318359375, 8.202880859375, 9.08740234375, 9.971923828125, 10.8564453125, 11.740966796875, 12.62548828125, 13.510009765625, 14.39453125, 15.279052734375, 16.16357421875, 17.048095703125, 17.9326171875, 18.817138671875, 19.70166015625, 20.586181640625, 21.470703125, 22.355224609375, 23.23974609375, 24.124267578125, 25.0087890625, 25.893310546875, 26.77783203125, 27.662353515625, 28.546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 11.0, 13.0, 13.0, 25.0, 36.0, 65.0, 89.0, 145.0, 214.0, 307.0, 448.0, 745.0, 1208.0, 2043.0, 3748.0, 6715.0, 12500.0, 25142.0, 51449.0, 105246.0, 194818.0, 252996.0, 188883.0, 100853.0, 49291.0, 24197.0, 12158.0, 6384.0, 3509.0, 2032.0, 1201.0, 743.0, 457.0, 279.0, 188.0, 138.0, 64.0, 59.0, 31.0, 35.0, 19.0, 12.0, 12.0, 10.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.0, -41.5888671875, -40.177734375, -38.7666015625, -37.35546875, -35.9443359375, -34.533203125, -33.1220703125, -31.7109375, -30.2998046875, -28.888671875, -27.4775390625, -26.06640625, -24.6552734375, -23.244140625, -21.8330078125, -20.421875, -19.0107421875, -17.599609375, -16.1884765625, -14.77734375, -13.3662109375, -11.955078125, -10.5439453125, -9.1328125, -7.7216796875, -6.310546875, -4.8994140625, -3.48828125, -2.0771484375, -0.666015625, 0.7451171875, 2.15625, 3.5673828125, 4.978515625, 6.3896484375, 7.80078125, 9.2119140625, 10.623046875, 12.0341796875, 13.4453125, 14.8564453125, 16.267578125, 17.6787109375, 19.08984375, 20.5009765625, 21.912109375, 23.3232421875, 24.734375, 26.1455078125, 27.556640625, 28.9677734375, 30.37890625, 31.7900390625, 33.201171875, 34.6123046875, 36.0234375, 37.4345703125, 38.845703125, 40.2568359375, 41.66796875, 43.0791015625, 44.490234375, 45.9013671875, 47.3125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 5.0, 5.0, 11.0, 6.0, 13.0, 18.0, 17.0, 20.0, 26.0, 22.0, 26.0, 33.0, 26.0, 33.0, 31.0, 28.0, 47.0, 43.0, 50.0, 47.0, 45.0, 42.0, 47.0, 46.0, 28.0, 38.0, 37.0, 27.0, 25.0, 24.0, 21.0, 21.0, 19.0, 13.0, 16.0, 7.0, 8.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-24.375, -23.670654296875, -22.96630859375, -22.261962890625, -21.5576171875, -20.853271484375, -20.14892578125, -19.444580078125, -18.740234375, -18.035888671875, -17.33154296875, -16.627197265625, -15.9228515625, -15.218505859375, -14.51416015625, -13.809814453125, -13.10546875, -12.401123046875, -11.69677734375, -10.992431640625, -10.2880859375, -9.583740234375, -8.87939453125, -8.175048828125, -7.470703125, -6.766357421875, -6.06201171875, -5.357666015625, -4.6533203125, -3.948974609375, -3.24462890625, -2.540283203125, -1.8359375, -1.131591796875, -0.42724609375, 0.277099609375, 0.9814453125, 1.685791015625, 2.39013671875, 3.094482421875, 3.798828125, 4.503173828125, 5.20751953125, 5.911865234375, 6.6162109375, 7.320556640625, 8.02490234375, 8.729248046875, 9.43359375, 10.137939453125, 10.84228515625, 11.546630859375, 12.2509765625, 12.955322265625, 13.65966796875, 14.364013671875, 15.068359375, 15.772705078125, 16.47705078125, 17.181396484375, 17.8857421875, 18.590087890625, 19.29443359375, 19.998779296875, 20.703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 7.0, 18.0, 23.0, 24.0, 29.0, 49.0, 69.0, 87.0, 141.0, 167.0, 284.0, 365.0, 551.0, 923.0, 1576.0, 2689.0, 5016.0, 9736.0, 20406.0, 48030.0, 114481.0, 241595.0, 295467.0, 171140.0, 73998.0, 31391.0, 14216.0, 7054.0, 3631.0, 2024.0, 1202.0, 731.0, 442.0, 295.0, 213.0, 161.0, 98.0, 62.0, 55.0, 31.0, 26.0, 15.0, 10.0, 6.0, 9.0, 1.0, 1.0, 2.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.71875, -20.0556640625, -19.392578125, -18.7294921875, -18.06640625, -17.4033203125, -16.740234375, -16.0771484375, -15.4140625, -14.7509765625, -14.087890625, -13.4248046875, -12.76171875, -12.0986328125, -11.435546875, -10.7724609375, -10.109375, -9.4462890625, -8.783203125, -8.1201171875, -7.45703125, -6.7939453125, -6.130859375, -5.4677734375, -4.8046875, -4.1416015625, -3.478515625, -2.8154296875, -2.15234375, -1.4892578125, -0.826171875, -0.1630859375, 0.5, 1.1630859375, 1.826171875, 2.4892578125, 3.15234375, 3.8154296875, 4.478515625, 5.1416015625, 5.8046875, 6.4677734375, 7.130859375, 7.7939453125, 8.45703125, 9.1201171875, 9.783203125, 10.4462890625, 11.109375, 11.7724609375, 12.435546875, 13.0986328125, 13.76171875, 14.4248046875, 15.087890625, 15.7509765625, 16.4140625, 17.0771484375, 17.740234375, 18.4033203125, 19.06640625, 19.7294921875, 20.392578125, 21.0556640625, 21.71875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 11.0, 7.0, 15.0, 11.0, 23.0, 28.0, 45.0, 74.0, 68.0, 102.0, 125.0, 98.0, 106.0, 97.0, 58.0, 32.0, 28.0, 27.0, 10.0, 10.0, 11.0, 4.0, 4.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0038852691650390625, -0.0037883222103118896, -0.003691375255584717, -0.003594428300857544, -0.003497481346130371, -0.0034005343914031982, -0.0033035874366760254, -0.0032066404819488525, -0.0031096935272216797, -0.003012746572494507, -0.002915799617767334, -0.002818852663040161, -0.0027219057083129883, -0.0026249587535858154, -0.0025280117988586426, -0.0024310648441314697, -0.002334117889404297, -0.002237170934677124, -0.002140223979949951, -0.0020432770252227783, -0.0019463300704956055, -0.0018493831157684326, -0.0017524361610412598, -0.001655489206314087, -0.001558542251586914, -0.0014615952968597412, -0.0013646483421325684, -0.0012677013874053955, -0.0011707544326782227, -0.0010738074779510498, -0.000976860523223877, -0.0008799135684967041, -0.0007829666137695312, -0.0006860196590423584, -0.0005890727043151855, -0.0004921257495880127, -0.00039517879486083984, -0.000298231840133667, -0.00020128488540649414, -0.00010433793067932129, -7.3909759521484375e-06, 8.955597877502441e-05, 0.00018650293350219727, 0.0002834498882293701, 0.00038039684295654297, 0.0004773437976837158, 0.0005742907524108887, 0.0006712377071380615, 0.0007681846618652344, 0.0008651316165924072, 0.0009620785713195801, 0.001059025526046753, 0.0011559724807739258, 0.0012529194355010986, 0.0013498663902282715, 0.0014468133449554443, 0.0015437602996826172, 0.00164070725440979, 0.0017376542091369629, 0.0018346011638641357, 0.0019315481185913086, 0.0020284950733184814, 0.0021254420280456543, 0.002222388982772827, 0.0023193359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 10.0, 5.0, 6.0, 10.0, 12.0, 18.0, 25.0, 38.0, 48.0, 52.0, 73.0, 102.0, 144.0, 172.0, 257.0, 353.0, 499.0, 722.0, 1144.0, 1989.0, 3318.0, 7076.0, 16613.0, 45369.0, 130809.0, 299046.0, 311374.0, 143995.0, 49906.0, 18224.0, 7645.0, 3665.0, 1966.0, 1183.0, 781.0, 499.0, 368.0, 291.0, 210.0, 139.0, 105.0, 77.0, 55.0, 46.0, 41.0, 23.0, 16.0, 11.0, 11.0, 7.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-32.59375, -31.57666015625, -30.5595703125, -29.54248046875, -28.525390625, -27.50830078125, -26.4912109375, -25.47412109375, -24.45703125, -23.43994140625, -22.4228515625, -21.40576171875, -20.388671875, -19.37158203125, -18.3544921875, -17.33740234375, -16.3203125, -15.30322265625, -14.2861328125, -13.26904296875, -12.251953125, -11.23486328125, -10.2177734375, -9.20068359375, -8.18359375, -7.16650390625, -6.1494140625, -5.13232421875, -4.115234375, -3.09814453125, -2.0810546875, -1.06396484375, -0.046875, 0.97021484375, 1.9873046875, 3.00439453125, 4.021484375, 5.03857421875, 6.0556640625, 7.07275390625, 8.08984375, 9.10693359375, 10.1240234375, 11.14111328125, 12.158203125, 13.17529296875, 14.1923828125, 15.20947265625, 16.2265625, 17.24365234375, 18.2607421875, 19.27783203125, 20.294921875, 21.31201171875, 22.3291015625, 23.34619140625, 24.36328125, 25.38037109375, 26.3974609375, 27.41455078125, 28.431640625, 29.44873046875, 30.4658203125, 31.48291015625, 32.5]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 2.0, 7.0, 18.0, 19.0, 19.0, 25.0, 42.0, 37.0, 63.0, 63.0, 82.0, 66.0, 82.0, 90.0, 70.0, 54.0, 55.0, 49.0, 35.0, 30.0, 19.0, 19.0, 16.0, 9.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-9.9921875, -9.7281494140625, -9.464111328125, -9.2000732421875, -8.93603515625, -8.6719970703125, -8.407958984375, -8.1439208984375, -7.8798828125, -7.6158447265625, -7.351806640625, -7.0877685546875, -6.82373046875, -6.5596923828125, -6.295654296875, -6.0316162109375, -5.767578125, -5.5035400390625, -5.239501953125, -4.9754638671875, -4.71142578125, -4.4473876953125, -4.183349609375, -3.9193115234375, -3.6552734375, -3.3912353515625, -3.127197265625, -2.8631591796875, -2.59912109375, -2.3350830078125, -2.071044921875, -1.8070068359375, -1.54296875, -1.2789306640625, -1.014892578125, -0.7508544921875, -0.48681640625, -0.2227783203125, 0.041259765625, 0.3052978515625, 0.5693359375, 0.8333740234375, 1.097412109375, 1.3614501953125, 1.62548828125, 1.8895263671875, 2.153564453125, 2.4176025390625, 2.681640625, 2.9456787109375, 3.209716796875, 3.4737548828125, 3.73779296875, 4.0018310546875, 4.265869140625, 4.5299072265625, 4.7939453125, 5.0579833984375, 5.322021484375, 5.5860595703125, 5.85009765625, 6.1141357421875, 6.378173828125, 6.6422119140625, 6.90625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 6.0, 7.0, 7.0, 9.0, 11.0, 20.0, 21.0, 8.0, 19.0, 32.0, 24.0, 38.0, 39.0, 47.0, 42.0, 50.0, 48.0, 41.0, 44.0, 44.0, 59.0, 47.0, 42.0, 38.0, 48.0, 36.0, 31.0, 26.0, 13.0, 17.0, 18.0, 17.0, 12.0, 6.0, 8.0, 10.0, 1.0, 4.0, 2.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.283079147338867, -24.300622940063477, -23.31816864013672, -22.335712432861328, -21.35325813293457, -20.37080192565918, -19.388347625732422, -18.40589141845703, -17.42343521118164, -16.44097900390625, -15.458524703979492, -14.476068496704102, -13.493614196777344, -12.511157989501953, -11.528702735900879, -10.546247482299805, -9.563793182373047, -8.581337928771973, -7.598882675170898, -6.616426944732666, -5.633971691131592, -4.651516437530518, -3.669060707092285, -2.686605453491211, -1.7041501998901367, -0.721694827079773, 0.2607605457305908, 1.2432160377502441, 2.2256712913513184, 3.2081265449523926, 4.190582275390625, 5.173037528991699, 6.155494689941406, 7.1379499435424805, 8.120405197143555, 9.102861404418945, 10.085315704345703, 11.067771911621094, 12.050227165222168, 13.032682418823242, 14.015137672424316, 14.99759292602539, 15.980048179626465, 16.96250343322754, 17.94495964050293, 18.927413940429688, 19.909870147705078, 20.89232635498047, 21.874780654907227, 22.857236862182617, 23.839691162109375, 24.822147369384766, 25.804601669311523, 26.787057876586914, 27.769512176513672, 28.751968383789062, 29.734424591064453, 30.716880798339844, 31.6993350982666, 32.68178939819336, 33.66424560546875, 34.64670181274414, 35.62915802001953, 36.611610412597656, 37.59406661987305]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 8.0, 6.0, 4.0, 13.0, 12.0, 19.0, 13.0, 12.0, 17.0, 17.0, 22.0, 24.0, 21.0, 29.0, 30.0, 33.0, 31.0, 32.0, 39.0, 42.0, 35.0, 32.0, 40.0, 28.0, 34.0, 39.0, 33.0, 41.0, 33.0, 30.0, 25.0, 24.0, 29.0, 22.0, 18.0, 22.0, 19.0, 12.0, 11.0, 12.0, 7.0, 10.0, 7.0, 5.0, 1.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.850452423095703, -25.021982192993164, -24.193513870239258, -23.36504364013672, -22.53657341003418, -21.70810317993164, -20.879634857177734, -20.051164627075195, -19.222694396972656, -18.394224166870117, -17.56575584411621, -16.737285614013672, -15.908815383911133, -15.08034610748291, -14.251876831054688, -13.423406600952148, -12.594938278198242, -11.76646900177002, -10.93799877166748, -10.109529495239258, -9.281059265136719, -8.452589988708496, -7.624120712280273, -6.795650959014893, -5.967181205749512, -5.138711452484131, -4.31024169921875, -3.4817724227905273, -2.6533026695251465, -1.8248329162597656, -0.996363639831543, -0.1678938865661621, 0.6605739593505859, 1.4890435934066772, 2.3175132274627686, 3.1459827423095703, 3.974452495574951, 4.802922248840332, 5.631391525268555, 6.4598612785339355, 7.288331031799316, 8.116800308227539, 8.945270538330078, 9.7737398147583, 10.602209091186523, 11.430679321289062, 12.259148597717285, 13.087617874145508, 13.916088104248047, 14.74455738067627, 15.573027610778809, 16.40149688720703, 17.22996711730957, 18.05843734741211, 18.886905670166016, 19.715375900268555, 20.543846130371094, 21.372316360473633, 22.20078468322754, 23.029254913330078, 23.857725143432617, 24.686195373535156, 25.514663696289062, 26.3431339263916, 27.171602249145508]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 6.0, 10.0, 19.0, 27.0, 38.0, 64.0, 89.0, 127.0, 251.0, 330.0, 528.0, 821.0, 1159.0, 1707.0, 2570.0, 3790.0, 5431.0, 7866.0, 11250.0, 15431.0, 21491.0, 29120.0, 37803.0, 48086.0, 58686.0, 69031.0, 78148.0, 84296.0, 86133.0, 84709.0, 78717.0, 69985.0, 59467.0, 48607.0, 37916.0, 29726.0, 21985.0, 16158.0, 11637.0, 8118.0, 5473.0, 3868.0, 2646.0, 1771.0, 1213.0, 789.0, 492.0, 347.0, 185.0, 160.0, 110.0, 72.0, 46.0, 29.0, 11.0, 9.0, 4.0, 7.0, 2.0, 1.0, 1.0], "bins": [-16.84375, -16.3095703125, -15.775390625, -15.2412109375, -14.70703125, -14.1728515625, -13.638671875, -13.1044921875, -12.5703125, -12.0361328125, -11.501953125, -10.9677734375, -10.43359375, -9.8994140625, -9.365234375, -8.8310546875, -8.296875, -7.7626953125, -7.228515625, -6.6943359375, -6.16015625, -5.6259765625, -5.091796875, -4.5576171875, -4.0234375, -3.4892578125, -2.955078125, -2.4208984375, -1.88671875, -1.3525390625, -0.818359375, -0.2841796875, 0.25, 0.7841796875, 1.318359375, 1.8525390625, 2.38671875, 2.9208984375, 3.455078125, 3.9892578125, 4.5234375, 5.0576171875, 5.591796875, 6.1259765625, 6.66015625, 7.1943359375, 7.728515625, 8.2626953125, 8.796875, 9.3310546875, 9.865234375, 10.3994140625, 10.93359375, 11.4677734375, 12.001953125, 12.5361328125, 13.0703125, 13.6044921875, 14.138671875, 14.6728515625, 15.20703125, 15.7412109375, 16.275390625, 16.8095703125, 17.34375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 11.0, 9.0, 4.0, 8.0, 16.0, 12.0, 15.0, 21.0, 11.0, 21.0, 22.0, 22.0, 42.0, 23.0, 30.0, 39.0, 44.0, 29.0, 46.0, 37.0, 42.0, 47.0, 30.0, 36.0, 41.0, 27.0, 40.0, 28.0, 36.0, 26.0, 25.0, 24.0, 23.0, 18.0, 17.0, 11.0, 7.0, 5.0, 9.0, 15.0, 5.0, 6.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.234375, -26.374267578125, -25.51416015625, -24.654052734375, -23.7939453125, -22.933837890625, -22.07373046875, -21.213623046875, -20.353515625, -19.493408203125, -18.63330078125, -17.773193359375, -16.9130859375, -16.052978515625, -15.19287109375, -14.332763671875, -13.47265625, -12.612548828125, -11.75244140625, -10.892333984375, -10.0322265625, -9.172119140625, -8.31201171875, -7.451904296875, -6.591796875, -5.731689453125, -4.87158203125, -4.011474609375, -3.1513671875, -2.291259765625, -1.43115234375, -0.571044921875, 0.2890625, 1.149169921875, 2.00927734375, 2.869384765625, 3.7294921875, 4.589599609375, 5.44970703125, 6.309814453125, 7.169921875, 8.030029296875, 8.89013671875, 9.750244140625, 10.6103515625, 11.470458984375, 12.33056640625, 13.190673828125, 14.05078125, 14.910888671875, 15.77099609375, 16.631103515625, 17.4912109375, 18.351318359375, 19.21142578125, 20.071533203125, 20.931640625, 21.791748046875, 22.65185546875, 23.511962890625, 24.3720703125, 25.232177734375, 26.09228515625, 26.952392578125, 27.8125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 9.0, 5.0, 14.0, 20.0, 24.0, 45.0, 72.0, 101.0, 164.0, 294.0, 464.0, 800.0, 1287.0, 2121.0, 3585.0, 5805.0, 9744.0, 16390.0, 26561.0, 42116.0, 64327.0, 90918.0, 117595.0, 134175.0, 135826.0, 119205.0, 94217.0, 66931.0, 44521.0, 27834.0, 17406.0, 10539.0, 6174.0, 3755.0, 2148.0, 1284.0, 807.0, 459.0, 307.0, 174.0, 134.0, 87.0, 50.0, 27.0, 13.0, 15.0, 5.0, 5.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0], "bins": [-36.53125, -35.45849609375, -34.3857421875, -33.31298828125, -32.240234375, -31.16748046875, -30.0947265625, -29.02197265625, -27.94921875, -26.87646484375, -25.8037109375, -24.73095703125, -23.658203125, -22.58544921875, -21.5126953125, -20.43994140625, -19.3671875, -18.29443359375, -17.2216796875, -16.14892578125, -15.076171875, -14.00341796875, -12.9306640625, -11.85791015625, -10.78515625, -9.71240234375, -8.6396484375, -7.56689453125, -6.494140625, -5.42138671875, -4.3486328125, -3.27587890625, -2.203125, -1.13037109375, -0.0576171875, 1.01513671875, 2.087890625, 3.16064453125, 4.2333984375, 5.30615234375, 6.37890625, 7.45166015625, 8.5244140625, 9.59716796875, 10.669921875, 11.74267578125, 12.8154296875, 13.88818359375, 14.9609375, 16.03369140625, 17.1064453125, 18.17919921875, 19.251953125, 20.32470703125, 21.3974609375, 22.47021484375, 23.54296875, 24.61572265625, 25.6884765625, 26.76123046875, 27.833984375, 28.90673828125, 29.9794921875, 31.05224609375, 32.125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 3.0, 3.0, 4.0, 9.0, 11.0, 15.0, 12.0, 14.0, 31.0, 21.0, 29.0, 21.0, 26.0, 39.0, 39.0, 25.0, 28.0, 38.0, 39.0, 40.0, 43.0, 37.0, 39.0, 39.0, 45.0, 29.0, 32.0, 33.0, 41.0, 18.0, 27.0, 31.0, 20.0, 17.0, 14.0, 10.0, 10.0, 12.0, 11.0, 6.0, 6.0, 5.0, 8.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.625, -16.036865234375, -15.44873046875, -14.860595703125, -14.2724609375, -13.684326171875, -13.09619140625, -12.508056640625, -11.919921875, -11.331787109375, -10.74365234375, -10.155517578125, -9.5673828125, -8.979248046875, -8.39111328125, -7.802978515625, -7.21484375, -6.626708984375, -6.03857421875, -5.450439453125, -4.8623046875, -4.274169921875, -3.68603515625, -3.097900390625, -2.509765625, -1.921630859375, -1.33349609375, -0.745361328125, -0.1572265625, 0.430908203125, 1.01904296875, 1.607177734375, 2.1953125, 2.783447265625, 3.37158203125, 3.959716796875, 4.5478515625, 5.135986328125, 5.72412109375, 6.312255859375, 6.900390625, 7.488525390625, 8.07666015625, 8.664794921875, 9.2529296875, 9.841064453125, 10.42919921875, 11.017333984375, 11.60546875, 12.193603515625, 12.78173828125, 13.369873046875, 13.9580078125, 14.546142578125, 15.13427734375, 15.722412109375, 16.310546875, 16.898681640625, 17.48681640625, 18.074951171875, 18.6630859375, 19.251220703125, 19.83935546875, 20.427490234375, 21.015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 6.0, 8.0, 8.0, 11.0, 21.0, 21.0, 36.0, 41.0, 51.0, 61.0, 110.0, 132.0, 251.0, 323.0, 489.0, 751.0, 1273.0, 2253.0, 3677.0, 6886.0, 12842.0, 23779.0, 44657.0, 78862.0, 125698.0, 170939.0, 182994.0, 152709.0, 103767.0, 61278.0, 34083.0, 18077.0, 9676.0, 5200.0, 2946.0, 1643.0, 955.0, 664.0, 415.0, 288.0, 188.0, 136.0, 89.0, 83.0, 50.0, 34.0, 37.0, 20.0, 21.0, 7.0, 7.0, 7.0, 4.0, 0.0, 1.0, 1.0], "bins": [-11.703125, -11.3616943359375, -11.020263671875, -10.6788330078125, -10.33740234375, -9.9959716796875, -9.654541015625, -9.3131103515625, -8.9716796875, -8.6302490234375, -8.288818359375, -7.9473876953125, -7.60595703125, -7.2645263671875, -6.923095703125, -6.5816650390625, -6.240234375, -5.8988037109375, -5.557373046875, -5.2159423828125, -4.87451171875, -4.5330810546875, -4.191650390625, -3.8502197265625, -3.5087890625, -3.1673583984375, -2.825927734375, -2.4844970703125, -2.14306640625, -1.8016357421875, -1.460205078125, -1.1187744140625, -0.77734375, -0.4359130859375, -0.094482421875, 0.2469482421875, 0.58837890625, 0.9298095703125, 1.271240234375, 1.6126708984375, 1.9541015625, 2.2955322265625, 2.636962890625, 2.9783935546875, 3.31982421875, 3.6612548828125, 4.002685546875, 4.3441162109375, 4.685546875, 5.0269775390625, 5.368408203125, 5.7098388671875, 6.05126953125, 6.3927001953125, 6.734130859375, 7.0755615234375, 7.4169921875, 7.7584228515625, 8.099853515625, 8.4412841796875, 8.78271484375, 9.1241455078125, 9.465576171875, 9.8070068359375, 10.1484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 6.0, 10.0, 11.0, 6.0, 14.0, 13.0, 16.0, 37.0, 33.0, 33.0, 40.0, 54.0, 51.0, 46.0, 43.0, 70.0, 51.0, 61.0, 47.0, 49.0, 45.0, 49.0, 47.0, 31.0, 34.0, 18.0, 15.0, 13.0, 7.0, 4.0, 13.0, 4.0, 5.0, 3.0, 3.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010766983032226562, -0.0010413676500320435, -0.0010060369968414307, -0.0009707063436508179, -0.0009353756904602051, -0.0009000450372695923, -0.0008647143840789795, -0.0008293837308883667, -0.0007940530776977539, -0.0007587224245071411, -0.0007233917713165283, -0.0006880611181259155, -0.0006527304649353027, -0.0006173998117446899, -0.0005820691585540771, -0.0005467385053634644, -0.0005114078521728516, -0.00047607719898223877, -0.000440746545791626, -0.0004054158926010132, -0.0003700852394104004, -0.0003347545862197876, -0.0002994239330291748, -0.000264093279838562, -0.00022876262664794922, -0.00019343197345733643, -0.00015810132026672363, -0.00012277066707611084, -8.744001388549805e-05, -5.2109360694885254e-05, -1.677870750427246e-05, 1.8551945686340332e-05, 5.3882598876953125e-05, 8.921325206756592e-05, 0.0001245439052581787, 0.0001598745584487915, 0.0001952052116394043, 0.0002305358648300171, 0.0002658665180206299, 0.0003011971712112427, 0.00033652782440185547, 0.00037185847759246826, 0.00040718913078308105, 0.00044251978397369385, 0.00047785043716430664, 0.0005131810903549194, 0.0005485117435455322, 0.000583842396736145, 0.0006191730499267578, 0.0006545037031173706, 0.0006898343563079834, 0.0007251650094985962, 0.000760495662689209, 0.0007958263158798218, 0.0008311569690704346, 0.0008664876222610474, 0.0009018182754516602, 0.000937148928642273, 0.0009724795818328857, 0.0010078102350234985, 0.0010431408882141113, 0.0010784715414047241, 0.001113802194595337, 0.0011491328477859497, 0.0011844635009765625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 10.0, 8.0, 7.0, 16.0, 9.0, 42.0, 34.0, 61.0, 98.0, 127.0, 205.0, 309.0, 485.0, 821.0, 1236.0, 2076.0, 3387.0, 5562.0, 9408.0, 15933.0, 26581.0, 43793.0, 68496.0, 100745.0, 133191.0, 151173.0, 144463.0, 116712.0, 83793.0, 54233.0, 34315.0, 20465.0, 12295.0, 7108.0, 4309.0, 2689.0, 1575.0, 1009.0, 612.0, 406.0, 244.0, 164.0, 118.0, 71.0, 50.0, 34.0, 25.0, 22.0, 13.0, 6.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.3359375, -8.0556640625, -7.775390625, -7.4951171875, -7.21484375, -6.9345703125, -6.654296875, -6.3740234375, -6.09375, -5.8134765625, -5.533203125, -5.2529296875, -4.97265625, -4.6923828125, -4.412109375, -4.1318359375, -3.8515625, -3.5712890625, -3.291015625, -3.0107421875, -2.73046875, -2.4501953125, -2.169921875, -1.8896484375, -1.609375, -1.3291015625, -1.048828125, -0.7685546875, -0.48828125, -0.2080078125, 0.072265625, 0.3525390625, 0.6328125, 0.9130859375, 1.193359375, 1.4736328125, 1.75390625, 2.0341796875, 2.314453125, 2.5947265625, 2.875, 3.1552734375, 3.435546875, 3.7158203125, 3.99609375, 4.2763671875, 4.556640625, 4.8369140625, 5.1171875, 5.3974609375, 5.677734375, 5.9580078125, 6.23828125, 6.5185546875, 6.798828125, 7.0791015625, 7.359375, 7.6396484375, 7.919921875, 8.2001953125, 8.48046875, 8.7607421875, 9.041015625, 9.3212890625, 9.6015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 9.0, 6.0, 12.0, 19.0, 11.0, 14.0, 23.0, 15.0, 31.0, 23.0, 35.0, 27.0, 45.0, 44.0, 36.0, 45.0, 49.0, 52.0, 50.0, 54.0, 39.0, 51.0, 42.0, 38.0, 29.0, 34.0, 27.0, 16.0, 19.0, 20.0, 11.0, 8.0, 12.0, 10.0, 10.0, 7.0, 5.0, 7.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.654296875, -3.551025390625, -3.44775390625, -3.344482421875, -3.2412109375, -3.137939453125, -3.03466796875, -2.931396484375, -2.828125, -2.724853515625, -2.62158203125, -2.518310546875, -2.4150390625, -2.311767578125, -2.20849609375, -2.105224609375, -2.001953125, -1.898681640625, -1.79541015625, -1.692138671875, -1.5888671875, -1.485595703125, -1.38232421875, -1.279052734375, -1.17578125, -1.072509765625, -0.96923828125, -0.865966796875, -0.7626953125, -0.659423828125, -0.55615234375, -0.452880859375, -0.349609375, -0.246337890625, -0.14306640625, -0.039794921875, 0.0634765625, 0.166748046875, 0.27001953125, 0.373291015625, 0.4765625, 0.579833984375, 0.68310546875, 0.786376953125, 0.8896484375, 0.992919921875, 1.09619140625, 1.199462890625, 1.302734375, 1.406005859375, 1.50927734375, 1.612548828125, 1.7158203125, 1.819091796875, 1.92236328125, 2.025634765625, 2.12890625, 2.232177734375, 2.33544921875, 2.438720703125, 2.5419921875, 2.645263671875, 2.74853515625, 2.851806640625, 2.955078125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 3.0, 7.0, 3.0, 7.0, 11.0, 6.0, 12.0, 16.0, 15.0, 16.0, 25.0, 19.0, 27.0, 30.0, 37.0, 23.0, 24.0, 38.0, 36.0, 54.0, 39.0, 30.0, 44.0, 38.0, 37.0, 50.0, 47.0, 34.0, 37.0, 19.0, 36.0, 26.0, 21.0, 11.0, 26.0, 19.0, 13.0, 10.0, 10.0, 3.0, 6.0, 5.0, 5.0, 5.0, 6.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-25.48256492614746, -24.663169860839844, -23.843772888183594, -23.024377822875977, -22.20498275756836, -21.38558578491211, -20.566190719604492, -19.746795654296875, -18.927398681640625, -18.108003616333008, -17.288606643676758, -16.46921157836914, -15.649816513061523, -14.83042049407959, -14.011024475097656, -13.191629409790039, -12.372234344482422, -11.552838325500488, -10.733443260192871, -9.914047241210938, -9.09465217590332, -8.275256156921387, -7.455860137939453, -6.636464595794678, -5.817069053649902, -4.997673511505127, -4.178277969360352, -3.358881950378418, -2.5394864082336426, -1.7200908660888672, -0.9006948471069336, -0.0812993049621582, 0.7380943298339844, 1.5574899911880493, 2.3768856525421143, 3.1962814331054688, 4.015676975250244, 4.8350725173950195, 5.654468536376953, 6.4738640785217285, 7.293259620666504, 8.112655639648438, 8.932050704956055, 9.751446723937988, 10.570842742919922, 11.390237808227539, 12.209633827209473, 13.029029846191406, 13.848424911499023, 14.667820930480957, 15.487215995788574, 16.306612014770508, 17.126007080078125, 17.945404052734375, 18.764799118041992, 19.58419418334961, 20.40359115600586, 21.222986221313477, 22.042383193969727, 22.861778259277344, 23.68117332458496, 24.500568389892578, 25.319965362548828, 26.139360427856445, 26.958755493164062]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 9.0, 8.0, 5.0, 9.0, 8.0, 9.0, 11.0, 13.0, 24.0, 17.0, 22.0, 24.0, 17.0, 23.0, 35.0, 31.0, 36.0, 26.0, 40.0, 34.0, 29.0, 42.0, 30.0, 50.0, 41.0, 34.0, 28.0, 41.0, 26.0, 31.0, 26.0, 26.0, 23.0, 20.0, 18.0, 23.0, 13.0, 16.0, 19.0, 10.0, 11.0, 7.0, 10.0, 3.0, 6.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-28.986473083496094, -28.149890899658203, -27.313310623168945, -26.476728439331055, -25.640148162841797, -24.803565979003906, -23.96698570251465, -23.130403518676758, -22.2938232421875, -21.45724105834961, -20.62066078186035, -19.78407859802246, -18.947498321533203, -18.110916137695312, -17.274335861206055, -16.437753677368164, -15.60117244720459, -14.764591217041016, -13.928009986877441, -13.091428756713867, -12.254847526550293, -11.418266296386719, -10.581684112548828, -9.74510383605957, -8.90852165222168, -8.071940422058105, -7.235359191894531, -6.398777961730957, -5.562196731567383, -4.72561502456665, -3.889033794403076, -3.052452564239502, -2.215871810913086, -1.3792905807495117, -0.542709231376648, 0.2938721179962158, 1.13045334815979, 1.9670348167419434, 2.8036160469055176, 3.640197277069092, 4.476778507232666, 5.31335973739624, 6.1499409675598145, 6.986522674560547, 7.823103904724121, 8.659685134887695, 9.49626636505127, 10.332847595214844, 11.169428825378418, 12.006010055541992, 12.842591285705566, 13.67917251586914, 14.515753746032715, 15.352334976196289, 16.18891716003418, 17.025497436523438, 17.862079620361328, 18.69866180419922, 19.535242080688477, 20.371824264526367, 21.208404541015625, 22.044986724853516, 22.881567001342773, 23.718149185180664, 24.554729461669922]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 10.0, 9.0, 15.0, 14.0, 29.0, 48.0, 77.0, 122.0, 185.0, 301.0, 440.0, 738.0, 1171.0, 1878.0, 3175.0, 5356.0, 9113.0, 15545.0, 26916.0, 47192.0, 83154.0, 146068.0, 252576.0, 415651.0, 609087.0, 726383.0, 664824.0, 479148.0, 300086.0, 174449.0, 99493.0, 55493.0, 31645.0, 18015.0, 10537.0, 5959.0, 3636.0, 2171.0, 1366.0, 804.0, 482.0, 316.0, 202.0, 146.0, 98.0, 58.0, 40.0, 24.0, 18.0, 12.0, 5.0, 8.0, 3.0, 3.0, 2.0, 1.0], "bins": [-31.046875, -30.12451171875, -29.2021484375, -28.27978515625, -27.357421875, -26.43505859375, -25.5126953125, -24.59033203125, -23.66796875, -22.74560546875, -21.8232421875, -20.90087890625, -19.978515625, -19.05615234375, -18.1337890625, -17.21142578125, -16.2890625, -15.36669921875, -14.4443359375, -13.52197265625, -12.599609375, -11.67724609375, -10.7548828125, -9.83251953125, -8.91015625, -7.98779296875, -7.0654296875, -6.14306640625, -5.220703125, -4.29833984375, -3.3759765625, -2.45361328125, -1.53125, -0.60888671875, 0.3134765625, 1.23583984375, 2.158203125, 3.08056640625, 4.0029296875, 4.92529296875, 5.84765625, 6.77001953125, 7.6923828125, 8.61474609375, 9.537109375, 10.45947265625, 11.3818359375, 12.30419921875, 13.2265625, 14.14892578125, 15.0712890625, 15.99365234375, 16.916015625, 17.83837890625, 18.7607421875, 19.68310546875, 20.60546875, 21.52783203125, 22.4501953125, 23.37255859375, 24.294921875, 25.21728515625, 26.1396484375, 27.06201171875, 27.984375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 5.0, 6.0, 8.0, 7.0, 15.0, 12.0, 15.0, 23.0, 15.0, 20.0, 29.0, 32.0, 36.0, 31.0, 31.0, 33.0, 45.0, 40.0, 55.0, 36.0, 29.0, 32.0, 30.0, 46.0, 31.0, 43.0, 39.0, 25.0, 23.0, 30.0, 23.0, 19.0, 18.0, 15.0, 20.0, 7.0, 6.0, 7.0, 7.0, 15.0, 8.0, 8.0, 8.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-23.078125, -22.40576171875, -21.7333984375, -21.06103515625, -20.388671875, -19.71630859375, -19.0439453125, -18.37158203125, -17.69921875, -17.02685546875, -16.3544921875, -15.68212890625, -15.009765625, -14.33740234375, -13.6650390625, -12.99267578125, -12.3203125, -11.64794921875, -10.9755859375, -10.30322265625, -9.630859375, -8.95849609375, -8.2861328125, -7.61376953125, -6.94140625, -6.26904296875, -5.5966796875, -4.92431640625, -4.251953125, -3.57958984375, -2.9072265625, -2.23486328125, -1.5625, -0.89013671875, -0.2177734375, 0.45458984375, 1.126953125, 1.79931640625, 2.4716796875, 3.14404296875, 3.81640625, 4.48876953125, 5.1611328125, 5.83349609375, 6.505859375, 7.17822265625, 7.8505859375, 8.52294921875, 9.1953125, 9.86767578125, 10.5400390625, 11.21240234375, 11.884765625, 12.55712890625, 13.2294921875, 13.90185546875, 14.57421875, 15.24658203125, 15.9189453125, 16.59130859375, 17.263671875, 17.93603515625, 18.6083984375, 19.28076171875, 19.953125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 6.0, 10.0, 22.0, 25.0, 44.0, 55.0, 134.0, 190.0, 317.0, 538.0, 886.0, 1609.0, 2766.0, 4702.0, 8186.0, 14239.0, 25060.0, 42432.0, 73552.0, 125123.0, 203678.0, 316730.0, 456324.0, 580987.0, 624757.0, 556222.0, 422077.0, 287297.0, 181404.0, 110530.0, 65267.0, 37887.0, 21654.0, 12615.0, 7147.0, 4119.0, 2331.0, 1401.0, 749.0, 467.0, 301.0, 164.0, 107.0, 65.0, 53.0, 28.0, 9.0, 9.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-27.75, -26.918701171875, -26.08740234375, -25.256103515625, -24.4248046875, -23.593505859375, -22.76220703125, -21.930908203125, -21.099609375, -20.268310546875, -19.43701171875, -18.605712890625, -17.7744140625, -16.943115234375, -16.11181640625, -15.280517578125, -14.44921875, -13.617919921875, -12.78662109375, -11.955322265625, -11.1240234375, -10.292724609375, -9.46142578125, -8.630126953125, -7.798828125, -6.967529296875, -6.13623046875, -5.304931640625, -4.4736328125, -3.642333984375, -2.81103515625, -1.979736328125, -1.1484375, -0.317138671875, 0.51416015625, 1.345458984375, 2.1767578125, 3.008056640625, 3.83935546875, 4.670654296875, 5.501953125, 6.333251953125, 7.16455078125, 7.995849609375, 8.8271484375, 9.658447265625, 10.48974609375, 11.321044921875, 12.15234375, 12.983642578125, 13.81494140625, 14.646240234375, 15.4775390625, 16.308837890625, 17.14013671875, 17.971435546875, 18.802734375, 19.634033203125, 20.46533203125, 21.296630859375, 22.1279296875, 22.959228515625, 23.79052734375, 24.621826171875, 25.453125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 8.0, 7.0, 8.0, 12.0, 18.0, 16.0, 16.0, 47.0, 46.0, 48.0, 51.0, 74.0, 93.0, 109.0, 117.0, 144.0, 161.0, 164.0, 186.0, 196.0, 221.0, 223.0, 222.0, 197.0, 217.0, 204.0, 182.0, 154.0, 142.0, 114.0, 141.0, 86.0, 87.0, 80.0, 53.0, 39.0, 43.0, 47.0, 20.0, 23.0, 16.0, 10.0, 8.0, 7.0, 5.0, 7.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-9.9453125, -9.609619140625, -9.27392578125, -8.938232421875, -8.6025390625, -8.266845703125, -7.93115234375, -7.595458984375, -7.259765625, -6.924072265625, -6.58837890625, -6.252685546875, -5.9169921875, -5.581298828125, -5.24560546875, -4.909912109375, -4.57421875, -4.238525390625, -3.90283203125, -3.567138671875, -3.2314453125, -2.895751953125, -2.56005859375, -2.224365234375, -1.888671875, -1.552978515625, -1.21728515625, -0.881591796875, -0.5458984375, -0.210205078125, 0.12548828125, 0.461181640625, 0.796875, 1.132568359375, 1.46826171875, 1.803955078125, 2.1396484375, 2.475341796875, 2.81103515625, 3.146728515625, 3.482421875, 3.818115234375, 4.15380859375, 4.489501953125, 4.8251953125, 5.160888671875, 5.49658203125, 5.832275390625, 6.16796875, 6.503662109375, 6.83935546875, 7.175048828125, 7.5107421875, 7.846435546875, 8.18212890625, 8.517822265625, 8.853515625, 9.189208984375, 9.52490234375, 9.860595703125, 10.1962890625, 10.531982421875, 10.86767578125, 11.203369140625, 11.5390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 5.0, 9.0, 21.0, 23.0, 16.0, 19.0, 30.0, 24.0, 38.0, 43.0, 40.0, 49.0, 24.0, 48.0, 42.0, 46.0, 38.0, 41.0, 34.0, 47.0, 37.0, 45.0, 41.0, 21.0, 35.0, 27.0, 25.0, 18.0, 16.0, 17.0, 12.0, 9.0, 9.0, 13.0, 9.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.804954528808594, -24.957992553710938, -24.11103057861328, -23.264068603515625, -22.41710662841797, -21.570144653320312, -20.723182678222656, -19.876220703125, -19.029258728027344, -18.182296752929688, -17.33533477783203, -16.488372802734375, -15.641410827636719, -14.794448852539062, -13.94748592376709, -13.100523948669434, -12.253561019897461, -11.406599044799805, -10.559637069702148, -9.712675094604492, -8.865713119506836, -8.01875114440918, -7.171788215637207, -6.324826240539551, -5.4778642654418945, -4.630902290344238, -3.783940076828003, -2.9369778633117676, -2.0900158882141113, -1.243053913116455, -0.3960914611816406, 0.4508705139160156, 1.2978324890136719, 2.144794464111328, 2.9917566776275635, 3.838718891143799, 4.685680866241455, 5.532642841339111, 6.379605293273926, 7.226567268371582, 8.073529243469238, 8.920491218566895, 9.76745319366455, 10.614416122436523, 11.46137809753418, 12.308340072631836, 13.155302047729492, 14.002264022827148, 14.849225997924805, 15.696187973022461, 16.543149948120117, 17.390111923217773, 18.23707389831543, 19.084035873413086, 19.930999755859375, 20.77796173095703, 21.624923706054688, 22.471885681152344, 23.31884765625, 24.165809631347656, 25.012771606445312, 25.85973358154297, 26.706695556640625, 27.55365753173828, 28.400619506835938]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 7.0, 4.0, 10.0, 6.0, 12.0, 12.0, 22.0, 21.0, 30.0, 23.0, 24.0, 22.0, 27.0, 21.0, 25.0, 34.0, 49.0, 35.0, 43.0, 39.0, 51.0, 39.0, 42.0, 24.0, 36.0, 32.0, 41.0, 28.0, 23.0, 23.0, 28.0, 21.0, 20.0, 22.0, 12.0, 18.0, 11.0, 10.0, 12.0, 9.0, 5.0, 4.0, 5.0, 7.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.896869659423828, -22.094961166381836, -21.293052673339844, -20.491146087646484, -19.689237594604492, -18.8873291015625, -18.085420608520508, -17.283512115478516, -16.481605529785156, -15.679697036743164, -14.877789497375488, -14.075881004333496, -13.27397346496582, -12.472064971923828, -11.670156478881836, -10.868247985839844, -10.066339492797852, -9.26443099975586, -8.462523460388184, -7.660614967346191, -6.858706951141357, -6.056798934936523, -5.254890441894531, -4.452982425689697, -3.6510744094848633, -2.8491663932800293, -2.047258138656616, -1.2453498840332031, -0.44344186782836914, 0.35846614837646484, 1.160374641418457, 1.962282657623291, 2.764190673828125, 3.566098690032959, 4.368006706237793, 5.169915199279785, 5.971823215484619, 6.773731231689453, 7.575639724731445, 8.377548217773438, 9.179455757141113, 9.981364250183105, 10.783271789550781, 11.585180282592773, 12.387088775634766, 13.188996315002441, 13.990904808044434, 14.79281234741211, 15.594720840454102, 16.396629333496094, 17.198537826538086, 18.000446319580078, 18.802352905273438, 19.60426139831543, 20.406169891357422, 21.208078384399414, 22.009986877441406, 22.8118953704834, 23.61380386352539, 24.41571044921875, 25.217618942260742, 26.019527435302734, 26.821435928344727, 27.62334442138672, 28.425251007080078]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 9.0, 12.0, 34.0, 31.0, 56.0, 92.0, 110.0, 206.0, 303.0, 441.0, 747.0, 1115.0, 1826.0, 2750.0, 4119.0, 6431.0, 9410.0, 14419.0, 21292.0, 30624.0, 43834.0, 61289.0, 82360.0, 105290.0, 124282.0, 126018.0, 110470.0, 87300.0, 65190.0, 46888.0, 32790.0, 23105.0, 15540.0, 10471.0, 6954.0, 4404.0, 3014.0, 1806.0, 1232.0, 823.0, 507.0, 346.0, 217.0, 151.0, 94.0, 39.0, 47.0, 29.0, 18.0, 12.0, 6.0, 2.0, 4.0, 1.0, 0.0, 4.0, 1.0], "bins": [-27.5625, -26.703857421875, -25.84521484375, -24.986572265625, -24.1279296875, -23.269287109375, -22.41064453125, -21.552001953125, -20.693359375, -19.834716796875, -18.97607421875, -18.117431640625, -17.2587890625, -16.400146484375, -15.54150390625, -14.682861328125, -13.82421875, -12.965576171875, -12.10693359375, -11.248291015625, -10.3896484375, -9.531005859375, -8.67236328125, -7.813720703125, -6.955078125, -6.096435546875, -5.23779296875, -4.379150390625, -3.5205078125, -2.661865234375, -1.80322265625, -0.944580078125, -0.0859375, 0.772705078125, 1.63134765625, 2.489990234375, 3.3486328125, 4.207275390625, 5.06591796875, 5.924560546875, 6.783203125, 7.641845703125, 8.50048828125, 9.359130859375, 10.2177734375, 11.076416015625, 11.93505859375, 12.793701171875, 13.65234375, 14.510986328125, 15.36962890625, 16.228271484375, 17.0869140625, 17.945556640625, 18.80419921875, 19.662841796875, 20.521484375, 21.380126953125, 22.23876953125, 23.097412109375, 23.9560546875, 24.814697265625, 25.67333984375, 26.531982421875, 27.390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 17.0, 12.0, 17.0, 18.0, 22.0, 22.0, 30.0, 26.0, 29.0, 29.0, 30.0, 37.0, 43.0, 23.0, 37.0, 43.0, 42.0, 46.0, 38.0, 32.0, 38.0, 33.0, 28.0, 30.0, 26.0, 38.0, 25.0, 26.0, 23.0, 20.0, 15.0, 17.0, 14.0, 15.0, 8.0, 8.0, 6.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.984375, -20.29052734375, -19.5966796875, -18.90283203125, -18.208984375, -17.51513671875, -16.8212890625, -16.12744140625, -15.43359375, -14.73974609375, -14.0458984375, -13.35205078125, -12.658203125, -11.96435546875, -11.2705078125, -10.57666015625, -9.8828125, -9.18896484375, -8.4951171875, -7.80126953125, -7.107421875, -6.41357421875, -5.7197265625, -5.02587890625, -4.33203125, -3.63818359375, -2.9443359375, -2.25048828125, -1.556640625, -0.86279296875, -0.1689453125, 0.52490234375, 1.21875, 1.91259765625, 2.6064453125, 3.30029296875, 3.994140625, 4.68798828125, 5.3818359375, 6.07568359375, 6.76953125, 7.46337890625, 8.1572265625, 8.85107421875, 9.544921875, 10.23876953125, 10.9326171875, 11.62646484375, 12.3203125, 13.01416015625, 13.7080078125, 14.40185546875, 15.095703125, 15.78955078125, 16.4833984375, 17.17724609375, 17.87109375, 18.56494140625, 19.2587890625, 19.95263671875, 20.646484375, 21.34033203125, 22.0341796875, 22.72802734375, 23.421875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 13.0, 18.0, 23.0, 33.0, 48.0, 60.0, 94.0, 125.0, 200.0, 279.0, 419.0, 640.0, 976.0, 1297.0, 2163.0, 3112.0, 4903.0, 7566.0, 11867.0, 19107.0, 30508.0, 49894.0, 80161.0, 124964.0, 172296.0, 177433.0, 132403.0, 85340.0, 52980.0, 33059.0, 20664.0, 12766.0, 7941.0, 5287.0, 3375.0, 2179.0, 1394.0, 966.0, 669.0, 439.0, 283.0, 207.0, 130.0, 102.0, 51.0, 35.0, 31.0, 22.0, 9.0, 9.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-35.375, -34.27197265625, -33.1689453125, -32.06591796875, -30.962890625, -29.85986328125, -28.7568359375, -27.65380859375, -26.55078125, -25.44775390625, -24.3447265625, -23.24169921875, -22.138671875, -21.03564453125, -19.9326171875, -18.82958984375, -17.7265625, -16.62353515625, -15.5205078125, -14.41748046875, -13.314453125, -12.21142578125, -11.1083984375, -10.00537109375, -8.90234375, -7.79931640625, -6.6962890625, -5.59326171875, -4.490234375, -3.38720703125, -2.2841796875, -1.18115234375, -0.078125, 1.02490234375, 2.1279296875, 3.23095703125, 4.333984375, 5.43701171875, 6.5400390625, 7.64306640625, 8.74609375, 9.84912109375, 10.9521484375, 12.05517578125, 13.158203125, 14.26123046875, 15.3642578125, 16.46728515625, 17.5703125, 18.67333984375, 19.7763671875, 20.87939453125, 21.982421875, 23.08544921875, 24.1884765625, 25.29150390625, 26.39453125, 27.49755859375, 28.6005859375, 29.70361328125, 30.806640625, 31.90966796875, 33.0126953125, 34.11572265625, 35.21875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 4.0, 6.0, 9.0, 10.0, 9.0, 11.0, 30.0, 26.0, 24.0, 32.0, 24.0, 30.0, 44.0, 40.0, 40.0, 32.0, 41.0, 66.0, 50.0, 48.0, 56.0, 56.0, 28.0, 43.0, 38.0, 27.0, 22.0, 31.0, 20.0, 16.0, 12.0, 19.0, 18.0, 10.0, 2.0, 7.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.859375, -19.182861328125, -18.50634765625, -17.829833984375, -17.1533203125, -16.476806640625, -15.80029296875, -15.123779296875, -14.447265625, -13.770751953125, -13.09423828125, -12.417724609375, -11.7412109375, -11.064697265625, -10.38818359375, -9.711669921875, -9.03515625, -8.358642578125, -7.68212890625, -7.005615234375, -6.3291015625, -5.652587890625, -4.97607421875, -4.299560546875, -3.623046875, -2.946533203125, -2.27001953125, -1.593505859375, -0.9169921875, -0.240478515625, 0.43603515625, 1.112548828125, 1.7890625, 2.465576171875, 3.14208984375, 3.818603515625, 4.4951171875, 5.171630859375, 5.84814453125, 6.524658203125, 7.201171875, 7.877685546875, 8.55419921875, 9.230712890625, 9.9072265625, 10.583740234375, 11.26025390625, 11.936767578125, 12.61328125, 13.289794921875, 13.96630859375, 14.642822265625, 15.3193359375, 15.995849609375, 16.67236328125, 17.348876953125, 18.025390625, 18.701904296875, 19.37841796875, 20.054931640625, 20.7314453125, 21.407958984375, 22.08447265625, 22.760986328125, 23.4375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 9.0, 4.0, 8.0, 12.0, 16.0, 40.0, 44.0, 80.0, 90.0, 169.0, 260.0, 365.0, 579.0, 954.0, 1555.0, 2670.0, 4804.0, 8696.0, 16852.0, 35099.0, 85035.0, 295588.0, 395284.0, 112982.0, 43274.0, 20209.0, 10317.0, 5637.0, 3121.0, 1910.0, 1066.0, 646.0, 435.0, 258.0, 158.0, 98.0, 87.0, 51.0, 34.0, 21.0, 17.0, 12.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.65625, -34.43212890625, -33.2080078125, -31.98388671875, -30.759765625, -29.53564453125, -28.3115234375, -27.08740234375, -25.86328125, -24.63916015625, -23.4150390625, -22.19091796875, -20.966796875, -19.74267578125, -18.5185546875, -17.29443359375, -16.0703125, -14.84619140625, -13.6220703125, -12.39794921875, -11.173828125, -9.94970703125, -8.7255859375, -7.50146484375, -6.27734375, -5.05322265625, -3.8291015625, -2.60498046875, -1.380859375, -0.15673828125, 1.0673828125, 2.29150390625, 3.515625, 4.73974609375, 5.9638671875, 7.18798828125, 8.412109375, 9.63623046875, 10.8603515625, 12.08447265625, 13.30859375, 14.53271484375, 15.7568359375, 16.98095703125, 18.205078125, 19.42919921875, 20.6533203125, 21.87744140625, 23.1015625, 24.32568359375, 25.5498046875, 26.77392578125, 27.998046875, 29.22216796875, 30.4462890625, 31.67041015625, 32.89453125, 34.11865234375, 35.3427734375, 36.56689453125, 37.791015625, 39.01513671875, 40.2392578125, 41.46337890625, 42.6875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 8.0, 4.0, 11.0, 17.0, 5.0, 16.0, 13.0, 18.0, 28.0, 42.0, 62.0, 101.0, 140.0, 158.0, 120.0, 54.0, 46.0, 33.0, 19.0, 19.0, 18.0, 12.0, 6.0, 8.0, 4.0, 4.0, 3.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00560760498046875, -0.00545656681060791, -0.00530552864074707, -0.0051544904708862305, -0.005003452301025391, -0.004852414131164551, -0.004701375961303711, -0.004550337791442871, -0.004399299621582031, -0.004248261451721191, -0.0040972232818603516, -0.003946185111999512, -0.003795146942138672, -0.003644108772277832, -0.003493070602416992, -0.0033420324325561523, -0.0031909942626953125, -0.0030399560928344727, -0.002888917922973633, -0.002737879753112793, -0.002586841583251953, -0.0024358034133911133, -0.0022847652435302734, -0.0021337270736694336, -0.0019826889038085938, -0.001831650733947754, -0.001680612564086914, -0.0015295743942260742, -0.0013785362243652344, -0.0012274980545043945, -0.0010764598846435547, -0.0009254217147827148, -0.000774383544921875, -0.0006233453750610352, -0.0004723072052001953, -0.00032126903533935547, -0.00017023086547851562, -1.919269561767578e-05, 0.00013184547424316406, 0.0002828836441040039, 0.00043392181396484375, 0.0005849599838256836, 0.0007359981536865234, 0.0008870363235473633, 0.0010380744934082031, 0.001189112663269043, 0.0013401508331298828, 0.0014911890029907227, 0.0016422271728515625, 0.0017932653427124023, 0.0019443035125732422, 0.002095341682434082, 0.002246379852294922, 0.0023974180221557617, 0.0025484561920166016, 0.0026994943618774414, 0.0028505325317382812, 0.003001570701599121, 0.003152608871459961, 0.0033036470413208008, 0.0034546852111816406, 0.0036057233810424805, 0.0037567615509033203, 0.00390779972076416, 0.004058837890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 0.0, 7.0, 6.0, 10.0, 11.0, 9.0, 30.0, 28.0, 43.0, 65.0, 89.0, 121.0, 153.0, 223.0, 304.0, 423.0, 588.0, 914.0, 1305.0, 1830.0, 2865.0, 4285.0, 6688.0, 10677.0, 17285.0, 29078.0, 51291.0, 104194.0, 252375.0, 291439.0, 127156.0, 58906.0, 32964.0, 19295.0, 12036.0, 7292.0, 4710.0, 3139.0, 2025.0, 1417.0, 936.0, 709.0, 435.0, 340.0, 252.0, 179.0, 109.0, 93.0, 60.0, 57.0, 33.0, 22.0, 23.0, 14.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0], "bins": [-33.21875, -32.215576171875, -31.21240234375, -30.209228515625, -29.2060546875, -28.202880859375, -27.19970703125, -26.196533203125, -25.193359375, -24.190185546875, -23.18701171875, -22.183837890625, -21.1806640625, -20.177490234375, -19.17431640625, -18.171142578125, -17.16796875, -16.164794921875, -15.16162109375, -14.158447265625, -13.1552734375, -12.152099609375, -11.14892578125, -10.145751953125, -9.142578125, -8.139404296875, -7.13623046875, -6.133056640625, -5.1298828125, -4.126708984375, -3.12353515625, -2.120361328125, -1.1171875, -0.114013671875, 0.88916015625, 1.892333984375, 2.8955078125, 3.898681640625, 4.90185546875, 5.905029296875, 6.908203125, 7.911376953125, 8.91455078125, 9.917724609375, 10.9208984375, 11.924072265625, 12.92724609375, 13.930419921875, 14.93359375, 15.936767578125, 16.93994140625, 17.943115234375, 18.9462890625, 19.949462890625, 20.95263671875, 21.955810546875, 22.958984375, 23.962158203125, 24.96533203125, 25.968505859375, 26.9716796875, 27.974853515625, 28.97802734375, 29.981201171875, 30.984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 1.0, 5.0, 5.0, 8.0, 12.0, 7.0, 9.0, 20.0, 13.0, 16.0, 24.0, 39.0, 59.0, 64.0, 102.0, 108.0, 117.0, 95.0, 72.0, 50.0, 35.0, 33.0, 24.0, 16.0, 10.0, 15.0, 8.0, 6.0, 6.0, 5.0, 1.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.0078125, -13.617919921875, -13.22802734375, -12.838134765625, -12.4482421875, -12.058349609375, -11.66845703125, -11.278564453125, -10.888671875, -10.498779296875, -10.10888671875, -9.718994140625, -9.3291015625, -8.939208984375, -8.54931640625, -8.159423828125, -7.76953125, -7.379638671875, -6.98974609375, -6.599853515625, -6.2099609375, -5.820068359375, -5.43017578125, -5.040283203125, -4.650390625, -4.260498046875, -3.87060546875, -3.480712890625, -3.0908203125, -2.700927734375, -2.31103515625, -1.921142578125, -1.53125, -1.141357421875, -0.75146484375, -0.361572265625, 0.0283203125, 0.418212890625, 0.80810546875, 1.197998046875, 1.587890625, 1.977783203125, 2.36767578125, 2.757568359375, 3.1474609375, 3.537353515625, 3.92724609375, 4.317138671875, 4.70703125, 5.096923828125, 5.48681640625, 5.876708984375, 6.2666015625, 6.656494140625, 7.04638671875, 7.436279296875, 7.826171875, 8.216064453125, 8.60595703125, 8.995849609375, 9.3857421875, 9.775634765625, 10.16552734375, 10.555419921875, 10.9453125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 8.0, 7.0, 8.0, 7.0, 17.0, 20.0, 19.0, 18.0, 28.0, 27.0, 37.0, 47.0, 46.0, 43.0, 43.0, 51.0, 70.0, 48.0, 55.0, 40.0, 61.0, 39.0, 30.0, 35.0, 34.0, 25.0, 35.0, 25.0, 5.0, 13.0, 11.0, 8.0, 8.0, 5.0, 6.0, 2.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.15595054626465, -25.234140396118164, -24.31233024597168, -23.390522003173828, -22.468711853027344, -21.54690170288086, -20.625091552734375, -19.70328140258789, -18.781471252441406, -17.859661102294922, -16.937850952148438, -16.016040802001953, -15.094232559204102, -14.172422409057617, -13.250612258911133, -12.328802108764648, -11.406993865966797, -10.485183715820312, -9.563374519348145, -8.64156436920166, -7.719754695892334, -6.797945022583008, -5.876134872436523, -4.954325199127197, -4.032515525817871, -3.110705852508545, -2.1888959407806396, -1.2670860290527344, -0.3452763557434082, 0.576533317565918, 1.4983434677124023, 2.4201531410217285, 3.341960906982422, 4.263770580291748, 5.185580253601074, 6.107390403747559, 7.029200077056885, 7.951009750366211, 8.872819900512695, 9.79463005065918, 10.716439247131348, 11.638249397277832, 12.56005859375, 13.481868743896484, 14.403678894042969, 15.325488090515137, 16.247299194335938, 17.16910743713379, 18.090917587280273, 19.012727737426758, 19.934537887573242, 20.856346130371094, 21.778156280517578, 22.699966430664062, 23.621776580810547, 24.54358673095703, 25.465396881103516, 26.38720703125, 27.309017181396484, 28.23082733154297, 29.15263557434082, 30.074445724487305, 30.99625587463379, 31.918066024780273, 32.839874267578125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 6.0, 3.0, 5.0, 5.0, 6.0, 7.0, 6.0, 14.0, 12.0, 20.0, 10.0, 20.0, 17.0, 29.0, 29.0, 29.0, 31.0, 25.0, 30.0, 35.0, 37.0, 42.0, 39.0, 39.0, 30.0, 38.0, 41.0, 29.0, 36.0, 21.0, 32.0, 30.0, 22.0, 21.0, 26.0, 37.0, 20.0, 23.0, 15.0, 14.0, 14.0, 10.0, 13.0, 9.0, 8.0, 10.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.073280334472656, -20.336767196655273, -19.600255966186523, -18.86374282836914, -18.12723159790039, -17.390718460083008, -16.654205322265625, -15.917693138122559, -15.181180953979492, -14.444668769836426, -13.70815658569336, -12.971643447875977, -12.23513126373291, -11.498619079589844, -10.762105941772461, -10.025593757629395, -9.289081573486328, -8.552569389343262, -7.816056728363037, -7.0795440673828125, -6.343031883239746, -5.60651969909668, -4.870007038116455, -4.1334943771362305, -3.396982192993164, -2.6604697704315186, -1.923957347869873, -1.1874449253082275, -0.45093250274658203, 0.2855799198150635, 1.022092342376709, 1.7586050033569336, 2.495119094848633, 3.2316315174102783, 3.968143939971924, 4.704656600952148, 5.441168785095215, 6.177680969238281, 6.914193630218506, 7.6507062911987305, 8.387218475341797, 9.123730659484863, 9.86024284362793, 10.596755981445312, 11.333268165588379, 12.069780349731445, 12.806293487548828, 13.542805671691895, 14.279317855834961, 15.015830039978027, 15.752342224121094, 16.488855361938477, 17.22536849975586, 17.96187973022461, 18.698392868041992, 19.434906005859375, 20.171417236328125, 20.907930374145508, 21.644441604614258, 22.38095474243164, 23.11746597290039, 23.853979110717773, 24.590492248535156, 25.327003479003906, 26.06351661682129]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 8.0, 3.0, 8.0, 16.0, 13.0, 15.0, 40.0, 68.0, 87.0, 129.0, 211.0, 358.0, 540.0, 842.0, 1375.0, 2091.0, 3279.0, 5229.0, 7976.0, 12688.0, 19454.0, 29588.0, 44231.0, 62864.0, 85066.0, 107439.0, 122676.0, 124653.0, 113154.0, 91851.0, 68980.0, 48732.0, 33120.0, 22123.0, 14353.0, 9075.0, 5908.0, 3815.0, 2389.0, 1484.0, 967.0, 609.0, 397.0, 235.0, 159.0, 98.0, 57.0, 39.0, 33.0, 11.0, 11.0, 8.0, 6.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.890625, -22.155517578125, -21.42041015625, -20.685302734375, -19.9501953125, -19.215087890625, -18.47998046875, -17.744873046875, -17.009765625, -16.274658203125, -15.53955078125, -14.804443359375, -14.0693359375, -13.334228515625, -12.59912109375, -11.864013671875, -11.12890625, -10.393798828125, -9.65869140625, -8.923583984375, -8.1884765625, -7.453369140625, -6.71826171875, -5.983154296875, -5.248046875, -4.512939453125, -3.77783203125, -3.042724609375, -2.3076171875, -1.572509765625, -0.83740234375, -0.102294921875, 0.6328125, 1.367919921875, 2.10302734375, 2.838134765625, 3.5732421875, 4.308349609375, 5.04345703125, 5.778564453125, 6.513671875, 7.248779296875, 7.98388671875, 8.718994140625, 9.4541015625, 10.189208984375, 10.92431640625, 11.659423828125, 12.39453125, 13.129638671875, 13.86474609375, 14.599853515625, 15.3349609375, 16.070068359375, 16.80517578125, 17.540283203125, 18.275390625, 19.010498046875, 19.74560546875, 20.480712890625, 21.2158203125, 21.950927734375, 22.68603515625, 23.421142578125, 24.15625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [6.0, 3.0, 6.0, 6.0, 5.0, 4.0, 4.0, 7.0, 6.0, 14.0, 13.0, 14.0, 22.0, 12.0, 19.0, 27.0, 25.0, 28.0, 36.0, 26.0, 36.0, 41.0, 25.0, 47.0, 29.0, 24.0, 44.0, 33.0, 41.0, 38.0, 35.0, 29.0, 37.0, 25.0, 30.0, 16.0, 33.0, 22.0, 28.0, 18.0, 17.0, 14.0, 10.0, 4.0, 10.0, 12.0, 9.0, 10.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.234375, -18.51123046875, -17.7880859375, -17.06494140625, -16.341796875, -15.61865234375, -14.8955078125, -14.17236328125, -13.44921875, -12.72607421875, -12.0029296875, -11.27978515625, -10.556640625, -9.83349609375, -9.1103515625, -8.38720703125, -7.6640625, -6.94091796875, -6.2177734375, -5.49462890625, -4.771484375, -4.04833984375, -3.3251953125, -2.60205078125, -1.87890625, -1.15576171875, -0.4326171875, 0.29052734375, 1.013671875, 1.73681640625, 2.4599609375, 3.18310546875, 3.90625, 4.62939453125, 5.3525390625, 6.07568359375, 6.798828125, 7.52197265625, 8.2451171875, 8.96826171875, 9.69140625, 10.41455078125, 11.1376953125, 11.86083984375, 12.583984375, 13.30712890625, 14.0302734375, 14.75341796875, 15.4765625, 16.19970703125, 16.9228515625, 17.64599609375, 18.369140625, 19.09228515625, 19.8154296875, 20.53857421875, 21.26171875, 21.98486328125, 22.7080078125, 23.43115234375, 24.154296875, 24.87744140625, 25.6005859375, 26.32373046875, 27.046875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 2.0, 9.0, 16.0, 20.0, 21.0, 57.0, 74.0, 112.0, 123.0, 216.0, 312.0, 508.0, 756.0, 1140.0, 1805.0, 2824.0, 4306.0, 6967.0, 10976.0, 17368.0, 27893.0, 44798.0, 70822.0, 106069.0, 141233.0, 157298.0, 144133.0, 108795.0, 73672.0, 47180.0, 29426.0, 17973.0, 11303.0, 7408.0, 4627.0, 2970.0, 1904.0, 1168.0, 793.0, 489.0, 337.0, 223.0, 147.0, 99.0, 62.0, 38.0, 27.0, 24.0, 17.0, 12.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.625, -33.453125, -32.28125, -31.109375, -29.9375, -28.765625, -27.59375, -26.421875, -25.25, -24.078125, -22.90625, -21.734375, -20.5625, -19.390625, -18.21875, -17.046875, -15.875, -14.703125, -13.53125, -12.359375, -11.1875, -10.015625, -8.84375, -7.671875, -6.5, -5.328125, -4.15625, -2.984375, -1.8125, -0.640625, 0.53125, 1.703125, 2.875, 4.046875, 5.21875, 6.390625, 7.5625, 8.734375, 9.90625, 11.078125, 12.25, 13.421875, 14.59375, 15.765625, 16.9375, 18.109375, 19.28125, 20.453125, 21.625, 22.796875, 23.96875, 25.140625, 26.3125, 27.484375, 28.65625, 29.828125, 31.0, 32.171875, 33.34375, 34.515625, 35.6875, 36.859375, 38.03125, 39.203125, 40.375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 8.0, 7.0, 5.0, 8.0, 12.0, 11.0, 18.0, 13.0, 22.0, 19.0, 21.0, 26.0, 40.0, 32.0, 33.0, 37.0, 44.0, 37.0, 34.0, 31.0, 41.0, 43.0, 38.0, 42.0, 28.0, 38.0, 46.0, 35.0, 23.0, 25.0, 21.0, 31.0, 23.0, 14.0, 17.0, 16.0, 10.0, 7.0, 8.0, 7.0, 2.0, 5.0, 8.0, 5.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.578125, -16.95166015625, -16.3251953125, -15.69873046875, -15.072265625, -14.44580078125, -13.8193359375, -13.19287109375, -12.56640625, -11.93994140625, -11.3134765625, -10.68701171875, -10.060546875, -9.43408203125, -8.8076171875, -8.18115234375, -7.5546875, -6.92822265625, -6.3017578125, -5.67529296875, -5.048828125, -4.42236328125, -3.7958984375, -3.16943359375, -2.54296875, -1.91650390625, -1.2900390625, -0.66357421875, -0.037109375, 0.58935546875, 1.2158203125, 1.84228515625, 2.46875, 3.09521484375, 3.7216796875, 4.34814453125, 4.974609375, 5.60107421875, 6.2275390625, 6.85400390625, 7.48046875, 8.10693359375, 8.7333984375, 9.35986328125, 9.986328125, 10.61279296875, 11.2392578125, 11.86572265625, 12.4921875, 13.11865234375, 13.7451171875, 14.37158203125, 14.998046875, 15.62451171875, 16.2509765625, 16.87744140625, 17.50390625, 18.13037109375, 18.7568359375, 19.38330078125, 20.009765625, 20.63623046875, 21.2626953125, 21.88916015625, 22.515625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 8.0, 19.0, 17.0, 30.0, 36.0, 55.0, 101.0, 143.0, 210.0, 387.0, 719.0, 1342.0, 2807.0, 6392.0, 17343.0, 65814.0, 517127.0, 362299.0, 48846.0, 14307.0, 5346.0, 2435.0, 1193.0, 644.0, 345.0, 191.0, 112.0, 80.0, 62.0, 50.0, 27.0, 21.0, 12.0, 11.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.25, -93.8857421875, -90.521484375, -87.1572265625, -83.79296875, -80.4287109375, -77.064453125, -73.7001953125, -70.3359375, -66.9716796875, -63.607421875, -60.2431640625, -56.87890625, -53.5146484375, -50.150390625, -46.7861328125, -43.421875, -40.0576171875, -36.693359375, -33.3291015625, -29.96484375, -26.6005859375, -23.236328125, -19.8720703125, -16.5078125, -13.1435546875, -9.779296875, -6.4150390625, -3.05078125, 0.3134765625, 3.677734375, 7.0419921875, 10.40625, 13.7705078125, 17.134765625, 20.4990234375, 23.86328125, 27.2275390625, 30.591796875, 33.9560546875, 37.3203125, 40.6845703125, 44.048828125, 47.4130859375, 50.77734375, 54.1416015625, 57.505859375, 60.8701171875, 64.234375, 67.5986328125, 70.962890625, 74.3271484375, 77.69140625, 81.0556640625, 84.419921875, 87.7841796875, 91.1484375, 94.5126953125, 97.876953125, 101.2412109375, 104.60546875, 107.9697265625, 111.333984375, 114.6982421875, 118.0625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 7.0, 13.0, 11.0, 11.0, 24.0, 25.0, 41.0, 51.0, 91.0, 96.0, 136.0, 136.0, 98.0, 75.0, 47.0, 28.0, 24.0, 18.0, 8.0, 10.0, 7.0, 5.0, 10.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0043792724609375, -0.004221916198730469, -0.0040645599365234375, -0.003907203674316406, -0.003749847412109375, -0.0035924911499023438, -0.0034351348876953125, -0.0032777786254882812, -0.00312042236328125, -0.0029630661010742188, -0.0028057098388671875, -0.0026483535766601562, -0.002490997314453125, -0.0023336410522460938, -0.0021762847900390625, -0.0020189285278320312, -0.001861572265625, -0.0017042160034179688, -0.0015468597412109375, -0.0013895034790039062, -0.001232147216796875, -0.0010747909545898438, -0.0009174346923828125, -0.0007600784301757812, -0.00060272216796875, -0.00044536590576171875, -0.0002880096435546875, -0.00013065338134765625, 2.6702880859375e-05, 0.00018405914306640625, 0.0003414154052734375, 0.0004987716674804688, 0.0006561279296875, 0.0008134841918945312, 0.0009708404541015625, 0.0011281967163085938, 0.001285552978515625, 0.0014429092407226562, 0.0016002655029296875, 0.0017576217651367188, 0.00191497802734375, 0.0020723342895507812, 0.0022296905517578125, 0.0023870468139648438, 0.002544403076171875, 0.0027017593383789062, 0.0028591156005859375, 0.0030164718627929688, 0.003173828125, 0.0033311843872070312, 0.0034885406494140625, 0.0036458969116210938, 0.003803253173828125, 0.003960609436035156, 0.0041179656982421875, 0.004275321960449219, 0.00443267822265625, 0.004590034484863281, 0.0047473907470703125, 0.004904747009277344, 0.005062103271484375, 0.005219459533691406, 0.0053768157958984375, 0.005534172058105469, 0.0056915283203125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 12.0, 11.0, 18.0, 21.0, 33.0, 46.0, 67.0, 84.0, 126.0, 174.0, 234.0, 371.0, 536.0, 835.0, 1394.0, 2258.0, 4071.0, 7495.0, 16160.0, 41667.0, 148869.0, 461451.0, 253533.0, 64474.0, 22227.0, 9769.0, 4989.0, 2847.0, 1682.0, 1036.0, 649.0, 434.0, 311.0, 194.0, 140.0, 89.0, 90.0, 31.0, 36.0, 26.0, 13.0, 7.0, 7.0, 9.0, 7.0, 1.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-54.78125, -52.99609375, -51.2109375, -49.42578125, -47.640625, -45.85546875, -44.0703125, -42.28515625, -40.5, -38.71484375, -36.9296875, -35.14453125, -33.359375, -31.57421875, -29.7890625, -28.00390625, -26.21875, -24.43359375, -22.6484375, -20.86328125, -19.078125, -17.29296875, -15.5078125, -13.72265625, -11.9375, -10.15234375, -8.3671875, -6.58203125, -4.796875, -3.01171875, -1.2265625, 0.55859375, 2.34375, 4.12890625, 5.9140625, 7.69921875, 9.484375, 11.26953125, 13.0546875, 14.83984375, 16.625, 18.41015625, 20.1953125, 21.98046875, 23.765625, 25.55078125, 27.3359375, 29.12109375, 30.90625, 32.69140625, 34.4765625, 36.26171875, 38.046875, 39.83203125, 41.6171875, 43.40234375, 45.1875, 46.97265625, 48.7578125, 50.54296875, 52.328125, 54.11328125, 55.8984375, 57.68359375, 59.46875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 8.0, 4.0, 15.0, 18.0, 29.0, 26.0, 40.0, 56.0, 67.0, 103.0, 103.0, 108.0, 112.0, 75.0, 67.0, 43.0, 28.0, 28.0, 21.0, 11.0, 6.0, 6.0, 4.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0625, -11.564697265625, -11.06689453125, -10.569091796875, -10.0712890625, -9.573486328125, -9.07568359375, -8.577880859375, -8.080078125, -7.582275390625, -7.08447265625, -6.586669921875, -6.0888671875, -5.591064453125, -5.09326171875, -4.595458984375, -4.09765625, -3.599853515625, -3.10205078125, -2.604248046875, -2.1064453125, -1.608642578125, -1.11083984375, -0.613037109375, -0.115234375, 0.382568359375, 0.88037109375, 1.378173828125, 1.8759765625, 2.373779296875, 2.87158203125, 3.369384765625, 3.8671875, 4.364990234375, 4.86279296875, 5.360595703125, 5.8583984375, 6.356201171875, 6.85400390625, 7.351806640625, 7.849609375, 8.347412109375, 8.84521484375, 9.343017578125, 9.8408203125, 10.338623046875, 10.83642578125, 11.334228515625, 11.83203125, 12.329833984375, 12.82763671875, 13.325439453125, 13.8232421875, 14.321044921875, 14.81884765625, 15.316650390625, 15.814453125, 16.312255859375, 16.81005859375, 17.307861328125, 17.8056640625, 18.303466796875, 18.80126953125, 19.299072265625, 19.796875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 6.0, 6.0, 6.0, 13.0, 13.0, 16.0, 22.0, 26.0, 33.0, 35.0, 28.0, 35.0, 42.0, 46.0, 49.0, 51.0, 56.0, 40.0, 59.0, 49.0, 36.0, 56.0, 33.0, 41.0, 35.0, 26.0, 22.0, 25.0, 12.0, 21.0, 6.0, 10.0, 9.0, 8.0, 3.0, 6.0, 5.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.917936325073242, -23.992137908935547, -23.06633758544922, -22.14053726196289, -21.214738845825195, -20.2889404296875, -19.363140106201172, -18.437339782714844, -17.51154136657715, -16.585742950439453, -15.659942626953125, -14.734143257141113, -13.808343887329102, -12.88254451751709, -11.956745147705078, -11.030945777893066, -10.105146408081055, -9.179347038269043, -8.253547668457031, -7.3277482986450195, -6.401948928833008, -5.476149559020996, -4.550350189208984, -3.6245508193969727, -2.698751449584961, -1.7729520797729492, -0.8471527099609375, 0.07864665985107422, 1.004446029663086, 1.9302453994750977, 2.8560447692871094, 3.781844139099121, 4.707645416259766, 5.633444786071777, 6.559244155883789, 7.485043525695801, 8.410842895507812, 9.336642265319824, 10.262441635131836, 11.188241004943848, 12.11404037475586, 13.039839744567871, 13.965639114379883, 14.891438484191895, 15.817237854003906, 16.743038177490234, 17.66883659362793, 18.594635009765625, 19.520435333251953, 20.44623565673828, 21.372034072875977, 22.297832489013672, 23.2236328125, 24.149433135986328, 25.075231552124023, 26.00102996826172, 26.926830291748047, 27.852630615234375, 28.77842903137207, 29.704227447509766, 30.630027770996094, 31.555828094482422, 32.48162841796875, 33.40742492675781, 34.33322525024414]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 10.0, 7.0, 10.0, 2.0, 7.0, 13.0, 20.0, 19.0, 15.0, 23.0, 30.0, 21.0, 31.0, 34.0, 36.0, 34.0, 28.0, 42.0, 49.0, 43.0, 50.0, 39.0, 33.0, 37.0, 43.0, 37.0, 39.0, 34.0, 31.0, 30.0, 34.0, 25.0, 20.0, 16.0, 11.0, 9.0, 16.0, 9.0, 5.0, 8.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.683778762817383, -27.73978614807129, -26.795791625976562, -25.85179901123047, -24.907806396484375, -23.96381378173828, -23.019819259643555, -22.07582664489746, -21.131832122802734, -20.18783950805664, -19.243844985961914, -18.29985237121582, -17.355859756469727, -16.411865234375, -15.467872619628906, -14.523880004882812, -13.579887390136719, -12.635893821716309, -11.691901206970215, -10.747907638549805, -9.803915023803711, -8.8599214553833, -7.915927886962891, -6.971934795379639, -6.027941703796387, -5.083948612213135, -4.139955520629883, -3.1959619522094727, -2.2519688606262207, -1.3079757690429688, -0.3639822006225586, 0.5800108909606934, 1.5240020751953125, 2.4679951667785645, 3.4119884967803955, 4.355981826782227, 5.2999749183654785, 6.2439680099487305, 7.187961578369141, 8.131954193115234, 9.075947761535645, 10.019941329956055, 10.963933944702148, 11.907927513122559, 12.851921081542969, 13.795913696289062, 14.739907264709473, 15.683900833129883, 16.627893447875977, 17.57188606262207, 18.515880584716797, 19.45987319946289, 20.403865814208984, 21.347858428955078, 22.291852951049805, 23.2358455657959, 24.179840087890625, 25.12383270263672, 26.067827224731445, 27.01181983947754, 27.955812454223633, 28.89980697631836, 29.843799591064453, 30.787792205810547, 31.73178482055664]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 9.0, 21.0, 30.0, 47.0, 82.0, 144.0, 207.0, 300.0, 550.0, 874.0, 1375.0, 2201.0, 3635.0, 6150.0, 10082.0, 17651.0, 30637.0, 54524.0, 97698.0, 181161.0, 326954.0, 547768.0, 748570.0, 765307.0, 587540.0, 361849.0, 200562.0, 108621.0, 60020.0, 33511.0, 18891.0, 11013.0, 6461.0, 3810.0, 2312.0, 1380.0, 855.0, 555.0, 335.0, 213.0, 135.0, 78.0, 47.0, 40.0, 31.0, 12.0, 13.0, 8.0, 4.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-24.46875, -23.6552734375, -22.841796875, -22.0283203125, -21.21484375, -20.4013671875, -19.587890625, -18.7744140625, -17.9609375, -17.1474609375, -16.333984375, -15.5205078125, -14.70703125, -13.8935546875, -13.080078125, -12.2666015625, -11.453125, -10.6396484375, -9.826171875, -9.0126953125, -8.19921875, -7.3857421875, -6.572265625, -5.7587890625, -4.9453125, -4.1318359375, -3.318359375, -2.5048828125, -1.69140625, -0.8779296875, -0.064453125, 0.7490234375, 1.5625, 2.3759765625, 3.189453125, 4.0029296875, 4.81640625, 5.6298828125, 6.443359375, 7.2568359375, 8.0703125, 8.8837890625, 9.697265625, 10.5107421875, 11.32421875, 12.1376953125, 12.951171875, 13.7646484375, 14.578125, 15.3916015625, 16.205078125, 17.0185546875, 17.83203125, 18.6455078125, 19.458984375, 20.2724609375, 21.0859375, 21.8994140625, 22.712890625, 23.5263671875, 24.33984375, 25.1533203125, 25.966796875, 26.7802734375, 27.59375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 10.0, 12.0, 11.0, 11.0, 11.0, 17.0, 19.0, 25.0, 28.0, 26.0, 33.0, 36.0, 36.0, 39.0, 34.0, 47.0, 41.0, 49.0, 34.0, 50.0, 57.0, 41.0, 38.0, 36.0, 28.0, 39.0, 28.0, 30.0, 34.0, 20.0, 17.0, 19.0, 8.0, 6.0, 15.0, 4.0, 5.0, 10.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.96875, -23.12353515625, -22.2783203125, -21.43310546875, -20.587890625, -19.74267578125, -18.8974609375, -18.05224609375, -17.20703125, -16.36181640625, -15.5166015625, -14.67138671875, -13.826171875, -12.98095703125, -12.1357421875, -11.29052734375, -10.4453125, -9.60009765625, -8.7548828125, -7.90966796875, -7.064453125, -6.21923828125, -5.3740234375, -4.52880859375, -3.68359375, -2.83837890625, -1.9931640625, -1.14794921875, -0.302734375, 0.54248046875, 1.3876953125, 2.23291015625, 3.078125, 3.92333984375, 4.7685546875, 5.61376953125, 6.458984375, 7.30419921875, 8.1494140625, 8.99462890625, 9.83984375, 10.68505859375, 11.5302734375, 12.37548828125, 13.220703125, 14.06591796875, 14.9111328125, 15.75634765625, 16.6015625, 17.44677734375, 18.2919921875, 19.13720703125, 19.982421875, 20.82763671875, 21.6728515625, 22.51806640625, 23.36328125, 24.20849609375, 25.0537109375, 25.89892578125, 26.744140625, 27.58935546875, 28.4345703125, 29.27978515625, 30.125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 8.0, 16.0, 21.0, 37.0, 44.0, 69.0, 118.0, 151.0, 290.0, 420.0, 757.0, 1215.0, 2198.0, 3718.0, 6507.0, 11509.0, 21253.0, 39549.0, 74316.0, 143192.0, 274206.0, 492360.0, 760670.0, 858059.0, 659231.0, 394222.0, 212372.0, 110929.0, 57812.0, 30474.0, 16796.0, 9220.0, 5179.0, 3013.0, 1681.0, 1041.0, 617.0, 359.0, 221.0, 163.0, 82.0, 62.0, 45.0, 24.0, 19.0, 11.0, 9.0, 10.0, 3.0, 6.0, 0.0, 1.0], "bins": [-36.0, -34.980224609375, -33.96044921875, -32.940673828125, -31.9208984375, -30.901123046875, -29.88134765625, -28.861572265625, -27.841796875, -26.822021484375, -25.80224609375, -24.782470703125, -23.7626953125, -22.742919921875, -21.72314453125, -20.703369140625, -19.68359375, -18.663818359375, -17.64404296875, -16.624267578125, -15.6044921875, -14.584716796875, -13.56494140625, -12.545166015625, -11.525390625, -10.505615234375, -9.48583984375, -8.466064453125, -7.4462890625, -6.426513671875, -5.40673828125, -4.386962890625, -3.3671875, -2.347412109375, -1.32763671875, -0.307861328125, 0.7119140625, 1.731689453125, 2.75146484375, 3.771240234375, 4.791015625, 5.810791015625, 6.83056640625, 7.850341796875, 8.8701171875, 9.889892578125, 10.90966796875, 11.929443359375, 12.94921875, 13.968994140625, 14.98876953125, 16.008544921875, 17.0283203125, 18.048095703125, 19.06787109375, 20.087646484375, 21.107421875, 22.127197265625, 23.14697265625, 24.166748046875, 25.1865234375, 26.206298828125, 27.22607421875, 28.245849609375, 29.265625]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 8.0, 11.0, 18.0, 23.0, 30.0, 27.0, 46.0, 54.0, 84.0, 87.0, 116.0, 149.0, 167.0, 184.0, 211.0, 245.0, 245.0, 286.0, 280.0, 278.0, 239.0, 248.0, 190.0, 156.0, 153.0, 109.0, 89.0, 74.0, 60.0, 39.0, 41.0, 25.0, 18.0, 25.0, 10.0, 14.0, 8.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.4609375, -14.0726318359375, -13.684326171875, -13.2960205078125, -12.90771484375, -12.5194091796875, -12.131103515625, -11.7427978515625, -11.3544921875, -10.9661865234375, -10.577880859375, -10.1895751953125, -9.80126953125, -9.4129638671875, -9.024658203125, -8.6363525390625, -8.248046875, -7.8597412109375, -7.471435546875, -7.0831298828125, -6.69482421875, -6.3065185546875, -5.918212890625, -5.5299072265625, -5.1416015625, -4.7532958984375, -4.364990234375, -3.9766845703125, -3.58837890625, -3.2000732421875, -2.811767578125, -2.4234619140625, -2.03515625, -1.6468505859375, -1.258544921875, -0.8702392578125, -0.48193359375, -0.0936279296875, 0.294677734375, 0.6829833984375, 1.0712890625, 1.4595947265625, 1.847900390625, 2.2362060546875, 2.62451171875, 3.0128173828125, 3.401123046875, 3.7894287109375, 4.177734375, 4.5660400390625, 4.954345703125, 5.3426513671875, 5.73095703125, 6.1192626953125, 6.507568359375, 6.8958740234375, 7.2841796875, 7.6724853515625, 8.060791015625, 8.4490966796875, 8.83740234375, 9.2257080078125, 9.614013671875, 10.0023193359375, 10.390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 7.0, 4.0, 14.0, 14.0, 15.0, 15.0, 23.0, 20.0, 36.0, 36.0, 36.0, 42.0, 32.0, 32.0, 57.0, 50.0, 56.0, 51.0, 59.0, 46.0, 51.0, 47.0, 37.0, 26.0, 27.0, 17.0, 25.0, 25.0, 12.0, 15.0, 11.0, 13.0, 8.0, 8.0, 8.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.204660415649414, -25.30303192138672, -24.401405334472656, -23.49977684020996, -22.598148345947266, -21.696521759033203, -20.794893264770508, -19.893264770507812, -18.99163818359375, -18.090009689331055, -17.188383102416992, -16.286754608154297, -15.385126113891602, -14.483498573303223, -13.581871032714844, -12.680242538452148, -11.778614044189453, -10.876986503601074, -9.975358009338379, -9.07373046875, -8.172101974487305, -7.270474433898926, -6.368846893310547, -5.46721887588501, -4.565590858459473, -3.6639628410339355, -2.7623350620269775, -1.8607072830200195, -0.9590792655944824, -0.05745124816894531, 0.8441762924194336, 1.7458043098449707, 2.6474342346191406, 3.5490622520446777, 4.450690269470215, 5.352317810058594, 6.253945827484131, 7.155573844909668, 8.057201385498047, 8.958829879760742, 9.860457420349121, 10.7620849609375, 11.663713455200195, 12.565340995788574, 13.466968536376953, 14.368597030639648, 15.270224571228027, 16.171852111816406, 17.0734806060791, 17.975109100341797, 18.87673568725586, 19.778364181518555, 20.67999267578125, 21.581619262695312, 22.483247756958008, 23.384876251220703, 24.286502838134766, 25.18813133239746, 26.089757919311523, 26.99138641357422, 27.893014907836914, 28.79464340209961, 29.696269989013672, 30.597898483276367, 31.499526977539062]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0, 8.0, 7.0, 12.0, 13.0, 12.0, 27.0, 13.0, 28.0, 12.0, 23.0, 23.0, 27.0, 28.0, 30.0, 34.0, 33.0, 50.0, 42.0, 33.0, 49.0, 45.0, 54.0, 42.0, 37.0, 30.0, 45.0, 33.0, 31.0, 21.0, 26.0, 16.0, 15.0, 14.0, 19.0, 12.0, 19.0, 7.0, 9.0, 4.0, 1.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.648866653442383, -26.766971588134766, -25.885074615478516, -25.0031795501709, -24.12128448486328, -23.23938751220703, -22.357492446899414, -21.475597381591797, -20.593700408935547, -19.71180534362793, -18.82990837097168, -17.948013305664062, -17.066118240356445, -16.184223175048828, -15.302326202392578, -14.420431137084961, -13.538536071777344, -12.65664005279541, -11.774744987487793, -10.89284896850586, -10.010953903198242, -9.129057884216309, -8.247161865234375, -7.3652663230896, -6.483370780944824, -5.601475238800049, -4.719579696655273, -3.83768367767334, -2.9557881355285645, -2.073892593383789, -1.1919965744018555, -0.3101010322570801, 0.5717926025390625, 1.4536882638931274, 2.3355839252471924, 3.217479705810547, 4.099375247955322, 4.981270790100098, 5.863166809082031, 6.745062351226807, 7.626957893371582, 8.508853912353516, 9.390748977661133, 10.272644996643066, 11.154541015625, 12.036436080932617, 12.91833209991455, 13.800228118896484, 14.682123184204102, 15.564019203186035, 16.44591522216797, 17.327810287475586, 18.209705352783203, 19.091602325439453, 19.97349739074707, 20.855392456054688, 21.737289428710938, 22.619184494018555, 23.501081466674805, 24.382976531982422, 25.26487159729004, 26.146766662597656, 27.028663635253906, 27.910558700561523, 28.79245376586914]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 12.0, 23.0, 19.0, 28.0, 32.0, 55.0, 83.0, 137.0, 178.0, 220.0, 334.0, 476.0, 718.0, 990.0, 1494.0, 2409.0, 3759.0, 6065.0, 10199.0, 17286.0, 30708.0, 56765.0, 109912.0, 200249.0, 245652.0, 166052.0, 86842.0, 45487.0, 25086.0, 14256.0, 8412.0, 5213.0, 3191.0, 2070.0, 1326.0, 841.0, 578.0, 428.0, 292.0, 221.0, 126.0, 92.0, 77.0, 59.0, 32.0, 28.0, 20.0, 15.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-44.9375, -43.54736328125, -42.1572265625, -40.76708984375, -39.376953125, -37.98681640625, -36.5966796875, -35.20654296875, -33.81640625, -32.42626953125, -31.0361328125, -29.64599609375, -28.255859375, -26.86572265625, -25.4755859375, -24.08544921875, -22.6953125, -21.30517578125, -19.9150390625, -18.52490234375, -17.134765625, -15.74462890625, -14.3544921875, -12.96435546875, -11.57421875, -10.18408203125, -8.7939453125, -7.40380859375, -6.013671875, -4.62353515625, -3.2333984375, -1.84326171875, -0.453125, 0.93701171875, 2.3271484375, 3.71728515625, 5.107421875, 6.49755859375, 7.8876953125, 9.27783203125, 10.66796875, 12.05810546875, 13.4482421875, 14.83837890625, 16.228515625, 17.61865234375, 19.0087890625, 20.39892578125, 21.7890625, 23.17919921875, 24.5693359375, 25.95947265625, 27.349609375, 28.73974609375, 30.1298828125, 31.52001953125, 32.91015625, 34.30029296875, 35.6904296875, 37.08056640625, 38.470703125, 39.86083984375, 41.2509765625, 42.64111328125, 44.03125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 6.0, 4.0, 6.0, 4.0, 3.0, 9.0, 12.0, 3.0, 16.0, 16.0, 19.0, 21.0, 25.0, 18.0, 24.0, 25.0, 29.0, 29.0, 30.0, 37.0, 34.0, 47.0, 50.0, 35.0, 51.0, 47.0, 43.0, 45.0, 37.0, 42.0, 38.0, 23.0, 24.0, 26.0, 19.0, 18.0, 16.0, 14.0, 12.0, 8.0, 12.0, 13.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.671875, -24.80126953125, -23.9306640625, -23.06005859375, -22.189453125, -21.31884765625, -20.4482421875, -19.57763671875, -18.70703125, -17.83642578125, -16.9658203125, -16.09521484375, -15.224609375, -14.35400390625, -13.4833984375, -12.61279296875, -11.7421875, -10.87158203125, -10.0009765625, -9.13037109375, -8.259765625, -7.38916015625, -6.5185546875, -5.64794921875, -4.77734375, -3.90673828125, -3.0361328125, -2.16552734375, -1.294921875, -0.42431640625, 0.4462890625, 1.31689453125, 2.1875, 3.05810546875, 3.9287109375, 4.79931640625, 5.669921875, 6.54052734375, 7.4111328125, 8.28173828125, 9.15234375, 10.02294921875, 10.8935546875, 11.76416015625, 12.634765625, 13.50537109375, 14.3759765625, 15.24658203125, 16.1171875, 16.98779296875, 17.8583984375, 18.72900390625, 19.599609375, 20.47021484375, 21.3408203125, 22.21142578125, 23.08203125, 23.95263671875, 24.8232421875, 25.69384765625, 26.564453125, 27.43505859375, 28.3056640625, 29.17626953125, 30.046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 12.0, 22.0, 24.0, 36.0, 57.0, 92.0, 128.0, 199.0, 289.0, 432.0, 686.0, 1170.0, 1943.0, 3297.0, 5702.0, 10592.0, 20392.0, 42266.0, 97294.0, 232380.0, 324786.0, 169309.0, 70000.0, 31657.0, 15793.0, 8390.0, 4565.0, 2741.0, 1609.0, 998.0, 570.0, 384.0, 257.0, 168.0, 103.0, 53.0, 44.0, 41.0, 17.0, 8.0, 16.0, 13.0, 9.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-62.8125, -61.03369140625, -59.2548828125, -57.47607421875, -55.697265625, -53.91845703125, -52.1396484375, -50.36083984375, -48.58203125, -46.80322265625, -45.0244140625, -43.24560546875, -41.466796875, -39.68798828125, -37.9091796875, -36.13037109375, -34.3515625, -32.57275390625, -30.7939453125, -29.01513671875, -27.236328125, -25.45751953125, -23.6787109375, -21.89990234375, -20.12109375, -18.34228515625, -16.5634765625, -14.78466796875, -13.005859375, -11.22705078125, -9.4482421875, -7.66943359375, -5.890625, -4.11181640625, -2.3330078125, -0.55419921875, 1.224609375, 3.00341796875, 4.7822265625, 6.56103515625, 8.33984375, 10.11865234375, 11.8974609375, 13.67626953125, 15.455078125, 17.23388671875, 19.0126953125, 20.79150390625, 22.5703125, 24.34912109375, 26.1279296875, 27.90673828125, 29.685546875, 31.46435546875, 33.2431640625, 35.02197265625, 36.80078125, 38.57958984375, 40.3583984375, 42.13720703125, 43.916015625, 45.69482421875, 47.4736328125, 49.25244140625, 51.03125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 10.0, 14.0, 12.0, 27.0, 23.0, 33.0, 44.0, 40.0, 36.0, 43.0, 68.0, 64.0, 57.0, 53.0, 46.0, 58.0, 52.0, 56.0, 62.0, 30.0, 40.0, 26.0, 19.0, 13.0, 20.0, 12.0, 8.0, 8.0, 4.0, 1.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.40625, -33.435791015625, -32.46533203125, -31.494873046875, -30.5244140625, -29.553955078125, -28.58349609375, -27.613037109375, -26.642578125, -25.672119140625, -24.70166015625, -23.731201171875, -22.7607421875, -21.790283203125, -20.81982421875, -19.849365234375, -18.87890625, -17.908447265625, -16.93798828125, -15.967529296875, -14.9970703125, -14.026611328125, -13.05615234375, -12.085693359375, -11.115234375, -10.144775390625, -9.17431640625, -8.203857421875, -7.2333984375, -6.262939453125, -5.29248046875, -4.322021484375, -3.3515625, -2.381103515625, -1.41064453125, -0.440185546875, 0.5302734375, 1.500732421875, 2.47119140625, 3.441650390625, 4.412109375, 5.382568359375, 6.35302734375, 7.323486328125, 8.2939453125, 9.264404296875, 10.23486328125, 11.205322265625, 12.17578125, 13.146240234375, 14.11669921875, 15.087158203125, 16.0576171875, 17.028076171875, 17.99853515625, 18.968994140625, 19.939453125, 20.909912109375, 21.88037109375, 22.850830078125, 23.8212890625, 24.791748046875, 25.76220703125, 26.732666015625, 27.703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 10.0, 15.0, 23.0, 27.0, 38.0, 60.0, 64.0, 77.0, 134.0, 188.0, 228.0, 324.0, 495.0, 669.0, 918.0, 1400.0, 1897.0, 2849.0, 4230.0, 6612.0, 10572.0, 19720.0, 51259.0, 261841.0, 519958.0, 98304.0, 28848.0, 13899.0, 7980.0, 4905.0, 3321.0, 2328.0, 1607.0, 1100.0, 736.0, 529.0, 374.0, 277.0, 171.0, 154.0, 95.0, 90.0, 69.0, 44.0, 30.0, 23.0, 15.0, 12.0, 5.0, 4.0, 12.0, 7.0, 5.0], "bins": [-44.3125, -43.0546875, -41.796875, -40.5390625, -39.28125, -38.0234375, -36.765625, -35.5078125, -34.25, -32.9921875, -31.734375, -30.4765625, -29.21875, -27.9609375, -26.703125, -25.4453125, -24.1875, -22.9296875, -21.671875, -20.4140625, -19.15625, -17.8984375, -16.640625, -15.3828125, -14.125, -12.8671875, -11.609375, -10.3515625, -9.09375, -7.8359375, -6.578125, -5.3203125, -4.0625, -2.8046875, -1.546875, -0.2890625, 0.96875, 2.2265625, 3.484375, 4.7421875, 6.0, 7.2578125, 8.515625, 9.7734375, 11.03125, 12.2890625, 13.546875, 14.8046875, 16.0625, 17.3203125, 18.578125, 19.8359375, 21.09375, 22.3515625, 23.609375, 24.8671875, 26.125, 27.3828125, 28.640625, 29.8984375, 31.15625, 32.4140625, 33.671875, 34.9296875, 36.1875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 5.0, 7.0, 8.0, 10.0, 12.0, 23.0, 33.0, 172.0, 392.0, 171.0, 54.0, 24.0, 12.0, 14.0, 9.0, 8.0, 3.0, 4.0, 9.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0084381103515625, -0.008170723915100098, -0.007903337478637695, -0.007635951042175293, -0.007368564605712891, -0.007101178169250488, -0.006833791732788086, -0.006566405296325684, -0.006299018859863281, -0.006031632423400879, -0.0057642459869384766, -0.005496859550476074, -0.005229473114013672, -0.0049620866775512695, -0.004694700241088867, -0.004427313804626465, -0.0041599273681640625, -0.00389254093170166, -0.003625154495239258, -0.0033577680587768555, -0.003090381622314453, -0.0028229951858520508, -0.0025556087493896484, -0.002288222312927246, -0.0020208358764648438, -0.0017534494400024414, -0.001486063003540039, -0.0012186765670776367, -0.0009512901306152344, -0.000683903694152832, -0.0004165172576904297, -0.00014913082122802734, 0.000118255615234375, 0.00038564205169677734, 0.0006530284881591797, 0.000920414924621582, 0.0011878013610839844, 0.0014551877975463867, 0.001722574234008789, 0.0019899606704711914, 0.0022573471069335938, 0.002524733543395996, 0.0027921199798583984, 0.0030595064163208008, 0.003326892852783203, 0.0035942792892456055, 0.003861665725708008, 0.00412905216217041, 0.0043964385986328125, 0.004663825035095215, 0.004931211471557617, 0.0051985979080200195, 0.005465984344482422, 0.005733370780944824, 0.0060007572174072266, 0.006268143653869629, 0.006535530090332031, 0.006802916526794434, 0.007070302963256836, 0.007337689399719238, 0.007605075836181641, 0.007872462272644043, 0.008139848709106445, 0.008407235145568848, 0.00867462158203125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 13.0, 10.0, 23.0, 39.0, 46.0, 77.0, 95.0, 142.0, 222.0, 394.0, 591.0, 979.0, 1541.0, 2569.0, 4588.0, 7824.0, 14355.0, 29607.0, 100954.0, 492144.0, 288116.0, 56150.0, 21425.0, 11156.0, 6205.0, 3638.0, 2173.0, 1375.0, 790.0, 498.0, 290.0, 174.0, 116.0, 74.0, 56.0, 30.0, 28.0, 12.0, 11.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.15625, -45.57373046875, -43.9912109375, -42.40869140625, -40.826171875, -39.24365234375, -37.6611328125, -36.07861328125, -34.49609375, -32.91357421875, -31.3310546875, -29.74853515625, -28.166015625, -26.58349609375, -25.0009765625, -23.41845703125, -21.8359375, -20.25341796875, -18.6708984375, -17.08837890625, -15.505859375, -13.92333984375, -12.3408203125, -10.75830078125, -9.17578125, -7.59326171875, -6.0107421875, -4.42822265625, -2.845703125, -1.26318359375, 0.3193359375, 1.90185546875, 3.484375, 5.06689453125, 6.6494140625, 8.23193359375, 9.814453125, 11.39697265625, 12.9794921875, 14.56201171875, 16.14453125, 17.72705078125, 19.3095703125, 20.89208984375, 22.474609375, 24.05712890625, 25.6396484375, 27.22216796875, 28.8046875, 30.38720703125, 31.9697265625, 33.55224609375, 35.134765625, 36.71728515625, 38.2998046875, 39.88232421875, 41.46484375, 43.04736328125, 44.6298828125, 46.21240234375, 47.794921875, 49.37744140625, 50.9599609375, 52.54248046875, 54.125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 7.0, 8.0, 8.0, 10.0, 10.0, 15.0, 24.0, 39.0, 62.0, 95.0, 168.0, 152.0, 139.0, 81.0, 49.0, 30.0, 16.0, 11.0, 12.0, 4.0, 10.0, 6.0, 3.0, 4.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.1875, -15.6873779296875, -15.187255859375, -14.6871337890625, -14.18701171875, -13.6868896484375, -13.186767578125, -12.6866455078125, -12.1865234375, -11.6864013671875, -11.186279296875, -10.6861572265625, -10.18603515625, -9.6859130859375, -9.185791015625, -8.6856689453125, -8.185546875, -7.6854248046875, -7.185302734375, -6.6851806640625, -6.18505859375, -5.6849365234375, -5.184814453125, -4.6846923828125, -4.1845703125, -3.6844482421875, -3.184326171875, -2.6842041015625, -2.18408203125, -1.6839599609375, -1.183837890625, -0.6837158203125, -0.18359375, 0.3165283203125, 0.816650390625, 1.3167724609375, 1.81689453125, 2.3170166015625, 2.817138671875, 3.3172607421875, 3.8173828125, 4.3175048828125, 4.817626953125, 5.3177490234375, 5.81787109375, 6.3179931640625, 6.818115234375, 7.3182373046875, 7.818359375, 8.3184814453125, 8.818603515625, 9.3187255859375, 9.81884765625, 10.3189697265625, 10.819091796875, 11.3192138671875, 11.8193359375, 12.3194580078125, 12.819580078125, 13.3197021484375, 13.81982421875, 14.3199462890625, 14.820068359375, 15.3201904296875, 15.8203125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 12.0, 3.0, 5.0, 9.0, 10.0, 13.0, 15.0, 16.0, 22.0, 28.0, 39.0, 55.0, 51.0, 55.0, 49.0, 61.0, 56.0, 65.0, 45.0, 64.0, 60.0, 37.0, 44.0, 33.0, 24.0, 24.0, 29.0, 19.0, 13.0, 16.0, 7.0, 6.0, 9.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.815786361694336, -28.7351131439209, -27.654438018798828, -26.57376480102539, -25.493091583251953, -24.412418365478516, -23.331743240356445, -22.251070022583008, -21.170394897460938, -20.0897216796875, -19.00904655456543, -17.928373336791992, -16.847700119018555, -15.7670259475708, -14.686351776123047, -13.60567855834961, -12.525005340576172, -11.444331169128418, -10.36365795135498, -9.282983779907227, -8.202310562133789, -7.121636390686035, -6.040962219238281, -4.9602885246276855, -3.87961483001709, -2.798941135406494, -1.7182672023773193, -0.6375932693481445, 0.44308042526245117, 1.5237541198730469, 2.604428291320801, 3.6851019859313965, 4.765777587890625, 5.846451282501221, 6.927124977111816, 8.00779914855957, 9.088472366333008, 10.169146537780762, 11.249820709228516, 12.330493927001953, 13.411168098449707, 14.491842269897461, 15.572515487670898, 16.65319061279297, 17.733863830566406, 18.814537048339844, 19.89521026611328, 20.97588539123535, 22.05655860900879, 23.137231826782227, 24.217906951904297, 25.298580169677734, 26.379253387451172, 27.45992660522461, 28.54060173034668, 29.621274948120117, 30.701950073242188, 31.782623291015625, 32.86329650878906, 33.9439697265625, 35.0246467590332, 36.10531997680664, 37.18599319458008, 38.266666412353516, 39.34733963012695]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 5.0, 6.0, 5.0, 11.0, 8.0, 21.0, 20.0, 13.0, 24.0, 17.0, 25.0, 33.0, 30.0, 38.0, 38.0, 30.0, 47.0, 33.0, 42.0, 42.0, 37.0, 49.0, 46.0, 44.0, 50.0, 38.0, 39.0, 26.0, 30.0, 21.0, 25.0, 28.0, 17.0, 16.0, 7.0, 8.0, 5.0, 5.0, 4.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.58155059814453, -26.625232696533203, -25.668916702270508, -24.71259880065918, -23.756282806396484, -22.799964904785156, -21.84364891052246, -20.887331008911133, -19.931015014648438, -18.97469711303711, -18.018381118774414, -17.062063217163086, -16.10574722290039, -15.149429321289062, -14.193113327026367, -13.236795425415039, -12.280478477478027, -11.324161529541016, -10.367844581604004, -9.411527633666992, -8.45521068572998, -7.4988932609558105, -6.542576313018799, -5.586259365081787, -4.629942417144775, -3.6736254692077637, -2.717308521270752, -1.7609913349151611, -0.8046743869781494, 0.1516427993774414, 1.1079597473144531, 2.064276695251465, 3.0205936431884766, 3.9769105911254883, 4.9332275390625, 5.889544486999512, 6.845861434936523, 7.802178859710693, 8.758495330810547, 9.714813232421875, 10.67112922668457, 11.627446174621582, 12.583763122558594, 13.540080070495605, 14.496397018432617, 15.452714920043945, 16.40903091430664, 17.36534881591797, 18.321666717529297, 19.277984619140625, 20.23430061340332, 21.19061851501465, 22.146934509277344, 23.103252410888672, 24.059568405151367, 25.015886306762695, 25.97220230102539, 26.92852020263672, 27.884836196899414, 28.841154098510742, 29.797470092773438, 30.753787994384766, 31.71010398864746, 32.666419982910156, 33.622737884521484]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 8.0, 9.0, 30.0, 37.0, 53.0, 82.0, 130.0, 203.0, 308.0, 487.0, 768.0, 1125.0, 1865.0, 2887.0, 4666.0, 7599.0, 11832.0, 19014.0, 29574.0, 46537.0, 68938.0, 96982.0, 124774.0, 141477.0, 136109.0, 111797.0, 82614.0, 57115.0, 37283.0, 23539.0, 14905.0, 9446.0, 6013.0, 3752.0, 2376.0, 1539.0, 941.0, 615.0, 423.0, 267.0, 148.0, 98.0, 58.0, 41.0, 24.0, 20.0, 20.0, 4.0, 11.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-29.484375, -28.61083984375, -27.7373046875, -26.86376953125, -25.990234375, -25.11669921875, -24.2431640625, -23.36962890625, -22.49609375, -21.62255859375, -20.7490234375, -19.87548828125, -19.001953125, -18.12841796875, -17.2548828125, -16.38134765625, -15.5078125, -14.63427734375, -13.7607421875, -12.88720703125, -12.013671875, -11.14013671875, -10.2666015625, -9.39306640625, -8.51953125, -7.64599609375, -6.7724609375, -5.89892578125, -5.025390625, -4.15185546875, -3.2783203125, -2.40478515625, -1.53125, -0.65771484375, 0.2158203125, 1.08935546875, 1.962890625, 2.83642578125, 3.7099609375, 4.58349609375, 5.45703125, 6.33056640625, 7.2041015625, 8.07763671875, 8.951171875, 9.82470703125, 10.6982421875, 11.57177734375, 12.4453125, 13.31884765625, 14.1923828125, 15.06591796875, 15.939453125, 16.81298828125, 17.6865234375, 18.56005859375, 19.43359375, 20.30712890625, 21.1806640625, 22.05419921875, 22.927734375, 23.80126953125, 24.6748046875, 25.54833984375, 26.421875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 8.0, 6.0, 14.0, 6.0, 20.0, 24.0, 16.0, 15.0, 23.0, 30.0, 28.0, 36.0, 34.0, 34.0, 37.0, 44.0, 50.0, 43.0, 53.0, 51.0, 49.0, 55.0, 40.0, 40.0, 26.0, 40.0, 30.0, 29.0, 22.0, 18.0, 21.0, 12.0, 9.0, 9.0, 4.0, 4.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.078125, -27.083251953125, -26.08837890625, -25.093505859375, -24.0986328125, -23.103759765625, -22.10888671875, -21.114013671875, -20.119140625, -19.124267578125, -18.12939453125, -17.134521484375, -16.1396484375, -15.144775390625, -14.14990234375, -13.155029296875, -12.16015625, -11.165283203125, -10.17041015625, -9.175537109375, -8.1806640625, -7.185791015625, -6.19091796875, -5.196044921875, -4.201171875, -3.206298828125, -2.21142578125, -1.216552734375, -0.2216796875, 0.773193359375, 1.76806640625, 2.762939453125, 3.7578125, 4.752685546875, 5.74755859375, 6.742431640625, 7.7373046875, 8.732177734375, 9.72705078125, 10.721923828125, 11.716796875, 12.711669921875, 13.70654296875, 14.701416015625, 15.6962890625, 16.691162109375, 17.68603515625, 18.680908203125, 19.67578125, 20.670654296875, 21.66552734375, 22.660400390625, 23.6552734375, 24.650146484375, 25.64501953125, 26.639892578125, 27.634765625, 28.629638671875, 29.62451171875, 30.619384765625, 31.6142578125, 32.609130859375, 33.60400390625, 34.598876953125, 35.59375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 8.0, 11.0, 23.0, 26.0, 28.0, 45.0, 81.0, 107.0, 193.0, 343.0, 536.0, 914.0, 1673.0, 2870.0, 5250.0, 9889.0, 18584.0, 35513.0, 66306.0, 117412.0, 179854.0, 208078.0, 168507.0, 105873.0, 58829.0, 31403.0, 16669.0, 8659.0, 4681.0, 2621.0, 1460.0, 835.0, 441.0, 292.0, 202.0, 113.0, 68.0, 55.0, 31.0, 19.0, 17.0, 14.0, 3.0, 6.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-46.9375, -45.44287109375, -43.9482421875, -42.45361328125, -40.958984375, -39.46435546875, -37.9697265625, -36.47509765625, -34.98046875, -33.48583984375, -31.9912109375, -30.49658203125, -29.001953125, -27.50732421875, -26.0126953125, -24.51806640625, -23.0234375, -21.52880859375, -20.0341796875, -18.53955078125, -17.044921875, -15.55029296875, -14.0556640625, -12.56103515625, -11.06640625, -9.57177734375, -8.0771484375, -6.58251953125, -5.087890625, -3.59326171875, -2.0986328125, -0.60400390625, 0.890625, 2.38525390625, 3.8798828125, 5.37451171875, 6.869140625, 8.36376953125, 9.8583984375, 11.35302734375, 12.84765625, 14.34228515625, 15.8369140625, 17.33154296875, 18.826171875, 20.32080078125, 21.8154296875, 23.31005859375, 24.8046875, 26.29931640625, 27.7939453125, 29.28857421875, 30.783203125, 32.27783203125, 33.7724609375, 35.26708984375, 36.76171875, 38.25634765625, 39.7509765625, 41.24560546875, 42.740234375, 44.23486328125, 45.7294921875, 47.22412109375, 48.71875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 7.0, 4.0, 7.0, 6.0, 10.0, 11.0, 11.0, 10.0, 18.0, 27.0, 26.0, 30.0, 36.0, 37.0, 50.0, 36.0, 54.0, 48.0, 48.0, 50.0, 64.0, 53.0, 57.0, 47.0, 36.0, 42.0, 37.0, 32.0, 26.0, 16.0, 22.0, 11.0, 7.0, 7.0, 13.0, 8.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.015625, -26.24169921875, -25.4677734375, -24.69384765625, -23.919921875, -23.14599609375, -22.3720703125, -21.59814453125, -20.82421875, -20.05029296875, -19.2763671875, -18.50244140625, -17.728515625, -16.95458984375, -16.1806640625, -15.40673828125, -14.6328125, -13.85888671875, -13.0849609375, -12.31103515625, -11.537109375, -10.76318359375, -9.9892578125, -9.21533203125, -8.44140625, -7.66748046875, -6.8935546875, -6.11962890625, -5.345703125, -4.57177734375, -3.7978515625, -3.02392578125, -2.25, -1.47607421875, -0.7021484375, 0.07177734375, 0.845703125, 1.61962890625, 2.3935546875, 3.16748046875, 3.94140625, 4.71533203125, 5.4892578125, 6.26318359375, 7.037109375, 7.81103515625, 8.5849609375, 9.35888671875, 10.1328125, 10.90673828125, 11.6806640625, 12.45458984375, 13.228515625, 14.00244140625, 14.7763671875, 15.55029296875, 16.32421875, 17.09814453125, 17.8720703125, 18.64599609375, 19.419921875, 20.19384765625, 20.9677734375, 21.74169921875, 22.515625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 4.0, 9.0, 13.0, 20.0, 31.0, 39.0, 61.0, 96.0, 134.0, 189.0, 297.0, 532.0, 775.0, 1351.0, 2183.0, 3690.0, 6456.0, 11488.0, 22805.0, 47416.0, 112802.0, 272519.0, 311081.0, 139947.0, 56761.0, 26551.0, 13515.0, 7439.0, 4049.0, 2335.0, 1464.0, 840.0, 555.0, 366.0, 258.0, 156.0, 94.0, 63.0, 57.0, 32.0, 22.0, 16.0, 9.0, 10.0, 8.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.65625, -31.49462890625, -30.3330078125, -29.17138671875, -28.009765625, -26.84814453125, -25.6865234375, -24.52490234375, -23.36328125, -22.20166015625, -21.0400390625, -19.87841796875, -18.716796875, -17.55517578125, -16.3935546875, -15.23193359375, -14.0703125, -12.90869140625, -11.7470703125, -10.58544921875, -9.423828125, -8.26220703125, -7.1005859375, -5.93896484375, -4.77734375, -3.61572265625, -2.4541015625, -1.29248046875, -0.130859375, 1.03076171875, 2.1923828125, 3.35400390625, 4.515625, 5.67724609375, 6.8388671875, 8.00048828125, 9.162109375, 10.32373046875, 11.4853515625, 12.64697265625, 13.80859375, 14.97021484375, 16.1318359375, 17.29345703125, 18.455078125, 19.61669921875, 20.7783203125, 21.93994140625, 23.1015625, 24.26318359375, 25.4248046875, 26.58642578125, 27.748046875, 28.90966796875, 30.0712890625, 31.23291015625, 32.39453125, 33.55615234375, 34.7177734375, 35.87939453125, 37.041015625, 38.20263671875, 39.3642578125, 40.52587890625, 41.6875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 4.0, 3.0, 8.0, 8.0, 10.0, 9.0, 12.0, 14.0, 17.0, 26.0, 33.0, 42.0, 66.0, 73.0, 71.0, 79.0, 104.0, 92.0, 75.0, 58.0, 47.0, 29.0, 23.0, 20.0, 15.0, 9.0, 15.0, 6.0, 8.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0035305023193359375, -0.003426879644393921, -0.0033232569694519043, -0.0032196342945098877, -0.003116011619567871, -0.0030123889446258545, -0.002908766269683838, -0.0028051435947418213, -0.0027015209197998047, -0.002597898244857788, -0.0024942755699157715, -0.002390652894973755, -0.0022870302200317383, -0.0021834075450897217, -0.002079784870147705, -0.0019761621952056885, -0.0018725395202636719, -0.0017689168453216553, -0.0016652941703796387, -0.001561671495437622, -0.0014580488204956055, -0.0013544261455535889, -0.0012508034706115723, -0.0011471807956695557, -0.001043558120727539, -0.0009399354457855225, -0.0008363127708435059, -0.0007326900959014893, -0.0006290674209594727, -0.0005254447460174561, -0.00042182207107543945, -0.00031819939613342285, -0.00021457672119140625, -0.00011095404624938965, -7.331371307373047e-06, 9.629130363464355e-05, 0.00019991397857666016, 0.00030353665351867676, 0.00040715932846069336, 0.00051078200340271, 0.0006144046783447266, 0.0007180273532867432, 0.0008216500282287598, 0.0009252727031707764, 0.001028895378112793, 0.0011325180530548096, 0.0012361407279968262, 0.0013397634029388428, 0.0014433860778808594, 0.001547008752822876, 0.0016506314277648926, 0.0017542541027069092, 0.0018578767776489258, 0.0019614994525909424, 0.002065122127532959, 0.0021687448024749756, 0.002272367477416992, 0.002375990152359009, 0.0024796128273010254, 0.002583235502243042, 0.0026868581771850586, 0.002790480852127075, 0.002894103527069092, 0.0029977262020111084, 0.003101348876953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 13.0, 10.0, 9.0, 13.0, 25.0, 33.0, 38.0, 45.0, 60.0, 101.0, 144.0, 180.0, 302.0, 424.0, 673.0, 1068.0, 1799.0, 3154.0, 5878.0, 12352.0, 28577.0, 78555.0, 232677.0, 381356.0, 190279.0, 63367.0, 24062.0, 10783.0, 5207.0, 2885.0, 1645.0, 925.0, 592.0, 405.0, 274.0, 191.0, 141.0, 74.0, 64.0, 45.0, 39.0, 28.0, 12.0, 21.0, 11.0, 4.0, 4.0, 7.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.0625, -36.810546875, -35.55859375, -34.306640625, -33.0546875, -31.802734375, -30.55078125, -29.298828125, -28.046875, -26.794921875, -25.54296875, -24.291015625, -23.0390625, -21.787109375, -20.53515625, -19.283203125, -18.03125, -16.779296875, -15.52734375, -14.275390625, -13.0234375, -11.771484375, -10.51953125, -9.267578125, -8.015625, -6.763671875, -5.51171875, -4.259765625, -3.0078125, -1.755859375, -0.50390625, 0.748046875, 2.0, 3.251953125, 4.50390625, 5.755859375, 7.0078125, 8.259765625, 9.51171875, 10.763671875, 12.015625, 13.267578125, 14.51953125, 15.771484375, 17.0234375, 18.275390625, 19.52734375, 20.779296875, 22.03125, 23.283203125, 24.53515625, 25.787109375, 27.0390625, 28.291015625, 29.54296875, 30.794921875, 32.046875, 33.298828125, 34.55078125, 35.802734375, 37.0546875, 38.306640625, 39.55859375, 40.810546875, 42.0625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 9.0, 16.0, 13.0, 11.0, 18.0, 19.0, 31.0, 35.0, 44.0, 52.0, 76.0, 57.0, 81.0, 73.0, 76.0, 64.0, 70.0, 54.0, 36.0, 37.0, 24.0, 19.0, 16.0, 21.0, 14.0, 12.0, 4.0, 3.0, 1.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.890625, -10.5810546875, -10.271484375, -9.9619140625, -9.65234375, -9.3427734375, -9.033203125, -8.7236328125, -8.4140625, -8.1044921875, -7.794921875, -7.4853515625, -7.17578125, -6.8662109375, -6.556640625, -6.2470703125, -5.9375, -5.6279296875, -5.318359375, -5.0087890625, -4.69921875, -4.3896484375, -4.080078125, -3.7705078125, -3.4609375, -3.1513671875, -2.841796875, -2.5322265625, -2.22265625, -1.9130859375, -1.603515625, -1.2939453125, -0.984375, -0.6748046875, -0.365234375, -0.0556640625, 0.25390625, 0.5634765625, 0.873046875, 1.1826171875, 1.4921875, 1.8017578125, 2.111328125, 2.4208984375, 2.73046875, 3.0400390625, 3.349609375, 3.6591796875, 3.96875, 4.2783203125, 4.587890625, 4.8974609375, 5.20703125, 5.5166015625, 5.826171875, 6.1357421875, 6.4453125, 6.7548828125, 7.064453125, 7.3740234375, 7.68359375, 7.9931640625, 8.302734375, 8.6123046875, 8.921875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 7.0, 12.0, 12.0, 8.0, 11.0, 13.0, 22.0, 31.0, 29.0, 46.0, 40.0, 46.0, 54.0, 58.0, 49.0, 62.0, 51.0, 56.0, 54.0, 38.0, 33.0, 39.0, 45.0, 42.0, 24.0, 19.0, 16.0, 13.0, 22.0, 9.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.433563232421875, -26.409563064575195, -25.385562896728516, -24.361562728881836, -23.337562561035156, -22.31356430053711, -21.28956413269043, -20.26556396484375, -19.24156379699707, -18.21756362915039, -17.19356346130371, -16.16956329345703, -15.145564079284668, -14.121563911437988, -13.097564697265625, -12.073564529418945, -11.049564361572266, -10.025564193725586, -9.001564025878906, -7.977564811706543, -6.953564643859863, -5.929564476013184, -4.905564785003662, -3.8815650939941406, -2.857564926147461, -1.8335649967193604, -0.8095650672912598, 0.21443486213684082, 1.2384347915649414, 2.262434959411621, 3.2864346504211426, 4.310434341430664, 5.334434509277344, 6.358434677124023, 7.382434368133545, 8.406434059143066, 9.430434226989746, 10.454434394836426, 11.478433609008789, 12.502433776855469, 13.526433944702148, 14.550434112548828, 15.574434280395508, 16.598434448242188, 17.622432708740234, 18.646434783935547, 19.670433044433594, 20.694433212280273, 21.718433380126953, 22.742433547973633, 23.766433715820312, 24.790433883666992, 25.814434051513672, 26.83843231201172, 27.8624324798584, 28.886432647705078, 29.910432815551758, 30.934432983398438, 31.958433151245117, 32.9824333190918, 34.006431579589844, 35.030433654785156, 36.0544319152832, 37.07843017578125, 38.10243225097656]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 7.0, 6.0, 11.0, 11.0, 10.0, 8.0, 24.0, 18.0, 21.0, 18.0, 30.0, 28.0, 24.0, 36.0, 37.0, 33.0, 32.0, 53.0, 40.0, 45.0, 39.0, 47.0, 42.0, 37.0, 40.0, 35.0, 29.0, 33.0, 36.0, 28.0, 16.0, 22.0, 17.0, 16.0, 17.0, 6.0, 11.0, 9.0, 7.0, 3.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.413799285888672, -26.500789642333984, -25.587778091430664, -24.674766540527344, -23.761756896972656, -22.84874725341797, -21.93573570251465, -21.022724151611328, -20.10971450805664, -19.196704864501953, -18.283693313598633, -17.370681762695312, -16.457672119140625, -15.544661521911621, -14.631650924682617, -13.718640327453613, -12.80562973022461, -11.892619132995605, -10.979608535766602, -10.066597938537598, -9.153587341308594, -8.24057674407959, -7.327566146850586, -6.414555549621582, -5.501544952392578, -4.588534355163574, -3.6755237579345703, -2.7625131607055664, -1.8495025634765625, -0.9364919662475586, -0.023481369018554688, 0.8895292282104492, 1.802541732788086, 2.71555233001709, 3.6285629272460938, 4.541573524475098, 5.454584121704102, 6.3675947189331055, 7.280605316162109, 8.193615913391113, 9.106626510620117, 10.019637107849121, 10.932647705078125, 11.845658302307129, 12.758668899536133, 13.671679496765137, 14.58469009399414, 15.497700691223145, 16.41071128845215, 17.32372283935547, 18.236732482910156, 19.149742126464844, 20.062753677368164, 20.975765228271484, 21.888774871826172, 22.80178451538086, 23.71479606628418, 24.6278076171875, 25.540817260742188, 26.453826904296875, 27.366838455200195, 28.279850006103516, 29.192859649658203, 30.10586929321289, 31.01888084411621]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 5.0, 6.0, 11.0, 21.0, 36.0, 52.0, 56.0, 136.0, 203.0, 344.0, 535.0, 844.0, 1346.0, 2225.0, 3514.0, 5793.0, 9512.0, 16231.0, 28510.0, 52314.0, 99857.0, 200680.0, 407846.0, 736519.0, 945563.0, 777592.0, 445445.0, 220266.0, 108409.0, 56690.0, 30864.0, 17104.0, 9872.0, 5943.0, 3691.0, 2327.0, 1448.0, 871.0, 550.0, 400.0, 224.0, 141.0, 93.0, 58.0, 47.0, 29.0, 18.0, 19.0, 12.0, 7.0, 7.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.3125, -25.35791015625, -24.4033203125, -23.44873046875, -22.494140625, -21.53955078125, -20.5849609375, -19.63037109375, -18.67578125, -17.72119140625, -16.7666015625, -15.81201171875, -14.857421875, -13.90283203125, -12.9482421875, -11.99365234375, -11.0390625, -10.08447265625, -9.1298828125, -8.17529296875, -7.220703125, -6.26611328125, -5.3115234375, -4.35693359375, -3.40234375, -2.44775390625, -1.4931640625, -0.53857421875, 0.416015625, 1.37060546875, 2.3251953125, 3.27978515625, 4.234375, 5.18896484375, 6.1435546875, 7.09814453125, 8.052734375, 9.00732421875, 9.9619140625, 10.91650390625, 11.87109375, 12.82568359375, 13.7802734375, 14.73486328125, 15.689453125, 16.64404296875, 17.5986328125, 18.55322265625, 19.5078125, 20.46240234375, 21.4169921875, 22.37158203125, 23.326171875, 24.28076171875, 25.2353515625, 26.18994140625, 27.14453125, 28.09912109375, 29.0537109375, 30.00830078125, 30.962890625, 31.91748046875, 32.8720703125, 33.82666015625, 34.78125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 6.0, 1.0, 9.0, 9.0, 5.0, 6.0, 9.0, 11.0, 15.0, 23.0, 21.0, 27.0, 17.0, 42.0, 34.0, 29.0, 24.0, 38.0, 35.0, 30.0, 41.0, 45.0, 46.0, 35.0, 47.0, 40.0, 42.0, 34.0, 31.0, 36.0, 31.0, 27.0, 21.0, 18.0, 20.0, 17.0, 10.0, 8.0, 11.0, 18.0, 6.0, 7.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.109375, -21.3740234375, -20.638671875, -19.9033203125, -19.16796875, -18.4326171875, -17.697265625, -16.9619140625, -16.2265625, -15.4912109375, -14.755859375, -14.0205078125, -13.28515625, -12.5498046875, -11.814453125, -11.0791015625, -10.34375, -9.6083984375, -8.873046875, -8.1376953125, -7.40234375, -6.6669921875, -5.931640625, -5.1962890625, -4.4609375, -3.7255859375, -2.990234375, -2.2548828125, -1.51953125, -0.7841796875, -0.048828125, 0.6865234375, 1.421875, 2.1572265625, 2.892578125, 3.6279296875, 4.36328125, 5.0986328125, 5.833984375, 6.5693359375, 7.3046875, 8.0400390625, 8.775390625, 9.5107421875, 10.24609375, 10.9814453125, 11.716796875, 12.4521484375, 13.1875, 13.9228515625, 14.658203125, 15.3935546875, 16.12890625, 16.8642578125, 17.599609375, 18.3349609375, 19.0703125, 19.8056640625, 20.541015625, 21.2763671875, 22.01171875, 22.7470703125, 23.482421875, 24.2177734375, 24.953125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 13.0, 21.0, 20.0, 20.0, 47.0, 69.0, 104.0, 154.0, 241.0, 386.0, 561.0, 877.0, 1410.0, 2189.0, 3592.0, 5726.0, 9337.0, 15481.0, 26347.0, 45203.0, 80555.0, 146782.0, 268056.0, 475989.0, 742071.0, 847481.0, 645143.0, 387409.0, 214092.0, 116982.0, 64904.0, 37323.0, 21646.0, 12894.0, 7887.0, 4885.0, 3001.0, 1964.0, 1246.0, 746.0, 494.0, 311.0, 226.0, 145.0, 88.0, 51.0, 41.0, 27.0, 14.0, 13.0, 9.0, 6.0, 2.0, 5.0, 0.0, 2.0, 1.0], "bins": [-31.1875, -30.222412109375, -29.25732421875, -28.292236328125, -27.3271484375, -26.362060546875, -25.39697265625, -24.431884765625, -23.466796875, -22.501708984375, -21.53662109375, -20.571533203125, -19.6064453125, -18.641357421875, -17.67626953125, -16.711181640625, -15.74609375, -14.781005859375, -13.81591796875, -12.850830078125, -11.8857421875, -10.920654296875, -9.95556640625, -8.990478515625, -8.025390625, -7.060302734375, -6.09521484375, -5.130126953125, -4.1650390625, -3.199951171875, -2.23486328125, -1.269775390625, -0.3046875, 0.660400390625, 1.62548828125, 2.590576171875, 3.5556640625, 4.520751953125, 5.48583984375, 6.450927734375, 7.416015625, 8.381103515625, 9.34619140625, 10.311279296875, 11.2763671875, 12.241455078125, 13.20654296875, 14.171630859375, 15.13671875, 16.101806640625, 17.06689453125, 18.031982421875, 18.9970703125, 19.962158203125, 20.92724609375, 21.892333984375, 22.857421875, 23.822509765625, 24.78759765625, 25.752685546875, 26.7177734375, 27.682861328125, 28.64794921875, 29.613037109375, 30.578125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 9.0, 17.0, 16.0, 20.0, 30.0, 37.0, 33.0, 50.0, 68.0, 84.0, 105.0, 132.0, 148.0, 196.0, 204.0, 211.0, 272.0, 282.0, 284.0, 283.0, 257.0, 245.0, 208.0, 147.0, 139.0, 125.0, 105.0, 75.0, 61.0, 44.0, 38.0, 21.0, 24.0, 19.0, 16.0, 15.0, 18.0, 7.0, 5.0, 6.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-13.0703125, -12.6917724609375, -12.313232421875, -11.9346923828125, -11.55615234375, -11.1776123046875, -10.799072265625, -10.4205322265625, -10.0419921875, -9.6634521484375, -9.284912109375, -8.9063720703125, -8.52783203125, -8.1492919921875, -7.770751953125, -7.3922119140625, -7.013671875, -6.6351318359375, -6.256591796875, -5.8780517578125, -5.49951171875, -5.1209716796875, -4.742431640625, -4.3638916015625, -3.9853515625, -3.6068115234375, -3.228271484375, -2.8497314453125, -2.47119140625, -2.0926513671875, -1.714111328125, -1.3355712890625, -0.95703125, -0.5784912109375, -0.199951171875, 0.1785888671875, 0.55712890625, 0.9356689453125, 1.314208984375, 1.6927490234375, 2.0712890625, 2.4498291015625, 2.828369140625, 3.2069091796875, 3.58544921875, 3.9639892578125, 4.342529296875, 4.7210693359375, 5.099609375, 5.4781494140625, 5.856689453125, 6.2352294921875, 6.61376953125, 6.9923095703125, 7.370849609375, 7.7493896484375, 8.1279296875, 8.5064697265625, 8.885009765625, 9.2635498046875, 9.64208984375, 10.0206298828125, 10.399169921875, 10.7777099609375, 11.15625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 5.0, 5.0, 13.0, 19.0, 19.0, 25.0, 20.0, 27.0, 31.0, 37.0, 34.0, 43.0, 46.0, 39.0, 56.0, 51.0, 60.0, 46.0, 55.0, 53.0, 45.0, 36.0, 46.0, 28.0, 24.0, 22.0, 20.0, 20.0, 14.0, 13.0, 12.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.818099975585938, -27.872392654418945, -26.926685333251953, -25.98097801208496, -25.03527069091797, -24.089563369750977, -23.143856048583984, -22.198148727416992, -21.25244140625, -20.306734085083008, -19.361026763916016, -18.415319442749023, -17.46961212158203, -16.52390480041504, -15.578197479248047, -14.632490158081055, -13.686782836914062, -12.74107551574707, -11.795368194580078, -10.849660873413086, -9.903953552246094, -8.958246231079102, -8.01253890991211, -7.066831588745117, -6.121124267578125, -5.175416946411133, -4.229709625244141, -3.2840023040771484, -2.3382949829101562, -1.392587661743164, -0.4468803405761719, 0.4988269805908203, 1.4445323944091797, 2.390239715576172, 3.335947036743164, 4.281654357910156, 5.227361679077148, 6.173069000244141, 7.118776321411133, 8.064483642578125, 9.010190963745117, 9.95589828491211, 10.901605606079102, 11.847312927246094, 12.793020248413086, 13.738727569580078, 14.68443489074707, 15.630142211914062, 16.575849533081055, 17.521556854248047, 18.46726417541504, 19.41297149658203, 20.358678817749023, 21.304386138916016, 22.250093460083008, 23.19580078125, 24.141508102416992, 25.087215423583984, 26.032922744750977, 26.97863006591797, 27.92433738708496, 28.870044708251953, 29.815752029418945, 30.761459350585938, 31.70716667175293]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 14.0, 12.0, 9.0, 21.0, 18.0, 17.0, 25.0, 23.0, 26.0, 21.0, 28.0, 30.0, 20.0, 35.0, 43.0, 37.0, 37.0, 33.0, 51.0, 44.0, 35.0, 47.0, 41.0, 33.0, 33.0, 33.0, 22.0, 28.0, 24.0, 25.0, 22.0, 23.0, 9.0, 20.0, 9.0, 9.0, 6.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.12867546081543, -23.302513122558594, -22.476348876953125, -21.65018653869629, -20.824024200439453, -19.997859954833984, -19.17169761657715, -18.345535278320312, -17.519371032714844, -16.693208694458008, -15.867044448852539, -15.040882110595703, -14.21471881866455, -13.388555526733398, -12.562393188476562, -11.73622989654541, -10.910066604614258, -10.083903312683105, -9.257740020751953, -8.431577682495117, -7.605414390563965, -6.7792510986328125, -5.953088283538818, -5.126925468444824, -4.300762176513672, -3.4745991230010986, -2.6484360694885254, -1.8222730159759521, -0.9961099624633789, -0.16994667053222656, 0.6562161445617676, 1.4823789596557617, 2.3085403442382812, 3.1347033977508545, 3.9608664512634277, 4.787029266357422, 5.613192558288574, 6.439355850219727, 7.265518665313721, 8.091681480407715, 8.917844772338867, 9.74400806427002, 10.570171356201172, 11.396333694458008, 12.22249698638916, 13.048660278320312, 13.874822616577148, 14.7009859085083, 15.527149200439453, 16.35331153869629, 17.179475784301758, 18.005638122558594, 18.831802368164062, 19.6579647064209, 20.484127044677734, 21.310291290283203, 22.13645362854004, 22.962615966796875, 23.788780212402344, 24.61494255065918, 25.441104888916016, 26.267269134521484, 27.09343147277832, 27.919593811035156, 28.745758056640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 7.0, 14.0, 14.0, 17.0, 21.0, 39.0, 64.0, 79.0, 135.0, 192.0, 288.0, 394.0, 591.0, 912.0, 1520.0, 2533.0, 4514.0, 9067.0, 18197.0, 39050.0, 86705.0, 181037.0, 286228.0, 215337.0, 106119.0, 48585.0, 22604.0, 10884.0, 5531.0, 3003.0, 1760.0, 1079.0, 651.0, 486.0, 286.0, 209.0, 135.0, 84.0, 62.0, 49.0, 22.0, 21.0, 12.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.46875, -41.08251953125, -39.6962890625, -38.31005859375, -36.923828125, -35.53759765625, -34.1513671875, -32.76513671875, -31.37890625, -29.99267578125, -28.6064453125, -27.22021484375, -25.833984375, -24.44775390625, -23.0615234375, -21.67529296875, -20.2890625, -18.90283203125, -17.5166015625, -16.13037109375, -14.744140625, -13.35791015625, -11.9716796875, -10.58544921875, -9.19921875, -7.81298828125, -6.4267578125, -5.04052734375, -3.654296875, -2.26806640625, -0.8818359375, 0.50439453125, 1.890625, 3.27685546875, 4.6630859375, 6.04931640625, 7.435546875, 8.82177734375, 10.2080078125, 11.59423828125, 12.98046875, 14.36669921875, 15.7529296875, 17.13916015625, 18.525390625, 19.91162109375, 21.2978515625, 22.68408203125, 24.0703125, 25.45654296875, 26.8427734375, 28.22900390625, 29.615234375, 31.00146484375, 32.3876953125, 33.77392578125, 35.16015625, 36.54638671875, 37.9326171875, 39.31884765625, 40.705078125, 42.09130859375, 43.4775390625, 44.86376953125, 46.25]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 8.0, 4.0, 6.0, 9.0, 15.0, 13.0, 19.0, 16.0, 20.0, 24.0, 21.0, 25.0, 31.0, 38.0, 26.0, 32.0, 33.0, 30.0, 46.0, 35.0, 38.0, 38.0, 41.0, 44.0, 53.0, 39.0, 38.0, 18.0, 34.0, 27.0, 28.0, 21.0, 28.0, 26.0, 12.0, 16.0, 11.0, 6.0, 7.0, 4.0, 7.0, 3.0, 5.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-28.21875, -27.362548828125, -26.50634765625, -25.650146484375, -24.7939453125, -23.937744140625, -23.08154296875, -22.225341796875, -21.369140625, -20.512939453125, -19.65673828125, -18.800537109375, -17.9443359375, -17.088134765625, -16.23193359375, -15.375732421875, -14.51953125, -13.663330078125, -12.80712890625, -11.950927734375, -11.0947265625, -10.238525390625, -9.38232421875, -8.526123046875, -7.669921875, -6.813720703125, -5.95751953125, -5.101318359375, -4.2451171875, -3.388916015625, -2.53271484375, -1.676513671875, -0.8203125, 0.035888671875, 0.89208984375, 1.748291015625, 2.6044921875, 3.460693359375, 4.31689453125, 5.173095703125, 6.029296875, 6.885498046875, 7.74169921875, 8.597900390625, 9.4541015625, 10.310302734375, 11.16650390625, 12.022705078125, 12.87890625, 13.735107421875, 14.59130859375, 15.447509765625, 16.3037109375, 17.159912109375, 18.01611328125, 18.872314453125, 19.728515625, 20.584716796875, 21.44091796875, 22.297119140625, 23.1533203125, 24.009521484375, 24.86572265625, 25.721923828125, 26.578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 12.0, 12.0, 11.0, 13.0, 30.0, 34.0, 49.0, 79.0, 127.0, 197.0, 270.0, 426.0, 657.0, 1034.0, 1577.0, 2644.0, 4418.0, 7863.0, 14255.0, 28216.0, 56593.0, 117973.0, 227217.0, 267745.0, 158814.0, 77011.0, 37729.0, 19231.0, 9936.0, 5667.0, 3232.0, 2017.0, 1210.0, 749.0, 517.0, 299.0, 220.0, 155.0, 97.0, 68.0, 51.0, 31.0, 34.0, 14.0, 14.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-44.90625, -43.630859375, -42.35546875, -41.080078125, -39.8046875, -38.529296875, -37.25390625, -35.978515625, -34.703125, -33.427734375, -32.15234375, -30.876953125, -29.6015625, -28.326171875, -27.05078125, -25.775390625, -24.5, -23.224609375, -21.94921875, -20.673828125, -19.3984375, -18.123046875, -16.84765625, -15.572265625, -14.296875, -13.021484375, -11.74609375, -10.470703125, -9.1953125, -7.919921875, -6.64453125, -5.369140625, -4.09375, -2.818359375, -1.54296875, -0.267578125, 1.0078125, 2.283203125, 3.55859375, 4.833984375, 6.109375, 7.384765625, 8.66015625, 9.935546875, 11.2109375, 12.486328125, 13.76171875, 15.037109375, 16.3125, 17.587890625, 18.86328125, 20.138671875, 21.4140625, 22.689453125, 23.96484375, 25.240234375, 26.515625, 27.791015625, 29.06640625, 30.341796875, 31.6171875, 32.892578125, 34.16796875, 35.443359375, 36.71875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 7.0, 22.0, 10.0, 9.0, 18.0, 32.0, 34.0, 34.0, 38.0, 25.0, 44.0, 54.0, 49.0, 44.0, 64.0, 51.0, 50.0, 48.0, 44.0, 59.0, 36.0, 37.0, 30.0, 24.0, 26.0, 22.0, 16.0, 12.0, 15.0, 9.0, 6.0, 6.0, 8.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-29.46875, -28.689453125, -27.91015625, -27.130859375, -26.3515625, -25.572265625, -24.79296875, -24.013671875, -23.234375, -22.455078125, -21.67578125, -20.896484375, -20.1171875, -19.337890625, -18.55859375, -17.779296875, -17.0, -16.220703125, -15.44140625, -14.662109375, -13.8828125, -13.103515625, -12.32421875, -11.544921875, -10.765625, -9.986328125, -9.20703125, -8.427734375, -7.6484375, -6.869140625, -6.08984375, -5.310546875, -4.53125, -3.751953125, -2.97265625, -2.193359375, -1.4140625, -0.634765625, 0.14453125, 0.923828125, 1.703125, 2.482421875, 3.26171875, 4.041015625, 4.8203125, 5.599609375, 6.37890625, 7.158203125, 7.9375, 8.716796875, 9.49609375, 10.275390625, 11.0546875, 11.833984375, 12.61328125, 13.392578125, 14.171875, 14.951171875, 15.73046875, 16.509765625, 17.2890625, 18.068359375, 18.84765625, 19.626953125, 20.40625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 8.0, 7.0, 13.0, 18.0, 19.0, 33.0, 54.0, 66.0, 82.0, 110.0, 188.0, 220.0, 359.0, 497.0, 749.0, 1150.0, 1910.0, 3592.0, 7565.0, 19644.0, 65872.0, 279953.0, 473455.0, 134874.0, 34286.0, 11656.0, 5271.0, 2625.0, 1448.0, 883.0, 588.0, 392.0, 251.0, 204.0, 133.0, 108.0, 59.0, 51.0, 37.0, 25.0, 27.0, 22.0, 12.0, 10.0, 7.0, 7.0, 4.0, 4.0, 3.0, 2.0], "bins": [-25.78125, -25.070068359375, -24.35888671875, -23.647705078125, -22.9365234375, -22.225341796875, -21.51416015625, -20.802978515625, -20.091796875, -19.380615234375, -18.66943359375, -17.958251953125, -17.2470703125, -16.535888671875, -15.82470703125, -15.113525390625, -14.40234375, -13.691162109375, -12.97998046875, -12.268798828125, -11.5576171875, -10.846435546875, -10.13525390625, -9.424072265625, -8.712890625, -8.001708984375, -7.29052734375, -6.579345703125, -5.8681640625, -5.156982421875, -4.44580078125, -3.734619140625, -3.0234375, -2.312255859375, -1.60107421875, -0.889892578125, -0.1787109375, 0.532470703125, 1.24365234375, 1.954833984375, 2.666015625, 3.377197265625, 4.08837890625, 4.799560546875, 5.5107421875, 6.221923828125, 6.93310546875, 7.644287109375, 8.35546875, 9.066650390625, 9.77783203125, 10.489013671875, 11.2001953125, 11.911376953125, 12.62255859375, 13.333740234375, 14.044921875, 14.756103515625, 15.46728515625, 16.178466796875, 16.8896484375, 17.600830078125, 18.31201171875, 19.023193359375, 19.734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 8.0, 5.0, 6.0, 10.0, 10.0, 20.0, 52.0, 144.0, 255.0, 261.0, 126.0, 53.0, 23.0, 11.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024566650390625, -0.0023118257522583008, -0.0021669864654541016, -0.0020221471786499023, -0.0018773078918457031, -0.001732468605041504, -0.0015876293182373047, -0.0014427900314331055, -0.0012979507446289062, -0.001153111457824707, -0.0010082721710205078, -0.0008634328842163086, -0.0007185935974121094, -0.0005737543106079102, -0.00042891502380371094, -0.0002840757369995117, -0.0001392364501953125, 5.602836608886719e-06, 0.00015044212341308594, 0.00029528141021728516, 0.0004401206970214844, 0.0005849599838256836, 0.0007297992706298828, 0.000874638557434082, 0.0010194778442382812, 0.0011643171310424805, 0.0013091564178466797, 0.001453995704650879, 0.0015988349914550781, 0.0017436742782592773, 0.0018885135650634766, 0.0020333528518676758, 0.002178192138671875, 0.0023230314254760742, 0.0024678707122802734, 0.0026127099990844727, 0.002757549285888672, 0.002902388572692871, 0.0030472278594970703, 0.0031920671463012695, 0.0033369064331054688, 0.003481745719909668, 0.003626585006713867, 0.0037714242935180664, 0.003916263580322266, 0.004061102867126465, 0.004205942153930664, 0.004350781440734863, 0.0044956207275390625, 0.004640460014343262, 0.004785299301147461, 0.00493013858795166, 0.005074977874755859, 0.005219817161560059, 0.005364656448364258, 0.005509495735168457, 0.005654335021972656, 0.0057991743087768555, 0.005944013595581055, 0.006088852882385254, 0.006233692169189453, 0.006378531455993652, 0.0065233707427978516, 0.006668210029602051, 0.00681304931640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 9.0, 4.0, 24.0, 31.0, 39.0, 42.0, 64.0, 97.0, 133.0, 159.0, 249.0, 297.0, 412.0, 559.0, 679.0, 1091.0, 1558.0, 2358.0, 4030.0, 7364.0, 14625.0, 34619.0, 96638.0, 273448.0, 354491.0, 157112.0, 53000.0, 21010.0, 9810.0, 5185.0, 3025.0, 1883.0, 1269.0, 882.0, 614.0, 459.0, 367.0, 209.0, 210.0, 134.0, 99.0, 70.0, 51.0, 49.0, 27.0, 23.0, 17.0, 12.0, 8.0, 3.0, 6.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.296875, -20.65576171875, -20.0146484375, -19.37353515625, -18.732421875, -18.09130859375, -17.4501953125, -16.80908203125, -16.16796875, -15.52685546875, -14.8857421875, -14.24462890625, -13.603515625, -12.96240234375, -12.3212890625, -11.68017578125, -11.0390625, -10.39794921875, -9.7568359375, -9.11572265625, -8.474609375, -7.83349609375, -7.1923828125, -6.55126953125, -5.91015625, -5.26904296875, -4.6279296875, -3.98681640625, -3.345703125, -2.70458984375, -2.0634765625, -1.42236328125, -0.78125, -0.14013671875, 0.5009765625, 1.14208984375, 1.783203125, 2.42431640625, 3.0654296875, 3.70654296875, 4.34765625, 4.98876953125, 5.6298828125, 6.27099609375, 6.912109375, 7.55322265625, 8.1943359375, 8.83544921875, 9.4765625, 10.11767578125, 10.7587890625, 11.39990234375, 12.041015625, 12.68212890625, 13.3232421875, 13.96435546875, 14.60546875, 15.24658203125, 15.8876953125, 16.52880859375, 17.169921875, 17.81103515625, 18.4521484375, 19.09326171875, 19.734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 9.0, 6.0, 13.0, 15.0, 37.0, 52.0, 84.0, 97.0, 115.0, 128.0, 130.0, 90.0, 74.0, 40.0, 23.0, 20.0, 15.0, 4.0, 7.0, 4.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30078125, -7.04290771484375, -6.7850341796875, -6.52716064453125, -6.269287109375, -6.01141357421875, -5.7535400390625, -5.49566650390625, -5.23779296875, -4.97991943359375, -4.7220458984375, -4.46417236328125, -4.206298828125, -3.94842529296875, -3.6905517578125, -3.43267822265625, -3.1748046875, -2.91693115234375, -2.6590576171875, -2.40118408203125, -2.143310546875, -1.88543701171875, -1.6275634765625, -1.36968994140625, -1.11181640625, -0.85394287109375, -0.5960693359375, -0.33819580078125, -0.080322265625, 0.17755126953125, 0.4354248046875, 0.69329833984375, 0.951171875, 1.20904541015625, 1.4669189453125, 1.72479248046875, 1.982666015625, 2.24053955078125, 2.4984130859375, 2.75628662109375, 3.01416015625, 3.27203369140625, 3.5299072265625, 3.78778076171875, 4.045654296875, 4.30352783203125, 4.5614013671875, 4.81927490234375, 5.0771484375, 5.33502197265625, 5.5928955078125, 5.85076904296875, 6.108642578125, 6.36651611328125, 6.6243896484375, 6.88226318359375, 7.14013671875, 7.39801025390625, 7.6558837890625, 7.91375732421875, 8.171630859375, 8.42950439453125, 8.6873779296875, 8.94525146484375, 9.203125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 6.0, 7.0, 9.0, 9.0, 16.0, 19.0, 16.0, 29.0, 28.0, 35.0, 49.0, 37.0, 52.0, 49.0, 55.0, 56.0, 58.0, 57.0, 51.0, 46.0, 35.0, 52.0, 42.0, 44.0, 18.0, 21.0, 25.0, 15.0, 10.0, 11.0, 9.0, 5.0, 4.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.20750617980957, -29.230022430419922, -28.252538681030273, -27.275054931640625, -26.297569274902344, -25.320085525512695, -24.342601776123047, -23.3651180267334, -22.38763427734375, -21.4101505279541, -20.432666778564453, -19.455181121826172, -18.477697372436523, -17.500213623046875, -16.522729873657227, -15.545246124267578, -14.567760467529297, -13.590276718139648, -12.612792015075684, -11.635308265686035, -10.65782356262207, -9.680339813232422, -8.702856063842773, -7.725371837615967, -6.74788761138916, -5.7704033851623535, -4.792919158935547, -3.8154354095458984, -2.837951183319092, -1.8604669570922852, -0.8829832077026367, 0.09450101852416992, 1.0719871520996094, 2.049471378326416, 3.0269553661346436, 4.004439353942871, 4.981923580169678, 5.959407806396484, 6.936891555786133, 7.9143757820129395, 8.891860008239746, 9.869343757629395, 10.84682846069336, 11.824312210083008, 12.801795959472656, 13.779280662536621, 14.75676441192627, 15.734249114990234, 16.711732864379883, 17.68921661376953, 18.66670036315918, 19.644184112548828, 20.62166976928711, 21.599153518676758, 22.576637268066406, 23.554121017456055, 24.531604766845703, 25.50908851623535, 26.486572265625, 27.46405792236328, 28.44154167175293, 29.419025421142578, 30.396509170532227, 31.373992919921875, 32.351478576660156]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 8.0, 6.0, 11.0, 10.0, 12.0, 17.0, 16.0, 18.0, 25.0, 25.0, 20.0, 34.0, 19.0, 36.0, 32.0, 33.0, 40.0, 47.0, 47.0, 51.0, 44.0, 37.0, 41.0, 44.0, 39.0, 35.0, 28.0, 26.0, 32.0, 31.0, 24.0, 25.0, 17.0, 12.0, 20.0, 7.0, 9.0, 2.0, 3.0, 8.0, 2.0, 1.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.00399398803711, -25.13258171081543, -24.261171340942383, -23.389759063720703, -22.518346786499023, -21.646934509277344, -20.775524139404297, -19.904111862182617, -19.032699584960938, -18.161287307739258, -17.28987693786621, -16.41846466064453, -15.547052383422852, -14.675641059875488, -13.804229736328125, -12.932817459106445, -12.061407089233398, -11.189995765686035, -10.318583488464355, -9.447172164916992, -8.575759887695312, -7.704348564147949, -6.832937240600586, -5.9615254402160645, -5.090113639831543, -4.2187018394470215, -3.347290277481079, -2.4758787155151367, -1.6044669151306152, -0.7330551147460938, 0.13835620880126953, 1.009768009185791, 1.8811798095703125, 2.752591609954834, 3.6240031719207764, 4.495414733886719, 5.36682653427124, 6.238238334655762, 7.109649658203125, 7.9810614585876465, 8.852473258972168, 9.723884582519531, 10.595296859741211, 11.466708183288574, 12.338119506835938, 13.209531784057617, 14.08094310760498, 14.952354431152344, 15.823766708374023, 16.695178985595703, 17.56658935546875, 18.43800163269043, 19.30941390991211, 20.180824279785156, 21.052236557006836, 21.923648834228516, 22.795059204101562, 23.666471481323242, 24.53788185119629, 25.40929412841797, 26.28070640563965, 27.152118682861328, 28.023529052734375, 28.894941329956055, 29.766353607177734]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 9.0, 17.0, 29.0, 32.0, 58.0, 72.0, 126.0, 193.0, 287.0, 422.0, 683.0, 1025.0, 1577.0, 2469.0, 3930.0, 6025.0, 9444.0, 14690.0, 22644.0, 34995.0, 53014.0, 76424.0, 103712.0, 127862.0, 137354.0, 126727.0, 102437.0, 74718.0, 51338.0, 33909.0, 22315.0, 14306.0, 9132.0, 5825.0, 3799.0, 2435.0, 1579.0, 1053.0, 641.0, 431.0, 290.0, 186.0, 104.0, 91.0, 54.0, 33.0, 19.0, 10.0, 12.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-27.625, -26.774169921875, -25.92333984375, -25.072509765625, -24.2216796875, -23.370849609375, -22.52001953125, -21.669189453125, -20.818359375, -19.967529296875, -19.11669921875, -18.265869140625, -17.4150390625, -16.564208984375, -15.71337890625, -14.862548828125, -14.01171875, -13.160888671875, -12.31005859375, -11.459228515625, -10.6083984375, -9.757568359375, -8.90673828125, -8.055908203125, -7.205078125, -6.354248046875, -5.50341796875, -4.652587890625, -3.8017578125, -2.950927734375, -2.10009765625, -1.249267578125, -0.3984375, 0.452392578125, 1.30322265625, 2.154052734375, 3.0048828125, 3.855712890625, 4.70654296875, 5.557373046875, 6.408203125, 7.259033203125, 8.10986328125, 8.960693359375, 9.8115234375, 10.662353515625, 11.51318359375, 12.364013671875, 13.21484375, 14.065673828125, 14.91650390625, 15.767333984375, 16.6181640625, 17.468994140625, 18.31982421875, 19.170654296875, 20.021484375, 20.872314453125, 21.72314453125, 22.573974609375, 23.4248046875, 24.275634765625, 25.12646484375, 25.977294921875, 26.828125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 5.0, 7.0, 9.0, 12.0, 21.0, 17.0, 26.0, 19.0, 31.0, 15.0, 27.0, 40.0, 23.0, 40.0, 35.0, 44.0, 32.0, 51.0, 47.0, 35.0, 35.0, 56.0, 48.0, 49.0, 35.0, 38.0, 22.0, 28.0, 18.0, 29.0, 18.0, 27.0, 15.0, 8.0, 9.0, 3.0, 6.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.359375, -25.468994140625, -24.57861328125, -23.688232421875, -22.7978515625, -21.907470703125, -21.01708984375, -20.126708984375, -19.236328125, -18.345947265625, -17.45556640625, -16.565185546875, -15.6748046875, -14.784423828125, -13.89404296875, -13.003662109375, -12.11328125, -11.222900390625, -10.33251953125, -9.442138671875, -8.5517578125, -7.661376953125, -6.77099609375, -5.880615234375, -4.990234375, -4.099853515625, -3.20947265625, -2.319091796875, -1.4287109375, -0.538330078125, 0.35205078125, 1.242431640625, 2.1328125, 3.023193359375, 3.91357421875, 4.803955078125, 5.6943359375, 6.584716796875, 7.47509765625, 8.365478515625, 9.255859375, 10.146240234375, 11.03662109375, 11.927001953125, 12.8173828125, 13.707763671875, 14.59814453125, 15.488525390625, 16.37890625, 17.269287109375, 18.15966796875, 19.050048828125, 19.9404296875, 20.830810546875, 21.72119140625, 22.611572265625, 23.501953125, 24.392333984375, 25.28271484375, 26.173095703125, 27.0634765625, 27.953857421875, 28.84423828125, 29.734619140625, 30.625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 6.0, 5.0, 6.0, 5.0, 15.0, 26.0, 28.0, 49.0, 71.0, 115.0, 157.0, 243.0, 348.0, 534.0, 759.0, 1135.0, 1725.0, 2602.0, 4074.0, 6282.0, 9788.0, 14939.0, 23948.0, 36965.0, 56926.0, 83416.0, 115351.0, 140204.0, 144576.0, 124965.0, 93851.0, 64798.0, 43166.0, 27495.0, 17670.0, 11366.0, 7387.0, 4731.0, 2979.0, 1976.0, 1263.0, 802.0, 567.0, 398.0, 270.0, 179.0, 118.0, 88.0, 63.0, 54.0, 23.0, 20.0, 17.0, 8.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-30.09375, -29.09619140625, -28.0986328125, -27.10107421875, -26.103515625, -25.10595703125, -24.1083984375, -23.11083984375, -22.11328125, -21.11572265625, -20.1181640625, -19.12060546875, -18.123046875, -17.12548828125, -16.1279296875, -15.13037109375, -14.1328125, -13.13525390625, -12.1376953125, -11.14013671875, -10.142578125, -9.14501953125, -8.1474609375, -7.14990234375, -6.15234375, -5.15478515625, -4.1572265625, -3.15966796875, -2.162109375, -1.16455078125, -0.1669921875, 0.83056640625, 1.828125, 2.82568359375, 3.8232421875, 4.82080078125, 5.818359375, 6.81591796875, 7.8134765625, 8.81103515625, 9.80859375, 10.80615234375, 11.8037109375, 12.80126953125, 13.798828125, 14.79638671875, 15.7939453125, 16.79150390625, 17.7890625, 18.78662109375, 19.7841796875, 20.78173828125, 21.779296875, 22.77685546875, 23.7744140625, 24.77197265625, 25.76953125, 26.76708984375, 27.7646484375, 28.76220703125, 29.759765625, 30.75732421875, 31.7548828125, 32.75244140625, 33.75]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 7.0, 3.0, 4.0, 6.0, 6.0, 15.0, 13.0, 9.0, 13.0, 18.0, 19.0, 28.0, 31.0, 20.0, 25.0, 33.0, 30.0, 38.0, 55.0, 35.0, 56.0, 43.0, 45.0, 43.0, 39.0, 36.0, 43.0, 44.0, 29.0, 32.0, 27.0, 26.0, 27.0, 17.0, 13.0, 16.0, 8.0, 16.0, 7.0, 4.0, 8.0, 6.0, 3.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.515625, -18.951904296875, -18.38818359375, -17.824462890625, -17.2607421875, -16.697021484375, -16.13330078125, -15.569580078125, -15.005859375, -14.442138671875, -13.87841796875, -13.314697265625, -12.7509765625, -12.187255859375, -11.62353515625, -11.059814453125, -10.49609375, -9.932373046875, -9.36865234375, -8.804931640625, -8.2412109375, -7.677490234375, -7.11376953125, -6.550048828125, -5.986328125, -5.422607421875, -4.85888671875, -4.295166015625, -3.7314453125, -3.167724609375, -2.60400390625, -2.040283203125, -1.4765625, -0.912841796875, -0.34912109375, 0.214599609375, 0.7783203125, 1.342041015625, 1.90576171875, 2.469482421875, 3.033203125, 3.596923828125, 4.16064453125, 4.724365234375, 5.2880859375, 5.851806640625, 6.41552734375, 6.979248046875, 7.54296875, 8.106689453125, 8.67041015625, 9.234130859375, 9.7978515625, 10.361572265625, 10.92529296875, 11.489013671875, 12.052734375, 12.616455078125, 13.18017578125, 13.743896484375, 14.3076171875, 14.871337890625, 15.43505859375, 15.998779296875, 16.5625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 7.0, 7.0, 8.0, 16.0, 30.0, 34.0, 36.0, 44.0, 63.0, 83.0, 118.0, 184.0, 254.0, 378.0, 486.0, 736.0, 1191.0, 1662.0, 2621.0, 4208.0, 7303.0, 13662.0, 31133.0, 87290.0, 265575.0, 377011.0, 157424.0, 51213.0, 20405.0, 9889.0, 5596.0, 3351.0, 2093.0, 1415.0, 904.0, 606.0, 447.0, 292.0, 231.0, 168.0, 115.0, 74.0, 55.0, 44.0, 26.0, 20.0, 15.0, 9.0, 11.0, 5.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.34375, -36.18603515625, -35.0283203125, -33.87060546875, -32.712890625, -31.55517578125, -30.3974609375, -29.23974609375, -28.08203125, -26.92431640625, -25.7666015625, -24.60888671875, -23.451171875, -22.29345703125, -21.1357421875, -19.97802734375, -18.8203125, -17.66259765625, -16.5048828125, -15.34716796875, -14.189453125, -13.03173828125, -11.8740234375, -10.71630859375, -9.55859375, -8.40087890625, -7.2431640625, -6.08544921875, -4.927734375, -3.77001953125, -2.6123046875, -1.45458984375, -0.296875, 0.86083984375, 2.0185546875, 3.17626953125, 4.333984375, 5.49169921875, 6.6494140625, 7.80712890625, 8.96484375, 10.12255859375, 11.2802734375, 12.43798828125, 13.595703125, 14.75341796875, 15.9111328125, 17.06884765625, 18.2265625, 19.38427734375, 20.5419921875, 21.69970703125, 22.857421875, 24.01513671875, 25.1728515625, 26.33056640625, 27.48828125, 28.64599609375, 29.8037109375, 30.96142578125, 32.119140625, 33.27685546875, 34.4345703125, 35.59228515625, 36.75]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 3.0, 5.0, 5.0, 6.0, 4.0, 9.0, 12.0, 12.0, 12.0, 19.0, 14.0, 17.0, 29.0, 46.0, 61.0, 55.0, 59.0, 76.0, 66.0, 81.0, 74.0, 62.0, 50.0, 37.0, 45.0, 34.0, 13.0, 19.0, 8.0, 14.0, 11.0, 8.0, 7.0, 6.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002613067626953125, -0.0025361180305480957, -0.0024591684341430664, -0.002382218837738037, -0.002305269241333008, -0.0022283196449279785, -0.0021513700485229492, -0.00207442045211792, -0.0019974708557128906, -0.0019205212593078613, -0.001843571662902832, -0.0017666220664978027, -0.0016896724700927734, -0.0016127228736877441, -0.0015357732772827148, -0.0014588236808776855, -0.0013818740844726562, -0.001304924488067627, -0.0012279748916625977, -0.0011510252952575684, -0.001074075698852539, -0.0009971261024475098, -0.0009201765060424805, -0.0008432269096374512, -0.0007662773132324219, -0.0006893277168273926, -0.0006123781204223633, -0.000535428524017334, -0.0004584789276123047, -0.0003815293312072754, -0.0003045797348022461, -0.0002276301383972168, -0.0001506805419921875, -7.37309455871582e-05, 3.2186508178710938e-06, 8.016824722290039e-05, 0.0001571178436279297, 0.00023406744003295898, 0.0003110170364379883, 0.0003879666328430176, 0.0004649162292480469, 0.0005418658256530762, 0.0006188154220581055, 0.0006957650184631348, 0.0007727146148681641, 0.0008496642112731934, 0.0009266138076782227, 0.001003563404083252, 0.0010805130004882812, 0.0011574625968933105, 0.0012344121932983398, 0.0013113617897033691, 0.0013883113861083984, 0.0014652609825134277, 0.001542210578918457, 0.0016191601753234863, 0.0016961097717285156, 0.001773059368133545, 0.0018500089645385742, 0.0019269585609436035, 0.002003908157348633, 0.002080857753753662, 0.0021578073501586914, 0.0022347569465637207, 0.00231170654296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 9.0, 11.0, 12.0, 14.0, 29.0, 43.0, 54.0, 63.0, 104.0, 124.0, 156.0, 243.0, 326.0, 435.0, 575.0, 792.0, 1080.0, 1484.0, 2234.0, 3223.0, 4800.0, 7469.0, 12776.0, 23292.0, 50112.0, 117597.0, 244449.0, 281861.0, 155904.0, 66727.0, 30216.0, 15253.0, 8999.0, 5569.0, 3705.0, 2519.0, 1781.0, 1230.0, 887.0, 653.0, 520.0, 327.0, 248.0, 187.0, 135.0, 98.0, 74.0, 47.0, 32.0, 25.0, 19.0, 15.0, 10.0, 6.0, 6.0, 1.0, 4.0, 2.0], "bins": [-26.96875, -26.15576171875, -25.3427734375, -24.52978515625, -23.716796875, -22.90380859375, -22.0908203125, -21.27783203125, -20.46484375, -19.65185546875, -18.8388671875, -18.02587890625, -17.212890625, -16.39990234375, -15.5869140625, -14.77392578125, -13.9609375, -13.14794921875, -12.3349609375, -11.52197265625, -10.708984375, -9.89599609375, -9.0830078125, -8.27001953125, -7.45703125, -6.64404296875, -5.8310546875, -5.01806640625, -4.205078125, -3.39208984375, -2.5791015625, -1.76611328125, -0.953125, -0.14013671875, 0.6728515625, 1.48583984375, 2.298828125, 3.11181640625, 3.9248046875, 4.73779296875, 5.55078125, 6.36376953125, 7.1767578125, 7.98974609375, 8.802734375, 9.61572265625, 10.4287109375, 11.24169921875, 12.0546875, 12.86767578125, 13.6806640625, 14.49365234375, 15.306640625, 16.11962890625, 16.9326171875, 17.74560546875, 18.55859375, 19.37158203125, 20.1845703125, 20.99755859375, 21.810546875, 22.62353515625, 23.4365234375, 24.24951171875, 25.0625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 3.0, 10.0, 10.0, 8.0, 16.0, 10.0, 19.0, 22.0, 41.0, 37.0, 49.0, 59.0, 64.0, 105.0, 79.0, 85.0, 66.0, 50.0, 45.0, 42.0, 38.0, 26.0, 16.0, 19.0, 15.0, 12.0, 7.0, 5.0, 10.0, 5.0, 1.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-9.25, -8.972900390625, -8.69580078125, -8.418701171875, -8.1416015625, -7.864501953125, -7.58740234375, -7.310302734375, -7.033203125, -6.756103515625, -6.47900390625, -6.201904296875, -5.9248046875, -5.647705078125, -5.37060546875, -5.093505859375, -4.81640625, -4.539306640625, -4.26220703125, -3.985107421875, -3.7080078125, -3.430908203125, -3.15380859375, -2.876708984375, -2.599609375, -2.322509765625, -2.04541015625, -1.768310546875, -1.4912109375, -1.214111328125, -0.93701171875, -0.659912109375, -0.3828125, -0.105712890625, 0.17138671875, 0.448486328125, 0.7255859375, 1.002685546875, 1.27978515625, 1.556884765625, 1.833984375, 2.111083984375, 2.38818359375, 2.665283203125, 2.9423828125, 3.219482421875, 3.49658203125, 3.773681640625, 4.05078125, 4.327880859375, 4.60498046875, 4.882080078125, 5.1591796875, 5.436279296875, 5.71337890625, 5.990478515625, 6.267578125, 6.544677734375, 6.82177734375, 7.098876953125, 7.3759765625, 7.653076171875, 7.93017578125, 8.207275390625, 8.484375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 8.0, 6.0, 15.0, 19.0, 23.0, 26.0, 35.0, 41.0, 57.0, 49.0, 62.0, 67.0, 75.0, 41.0, 52.0, 70.0, 66.0, 45.0, 41.0, 38.0, 38.0, 30.0, 21.0, 7.0, 22.0, 9.0, 11.0, 10.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.146114349365234, -31.970399856567383, -30.79468536376953, -29.61897087097168, -28.443256378173828, -27.267539978027344, -26.091825485229492, -24.91611099243164, -23.74039649963379, -22.564682006835938, -21.388967514038086, -20.213253021240234, -19.03753662109375, -17.86182403564453, -16.686107635498047, -15.510393142700195, -14.334678649902344, -13.158964157104492, -11.98324966430664, -10.807534217834473, -9.631819725036621, -8.45610523223877, -7.28039026260376, -6.10467529296875, -4.928960800170898, -3.7532460689544678, -2.577531337738037, -1.4018166065216064, -0.22610187530517578, 0.9496126174926758, 2.1253275871276855, 3.3010425567626953, 4.4767608642578125, 5.652475357055664, 6.828190326690674, 8.003905296325684, 9.179619789123535, 10.355334281921387, 11.531049728393555, 12.706764221191406, 13.882478713989258, 15.05819320678711, 16.23390769958496, 17.409622192382812, 18.585338592529297, 19.761051177978516, 20.936767578125, 22.11248207092285, 23.288196563720703, 24.463911056518555, 25.639625549316406, 26.815340042114258, 27.99105453491211, 29.166770935058594, 30.342485427856445, 31.518199920654297, 32.69391632080078, 33.869632720947266, 35.045345306396484, 36.22106170654297, 37.39677429199219, 38.57249069213867, 39.74820327758789, 40.923919677734375, 42.099632263183594]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 10.0, 9.0, 11.0, 16.0, 25.0, 10.0, 19.0, 32.0, 21.0, 24.0, 24.0, 21.0, 26.0, 33.0, 27.0, 47.0, 40.0, 40.0, 45.0, 50.0, 45.0, 41.0, 41.0, 35.0, 30.0, 40.0, 40.0, 15.0, 26.0, 30.0, 24.0, 25.0, 14.0, 14.0, 8.0, 9.0, 8.0, 3.0, 6.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-28.99245834350586, -28.15785026550293, -27.3232421875, -26.48863410949707, -25.65402603149414, -24.81941795349121, -23.98480987548828, -23.15020179748535, -22.315593719482422, -21.480985641479492, -20.646377563476562, -19.811769485473633, -18.977161407470703, -18.142553329467773, -17.307945251464844, -16.473337173461914, -15.638729095458984, -14.804121017456055, -13.969512939453125, -13.134904861450195, -12.300296783447266, -11.465688705444336, -10.631080627441406, -9.796472549438477, -8.961864471435547, -8.127256393432617, -7.2926483154296875, -6.458040237426758, -5.623432159423828, -4.788824081420898, -3.9542160034179688, -3.119607925415039, -2.2849998474121094, -1.4503917694091797, -0.61578369140625, 0.2188243865966797, 1.0534324645996094, 1.888040542602539, 2.7226486206054688, 3.5572566986083984, 4.391864776611328, 5.226472854614258, 6.0610809326171875, 6.895689010620117, 7.730297088623047, 8.564905166625977, 9.399513244628906, 10.234121322631836, 11.068729400634766, 11.903337478637695, 12.737945556640625, 13.572553634643555, 14.407161712646484, 15.241769790649414, 16.076377868652344, 16.910985946655273, 17.745594024658203, 18.580202102661133, 19.414810180664062, 20.249418258666992, 21.084026336669922, 21.91863441467285, 22.75324249267578, 23.58785057067871, 24.42245864868164]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 6.0, 11.0, 11.0, 17.0, 41.0, 41.0, 77.0, 82.0, 142.0, 257.0, 359.0, 587.0, 1012.0, 1684.0, 2851.0, 4798.0, 8103.0, 14293.0, 26355.0, 48138.0, 93935.0, 191044.0, 409254.0, 785075.0, 1017686.0, 781667.0, 413493.0, 193334.0, 92919.0, 47677.0, 25414.0, 14013.0, 7964.0, 4750.0, 2846.0, 1702.0, 957.0, 618.0, 333.0, 262.0, 147.0, 118.0, 60.0, 53.0, 34.0, 19.0, 23.0, 9.0, 7.0, 5.0, 3.0, 6.0, 2.0, 0.0, 2.0], "bins": [-33.125, -32.13623046875, -31.1474609375, -30.15869140625, -29.169921875, -28.18115234375, -27.1923828125, -26.20361328125, -25.21484375, -24.22607421875, -23.2373046875, -22.24853515625, -21.259765625, -20.27099609375, -19.2822265625, -18.29345703125, -17.3046875, -16.31591796875, -15.3271484375, -14.33837890625, -13.349609375, -12.36083984375, -11.3720703125, -10.38330078125, -9.39453125, -8.40576171875, -7.4169921875, -6.42822265625, -5.439453125, -4.45068359375, -3.4619140625, -2.47314453125, -1.484375, -0.49560546875, 0.4931640625, 1.48193359375, 2.470703125, 3.45947265625, 4.4482421875, 5.43701171875, 6.42578125, 7.41455078125, 8.4033203125, 9.39208984375, 10.380859375, 11.36962890625, 12.3583984375, 13.34716796875, 14.3359375, 15.32470703125, 16.3134765625, 17.30224609375, 18.291015625, 19.27978515625, 20.2685546875, 21.25732421875, 22.24609375, 23.23486328125, 24.2236328125, 25.21240234375, 26.201171875, 27.18994140625, 28.1787109375, 29.16748046875, 30.15625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 12.0, 16.0, 16.0, 14.0, 19.0, 22.0, 17.0, 20.0, 26.0, 27.0, 32.0, 34.0, 31.0, 47.0, 39.0, 33.0, 36.0, 49.0, 37.0, 41.0, 51.0, 39.0, 55.0, 25.0, 29.0, 30.0, 25.0, 23.0, 25.0, 28.0, 16.0, 12.0, 12.0, 8.0, 7.0, 5.0, 10.0, 2.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.46875, -20.763671875, -20.05859375, -19.353515625, -18.6484375, -17.943359375, -17.23828125, -16.533203125, -15.828125, -15.123046875, -14.41796875, -13.712890625, -13.0078125, -12.302734375, -11.59765625, -10.892578125, -10.1875, -9.482421875, -8.77734375, -8.072265625, -7.3671875, -6.662109375, -5.95703125, -5.251953125, -4.546875, -3.841796875, -3.13671875, -2.431640625, -1.7265625, -1.021484375, -0.31640625, 0.388671875, 1.09375, 1.798828125, 2.50390625, 3.208984375, 3.9140625, 4.619140625, 5.32421875, 6.029296875, 6.734375, 7.439453125, 8.14453125, 8.849609375, 9.5546875, 10.259765625, 10.96484375, 11.669921875, 12.375, 13.080078125, 13.78515625, 14.490234375, 15.1953125, 15.900390625, 16.60546875, 17.310546875, 18.015625, 18.720703125, 19.42578125, 20.130859375, 20.8359375, 21.541015625, 22.24609375, 22.951171875, 23.65625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 4.0, 8.0, 10.0, 11.0, 16.0, 39.0, 50.0, 59.0, 98.0, 141.0, 223.0, 385.0, 529.0, 818.0, 1305.0, 2096.0, 3269.0, 5137.0, 8536.0, 14480.0, 25285.0, 44260.0, 81035.0, 148131.0, 273714.0, 492411.0, 778330.0, 871112.0, 629407.0, 365439.0, 199602.0, 107925.0, 59267.0, 33178.0, 18928.0, 11202.0, 6662.0, 4077.0, 2495.0, 1628.0, 1048.0, 618.0, 439.0, 286.0, 218.0, 125.0, 82.0, 56.0, 35.0, 31.0, 16.0, 11.0, 9.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-29.28125, -28.31298828125, -27.3447265625, -26.37646484375, -25.408203125, -24.43994140625, -23.4716796875, -22.50341796875, -21.53515625, -20.56689453125, -19.5986328125, -18.63037109375, -17.662109375, -16.69384765625, -15.7255859375, -14.75732421875, -13.7890625, -12.82080078125, -11.8525390625, -10.88427734375, -9.916015625, -8.94775390625, -7.9794921875, -7.01123046875, -6.04296875, -5.07470703125, -4.1064453125, -3.13818359375, -2.169921875, -1.20166015625, -0.2333984375, 0.73486328125, 1.703125, 2.67138671875, 3.6396484375, 4.60791015625, 5.576171875, 6.54443359375, 7.5126953125, 8.48095703125, 9.44921875, 10.41748046875, 11.3857421875, 12.35400390625, 13.322265625, 14.29052734375, 15.2587890625, 16.22705078125, 17.1953125, 18.16357421875, 19.1318359375, 20.10009765625, 21.068359375, 22.03662109375, 23.0048828125, 23.97314453125, 24.94140625, 25.90966796875, 26.8779296875, 27.84619140625, 28.814453125, 29.78271484375, 30.7509765625, 31.71923828125, 32.6875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 4.0, 10.0, 7.0, 14.0, 19.0, 34.0, 29.0, 51.0, 76.0, 87.0, 108.0, 126.0, 174.0, 174.0, 238.0, 256.0, 279.0, 318.0, 301.0, 297.0, 304.0, 246.0, 188.0, 151.0, 112.0, 90.0, 90.0, 55.0, 60.0, 35.0, 31.0, 30.0, 15.0, 12.0, 18.0, 7.0, 4.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.6875, -13.2861328125, -12.884765625, -12.4833984375, -12.08203125, -11.6806640625, -11.279296875, -10.8779296875, -10.4765625, -10.0751953125, -9.673828125, -9.2724609375, -8.87109375, -8.4697265625, -8.068359375, -7.6669921875, -7.265625, -6.8642578125, -6.462890625, -6.0615234375, -5.66015625, -5.2587890625, -4.857421875, -4.4560546875, -4.0546875, -3.6533203125, -3.251953125, -2.8505859375, -2.44921875, -2.0478515625, -1.646484375, -1.2451171875, -0.84375, -0.4423828125, -0.041015625, 0.3603515625, 0.76171875, 1.1630859375, 1.564453125, 1.9658203125, 2.3671875, 2.7685546875, 3.169921875, 3.5712890625, 3.97265625, 4.3740234375, 4.775390625, 5.1767578125, 5.578125, 5.9794921875, 6.380859375, 6.7822265625, 7.18359375, 7.5849609375, 7.986328125, 8.3876953125, 8.7890625, 9.1904296875, 9.591796875, 9.9931640625, 10.39453125, 10.7958984375, 11.197265625, 11.5986328125, 12.0]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 9.0, 6.0, 5.0, 12.0, 18.0, 12.0, 26.0, 18.0, 21.0, 32.0, 29.0, 45.0, 46.0, 56.0, 63.0, 67.0, 49.0, 63.0, 62.0, 43.0, 49.0, 37.0, 32.0, 39.0, 29.0, 24.0, 29.0, 20.0, 13.0, 10.0, 8.0, 7.0, 6.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.22088623046875, -33.20854568481445, -32.19620895385742, -31.183870315551758, -30.171531677246094, -29.159191131591797, -28.146852493286133, -27.13451385498047, -26.122175216674805, -25.10983657836914, -24.097497940063477, -23.085159301757812, -22.072818756103516, -21.060482025146484, -20.048141479492188, -19.035802841186523, -18.02346420288086, -17.011125564575195, -15.998786926269531, -14.98644733428955, -13.974108695983887, -12.961770057678223, -11.949430465698242, -10.937091827392578, -9.924753189086914, -8.91241455078125, -7.900075435638428, -6.8877363204956055, -5.875397682189941, -4.863059043884277, -3.850719928741455, -2.838380813598633, -1.8260459899902344, -0.8137071132659912, 0.19863176345825195, 1.2109706401824951, 2.2233095169067383, 3.2356481552124023, 4.247987270355225, 5.260326385498047, 6.272665023803711, 7.285003662109375, 8.297342300415039, 9.30968189239502, 10.322020530700684, 11.334359169006348, 12.346698760986328, 13.359037399291992, 14.371376037597656, 15.38371467590332, 16.396053314208984, 17.40839195251465, 18.420730590820312, 19.43307113647461, 20.445409774780273, 21.457748413085938, 22.4700870513916, 23.482425689697266, 24.49476432800293, 25.507102966308594, 26.51944351196289, 27.531780242919922, 28.54412078857422, 29.556459426879883, 30.568798065185547]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 3.0, 12.0, 10.0, 18.0, 13.0, 12.0, 14.0, 21.0, 12.0, 25.0, 27.0, 27.0, 34.0, 30.0, 35.0, 50.0, 30.0, 38.0, 40.0, 38.0, 37.0, 41.0, 43.0, 43.0, 35.0, 36.0, 32.0, 39.0, 27.0, 27.0, 20.0, 31.0, 14.0, 15.0, 11.0, 7.0, 12.0, 8.0, 9.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-26.25445556640625, -25.47844123840332, -24.702425003051758, -23.926410675048828, -23.150394439697266, -22.374380111694336, -21.598365783691406, -20.822349548339844, -20.04633331298828, -19.27031898498535, -18.49430274963379, -17.71828842163086, -16.942272186279297, -16.166257858276367, -15.390242576599121, -14.614227294921875, -13.838212966918945, -13.0621976852417, -12.286182403564453, -11.510168075561523, -10.734151840209961, -9.958137512207031, -9.182122230529785, -8.406106948852539, -7.630091667175293, -6.854076385498047, -6.078061103820801, -5.302046298980713, -4.526031017303467, -3.7500157356262207, -2.974000930786133, -2.1979856491088867, -1.4219703674316406, -0.6459552049636841, 0.13005995750427246, 0.9060750007629395, 1.6820902824401855, 2.4581055641174316, 3.2341203689575195, 4.010135650634766, 4.786150932312012, 5.562166213989258, 6.338181495666504, 7.114196300506592, 7.890211582183838, 8.666227340698242, 9.442241668701172, 10.218256950378418, 10.994272232055664, 11.77028751373291, 12.546302795410156, 13.322317123413086, 14.098333358764648, 14.874347686767578, 15.650362968444824, 16.42637825012207, 17.202392578125, 17.97840690612793, 18.754423141479492, 19.530437469482422, 20.306453704833984, 21.082468032836914, 21.858482360839844, 22.634498596191406, 23.41051483154297]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 3.0, 6.0, 11.0, 15.0, 20.0, 23.0, 43.0, 42.0, 79.0, 125.0, 152.0, 222.0, 322.0, 414.0, 634.0, 971.0, 1380.0, 2269.0, 3348.0, 5672.0, 9850.0, 18484.0, 36941.0, 78072.0, 158764.0, 251676.0, 226544.0, 126391.0, 60811.0, 28912.0, 14775.0, 8073.0, 4719.0, 2882.0, 1936.0, 1246.0, 851.0, 570.0, 423.0, 259.0, 180.0, 131.0, 96.0, 57.0, 65.0, 30.0, 20.0, 18.0, 12.0, 8.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.09375, -29.0849609375, -28.076171875, -27.0673828125, -26.05859375, -25.0498046875, -24.041015625, -23.0322265625, -22.0234375, -21.0146484375, -20.005859375, -18.9970703125, -17.98828125, -16.9794921875, -15.970703125, -14.9619140625, -13.953125, -12.9443359375, -11.935546875, -10.9267578125, -9.91796875, -8.9091796875, -7.900390625, -6.8916015625, -5.8828125, -4.8740234375, -3.865234375, -2.8564453125, -1.84765625, -0.8388671875, 0.169921875, 1.1787109375, 2.1875, 3.1962890625, 4.205078125, 5.2138671875, 6.22265625, 7.2314453125, 8.240234375, 9.2490234375, 10.2578125, 11.2666015625, 12.275390625, 13.2841796875, 14.29296875, 15.3017578125, 16.310546875, 17.3193359375, 18.328125, 19.3369140625, 20.345703125, 21.3544921875, 22.36328125, 23.3720703125, 24.380859375, 25.3896484375, 26.3984375, 27.4072265625, 28.416015625, 29.4248046875, 30.43359375, 31.4423828125, 32.451171875, 33.4599609375, 34.46875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 6.0, 6.0, 10.0, 13.0, 10.0, 19.0, 17.0, 9.0, 15.0, 26.0, 25.0, 17.0, 33.0, 28.0, 37.0, 38.0, 39.0, 46.0, 42.0, 36.0, 45.0, 42.0, 38.0, 46.0, 36.0, 40.0, 44.0, 33.0, 35.0, 23.0, 22.0, 21.0, 16.0, 19.0, 12.0, 17.0, 8.0, 3.0, 10.0, 3.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-29.5, -28.65673828125, -27.8134765625, -26.97021484375, -26.126953125, -25.28369140625, -24.4404296875, -23.59716796875, -22.75390625, -21.91064453125, -21.0673828125, -20.22412109375, -19.380859375, -18.53759765625, -17.6943359375, -16.85107421875, -16.0078125, -15.16455078125, -14.3212890625, -13.47802734375, -12.634765625, -11.79150390625, -10.9482421875, -10.10498046875, -9.26171875, -8.41845703125, -7.5751953125, -6.73193359375, -5.888671875, -5.04541015625, -4.2021484375, -3.35888671875, -2.515625, -1.67236328125, -0.8291015625, 0.01416015625, 0.857421875, 1.70068359375, 2.5439453125, 3.38720703125, 4.23046875, 5.07373046875, 5.9169921875, 6.76025390625, 7.603515625, 8.44677734375, 9.2900390625, 10.13330078125, 10.9765625, 11.81982421875, 12.6630859375, 13.50634765625, 14.349609375, 15.19287109375, 16.0361328125, 16.87939453125, 17.72265625, 18.56591796875, 19.4091796875, 20.25244140625, 21.095703125, 21.93896484375, 22.7822265625, 23.62548828125, 24.46875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 8.0, 7.0, 16.0, 19.0, 13.0, 38.0, 55.0, 75.0, 79.0, 120.0, 181.0, 280.0, 407.0, 613.0, 912.0, 1392.0, 2110.0, 3481.0, 5805.0, 10017.0, 18332.0, 34565.0, 68868.0, 139676.0, 245364.0, 239120.0, 134452.0, 66647.0, 33645.0, 17384.0, 9728.0, 5656.0, 3290.0, 2072.0, 1363.0, 877.0, 570.0, 406.0, 295.0, 181.0, 116.0, 86.0, 71.0, 42.0, 26.0, 36.0, 13.0, 11.0, 6.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0], "bins": [-31.609375, -30.588623046875, -29.56787109375, -28.547119140625, -27.5263671875, -26.505615234375, -25.48486328125, -24.464111328125, -23.443359375, -22.422607421875, -21.40185546875, -20.381103515625, -19.3603515625, -18.339599609375, -17.31884765625, -16.298095703125, -15.27734375, -14.256591796875, -13.23583984375, -12.215087890625, -11.1943359375, -10.173583984375, -9.15283203125, -8.132080078125, -7.111328125, -6.090576171875, -5.06982421875, -4.049072265625, -3.0283203125, -2.007568359375, -0.98681640625, 0.033935546875, 1.0546875, 2.075439453125, 3.09619140625, 4.116943359375, 5.1376953125, 6.158447265625, 7.17919921875, 8.199951171875, 9.220703125, 10.241455078125, 11.26220703125, 12.282958984375, 13.3037109375, 14.324462890625, 15.34521484375, 16.365966796875, 17.38671875, 18.407470703125, 19.42822265625, 20.448974609375, 21.4697265625, 22.490478515625, 23.51123046875, 24.531982421875, 25.552734375, 26.573486328125, 27.59423828125, 28.614990234375, 29.6357421875, 30.656494140625, 31.67724609375, 32.697998046875, 33.71875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 5.0, 5.0, 5.0, 10.0, 8.0, 8.0, 13.0, 22.0, 18.0, 17.0, 25.0, 37.0, 26.0, 43.0, 39.0, 47.0, 44.0, 60.0, 47.0, 30.0, 48.0, 50.0, 41.0, 40.0, 41.0, 31.0, 27.0, 34.0, 30.0, 35.0, 22.0, 17.0, 14.0, 13.0, 13.0, 6.0, 9.0, 10.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.3125, -17.652099609375, -16.99169921875, -16.331298828125, -15.6708984375, -15.010498046875, -14.35009765625, -13.689697265625, -13.029296875, -12.368896484375, -11.70849609375, -11.048095703125, -10.3876953125, -9.727294921875, -9.06689453125, -8.406494140625, -7.74609375, -7.085693359375, -6.42529296875, -5.764892578125, -5.1044921875, -4.444091796875, -3.78369140625, -3.123291015625, -2.462890625, -1.802490234375, -1.14208984375, -0.481689453125, 0.1787109375, 0.839111328125, 1.49951171875, 2.159912109375, 2.8203125, 3.480712890625, 4.14111328125, 4.801513671875, 5.4619140625, 6.122314453125, 6.78271484375, 7.443115234375, 8.103515625, 8.763916015625, 9.42431640625, 10.084716796875, 10.7451171875, 11.405517578125, 12.06591796875, 12.726318359375, 13.38671875, 14.047119140625, 14.70751953125, 15.367919921875, 16.0283203125, 16.688720703125, 17.34912109375, 18.009521484375, 18.669921875, 19.330322265625, 19.99072265625, 20.651123046875, 21.3115234375, 21.971923828125, 22.63232421875, 23.292724609375, 23.953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 5.0, 3.0, 7.0, 3.0, 5.0, 10.0, 22.0, 10.0, 26.0, 36.0, 33.0, 61.0, 78.0, 107.0, 153.0, 245.0, 367.0, 593.0, 893.0, 1463.0, 2656.0, 5200.0, 12005.0, 36199.0, 167381.0, 570946.0, 186039.0, 38664.0, 12764.0, 5455.0, 2787.0, 1557.0, 946.0, 584.0, 391.0, 241.0, 161.0, 132.0, 89.0, 73.0, 54.0, 38.0, 19.0, 14.0, 11.0, 11.0, 7.0, 8.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0], "bins": [-28.625, -27.8193359375, -27.013671875, -26.2080078125, -25.40234375, -24.5966796875, -23.791015625, -22.9853515625, -22.1796875, -21.3740234375, -20.568359375, -19.7626953125, -18.95703125, -18.1513671875, -17.345703125, -16.5400390625, -15.734375, -14.9287109375, -14.123046875, -13.3173828125, -12.51171875, -11.7060546875, -10.900390625, -10.0947265625, -9.2890625, -8.4833984375, -7.677734375, -6.8720703125, -6.06640625, -5.2607421875, -4.455078125, -3.6494140625, -2.84375, -2.0380859375, -1.232421875, -0.4267578125, 0.37890625, 1.1845703125, 1.990234375, 2.7958984375, 3.6015625, 4.4072265625, 5.212890625, 6.0185546875, 6.82421875, 7.6298828125, 8.435546875, 9.2412109375, 10.046875, 10.8525390625, 11.658203125, 12.4638671875, 13.26953125, 14.0751953125, 14.880859375, 15.6865234375, 16.4921875, 17.2978515625, 18.103515625, 18.9091796875, 19.71484375, 20.5205078125, 21.326171875, 22.1318359375, 22.9375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 9.0, 10.0, 11.0, 14.0, 25.0, 23.0, 41.0, 32.0, 50.0, 70.0, 85.0, 106.0, 81.0, 82.0, 77.0, 56.0, 39.0, 29.0, 32.0, 23.0, 16.0, 8.0, 13.0, 6.0, 12.0, 8.0, 2.0, 3.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.001216888427734375, -0.001173555850982666, -0.001130223274230957, -0.001086890697479248, -0.001043558120727539, -0.00100022554397583, -0.0009568929672241211, -0.0009135603904724121, -0.0008702278137207031, -0.0008268952369689941, -0.0007835626602172852, -0.0007402300834655762, -0.0006968975067138672, -0.0006535649299621582, -0.0006102323532104492, -0.0005668997764587402, -0.0005235671997070312, -0.00048023462295532227, -0.0004369020462036133, -0.0003935694694519043, -0.0003502368927001953, -0.00030690431594848633, -0.00026357173919677734, -0.00022023916244506836, -0.00017690658569335938, -0.0001335740089416504, -9.02414321899414e-05, -4.690885543823242e-05, -3.5762786865234375e-06, 3.975629806518555e-05, 8.308887481689453e-05, 0.00012642145156860352, 0.0001697540283203125, 0.00021308660507202148, 0.00025641918182373047, 0.00029975175857543945, 0.00034308433532714844, 0.0003864169120788574, 0.0004297494888305664, 0.0004730820655822754, 0.0005164146423339844, 0.0005597472190856934, 0.0006030797958374023, 0.0006464123725891113, 0.0006897449493408203, 0.0007330775260925293, 0.0007764101028442383, 0.0008197426795959473, 0.0008630752563476562, 0.0009064078330993652, 0.0009497404098510742, 0.0009930729866027832, 0.0010364055633544922, 0.0010797381401062012, 0.0011230707168579102, 0.0011664032936096191, 0.0012097358703613281, 0.0012530684471130371, 0.001296401023864746, 0.001339733600616455, 0.001383066177368164, 0.001426398754119873, 0.001469731330871582, 0.001513063907623291, 0.001556396484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 12.0, 10.0, 17.0, 28.0, 43.0, 50.0, 71.0, 76.0, 102.0, 188.0, 252.0, 342.0, 467.0, 661.0, 881.0, 1339.0, 1974.0, 3421.0, 6219.0, 14012.0, 41340.0, 156644.0, 457157.0, 258123.0, 65021.0, 20191.0, 8298.0, 4142.0, 2308.0, 1564.0, 1079.0, 734.0, 491.0, 352.0, 259.0, 164.0, 157.0, 106.0, 75.0, 56.0, 33.0, 27.0, 21.0, 11.0, 12.0, 10.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-24.546875, -23.746826171875, -22.94677734375, -22.146728515625, -21.3466796875, -20.546630859375, -19.74658203125, -18.946533203125, -18.146484375, -17.346435546875, -16.54638671875, -15.746337890625, -14.9462890625, -14.146240234375, -13.34619140625, -12.546142578125, -11.74609375, -10.946044921875, -10.14599609375, -9.345947265625, -8.5458984375, -7.745849609375, -6.94580078125, -6.145751953125, -5.345703125, -4.545654296875, -3.74560546875, -2.945556640625, -2.1455078125, -1.345458984375, -0.54541015625, 0.254638671875, 1.0546875, 1.854736328125, 2.65478515625, 3.454833984375, 4.2548828125, 5.054931640625, 5.85498046875, 6.655029296875, 7.455078125, 8.255126953125, 9.05517578125, 9.855224609375, 10.6552734375, 11.455322265625, 12.25537109375, 13.055419921875, 13.85546875, 14.655517578125, 15.45556640625, 16.255615234375, 17.0556640625, 17.855712890625, 18.65576171875, 19.455810546875, 20.255859375, 21.055908203125, 21.85595703125, 22.656005859375, 23.4560546875, 24.256103515625, 25.05615234375, 25.856201171875, 26.65625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 6.0, 16.0, 17.0, 47.0, 64.0, 123.0, 191.0, 177.0, 150.0, 76.0, 31.0, 26.0, 18.0, 9.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8359375, -10.498291015625, -10.16064453125, -9.822998046875, -9.4853515625, -9.147705078125, -8.81005859375, -8.472412109375, -8.134765625, -7.797119140625, -7.45947265625, -7.121826171875, -6.7841796875, -6.446533203125, -6.10888671875, -5.771240234375, -5.43359375, -5.095947265625, -4.75830078125, -4.420654296875, -4.0830078125, -3.745361328125, -3.40771484375, -3.070068359375, -2.732421875, -2.394775390625, -2.05712890625, -1.719482421875, -1.3818359375, -1.044189453125, -0.70654296875, -0.368896484375, -0.03125, 0.306396484375, 0.64404296875, 0.981689453125, 1.3193359375, 1.656982421875, 1.99462890625, 2.332275390625, 2.669921875, 3.007568359375, 3.34521484375, 3.682861328125, 4.0205078125, 4.358154296875, 4.69580078125, 5.033447265625, 5.37109375, 5.708740234375, 6.04638671875, 6.384033203125, 6.7216796875, 7.059326171875, 7.39697265625, 7.734619140625, 8.072265625, 8.409912109375, 8.74755859375, 9.085205078125, 9.4228515625, 9.760498046875, 10.09814453125, 10.435791015625, 10.7734375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 9.0, 6.0, 3.0, 15.0, 12.0, 17.0, 23.0, 16.0, 29.0, 32.0, 41.0, 41.0, 47.0, 64.0, 61.0, 64.0, 56.0, 53.0, 46.0, 61.0, 52.0, 34.0, 41.0, 35.0, 26.0, 22.0, 19.0, 17.0, 12.0, 15.0, 5.0, 2.0, 5.0, 3.0, 9.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-38.39461135864258, -37.37541198730469, -36.35620880126953, -35.33700942993164, -34.317806243896484, -33.298606872558594, -32.27940368652344, -31.260204315185547, -30.24100112915039, -29.221799850463867, -28.202598571777344, -27.18339729309082, -26.164196014404297, -25.144994735717773, -24.12579345703125, -23.10659408569336, -22.087392807006836, -21.068191528320312, -20.04899024963379, -19.029788970947266, -18.010587692260742, -16.99138641357422, -15.972186088562012, -14.952984809875488, -13.933783531188965, -12.914582252502441, -11.895380973815918, -10.876180648803711, -9.856979370117188, -8.837778091430664, -7.818576812744141, -6.799375534057617, -5.780176162719727, -4.760974884033203, -3.741773843765259, -2.7225728034973145, -1.703371524810791, -0.6841702461242676, 0.33503055572509766, 1.354231834411621, 2.3734331130981445, 3.392634391784668, 4.411835670471191, 5.431036472320557, 6.45023775100708, 7.4694390296936035, 8.488639831542969, 9.507841110229492, 10.527042388916016, 11.546243667602539, 12.565444946289062, 13.584646224975586, 14.60384750366211, 15.623048782348633, 16.642250061035156, 17.661449432373047, 18.680652618408203, 19.699853897094727, 20.71905517578125, 21.738256454467773, 22.757457733154297, 23.77665901184082, 24.795860290527344, 25.815059661865234, 26.834260940551758]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 5.0, 5.0, 11.0, 15.0, 11.0, 12.0, 20.0, 12.0, 12.0, 18.0, 27.0, 25.0, 33.0, 34.0, 32.0, 35.0, 43.0, 43.0, 49.0, 39.0, 49.0, 44.0, 36.0, 44.0, 36.0, 37.0, 42.0, 33.0, 31.0, 21.0, 24.0, 18.0, 15.0, 16.0, 17.0, 13.0, 10.0, 5.0, 10.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-27.41048812866211, -26.582136154174805, -25.7537841796875, -24.925432205200195, -24.09708023071289, -23.268728256225586, -22.44037628173828, -21.61202621459961, -20.783672332763672, -19.955320358276367, -19.126968383789062, -18.298616409301758, -17.470264434814453, -16.64191246032715, -15.81356143951416, -14.985209465026855, -14.156858444213867, -13.328506469726562, -12.500154495239258, -11.671802520751953, -10.843450546264648, -10.015098571777344, -9.186747550964355, -8.35839557647705, -7.530043601989746, -6.701691627502441, -5.873339653015137, -5.04498815536499, -4.2166361808776855, -3.388284206390381, -2.5599327087402344, -1.7315807342529297, -0.9032268524169922, -0.07487499713897705, 0.7534768581390381, 1.5818285942077637, 2.4101805686950684, 3.238532543182373, 4.0668840408325195, 4.895236015319824, 5.723587989807129, 6.551939964294434, 7.380291938781738, 8.208642959594727, 9.036994934082031, 9.865346908569336, 10.69369888305664, 11.522050857543945, 12.35040283203125, 13.178754806518555, 14.00710678100586, 14.835458755493164, 15.663810729980469, 16.492162704467773, 17.320514678955078, 18.14886474609375, 18.977218627929688, 19.805570602416992, 20.633922576904297, 21.4622745513916, 22.290626525878906, 23.11897850036621, 23.947330474853516, 24.775680541992188, 25.604032516479492]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [6.0, 5.0, 6.0, 8.0, 8.0, 21.0, 25.0, 34.0, 76.0, 114.0, 157.0, 219.0, 352.0, 524.0, 770.0, 1195.0, 1851.0, 2763.0, 4231.0, 6705.0, 10238.0, 15846.0, 23611.0, 35473.0, 51175.0, 71283.0, 93891.0, 114369.0, 124486.0, 120001.0, 103018.0, 81177.0, 60085.0, 42131.0, 28254.0, 18824.0, 12237.0, 8066.0, 5423.0, 3357.0, 2248.0, 1496.0, 982.0, 635.0, 385.0, 265.0, 203.0, 108.0, 88.0, 47.0, 33.0, 23.0, 21.0, 8.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.234375, -20.4951171875, -19.755859375, -19.0166015625, -18.27734375, -17.5380859375, -16.798828125, -16.0595703125, -15.3203125, -14.5810546875, -13.841796875, -13.1025390625, -12.36328125, -11.6240234375, -10.884765625, -10.1455078125, -9.40625, -8.6669921875, -7.927734375, -7.1884765625, -6.44921875, -5.7099609375, -4.970703125, -4.2314453125, -3.4921875, -2.7529296875, -2.013671875, -1.2744140625, -0.53515625, 0.2041015625, 0.943359375, 1.6826171875, 2.421875, 3.1611328125, 3.900390625, 4.6396484375, 5.37890625, 6.1181640625, 6.857421875, 7.5966796875, 8.3359375, 9.0751953125, 9.814453125, 10.5537109375, 11.29296875, 12.0322265625, 12.771484375, 13.5107421875, 14.25, 14.9892578125, 15.728515625, 16.4677734375, 17.20703125, 17.9462890625, 18.685546875, 19.4248046875, 20.1640625, 20.9033203125, 21.642578125, 22.3818359375, 23.12109375, 23.8603515625, 24.599609375, 25.3388671875, 26.078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 5.0, 6.0, 4.0, 10.0, 9.0, 13.0, 10.0, 11.0, 16.0, 18.0, 21.0, 30.0, 19.0, 29.0, 33.0, 36.0, 29.0, 33.0, 41.0, 52.0, 47.0, 46.0, 42.0, 39.0, 36.0, 42.0, 38.0, 30.0, 37.0, 41.0, 25.0, 17.0, 24.0, 18.0, 18.0, 15.0, 15.0, 12.0, 10.0, 7.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-25.640625, -24.82861328125, -24.0166015625, -23.20458984375, -22.392578125, -21.58056640625, -20.7685546875, -19.95654296875, -19.14453125, -18.33251953125, -17.5205078125, -16.70849609375, -15.896484375, -15.08447265625, -14.2724609375, -13.46044921875, -12.6484375, -11.83642578125, -11.0244140625, -10.21240234375, -9.400390625, -8.58837890625, -7.7763671875, -6.96435546875, -6.15234375, -5.34033203125, -4.5283203125, -3.71630859375, -2.904296875, -2.09228515625, -1.2802734375, -0.46826171875, 0.34375, 1.15576171875, 1.9677734375, 2.77978515625, 3.591796875, 4.40380859375, 5.2158203125, 6.02783203125, 6.83984375, 7.65185546875, 8.4638671875, 9.27587890625, 10.087890625, 10.89990234375, 11.7119140625, 12.52392578125, 13.3359375, 14.14794921875, 14.9599609375, 15.77197265625, 16.583984375, 17.39599609375, 18.2080078125, 19.02001953125, 19.83203125, 20.64404296875, 21.4560546875, 22.26806640625, 23.080078125, 23.89208984375, 24.7041015625, 25.51611328125, 26.328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 11.0, 15.0, 29.0, 41.0, 52.0, 90.0, 156.0, 226.0, 357.0, 603.0, 955.0, 1483.0, 2519.0, 4256.0, 6886.0, 11770.0, 19133.0, 30908.0, 50875.0, 79786.0, 115669.0, 149662.0, 159265.0, 138178.0, 101016.0, 67076.0, 42365.0, 25654.0, 15617.0, 9205.0, 5761.0, 3484.0, 2100.0, 1241.0, 779.0, 486.0, 324.0, 202.0, 128.0, 64.0, 48.0, 39.0, 19.0, 9.0, 6.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.40625, -32.3720703125, -31.337890625, -30.3037109375, -29.26953125, -28.2353515625, -27.201171875, -26.1669921875, -25.1328125, -24.0986328125, -23.064453125, -22.0302734375, -20.99609375, -19.9619140625, -18.927734375, -17.8935546875, -16.859375, -15.8251953125, -14.791015625, -13.7568359375, -12.72265625, -11.6884765625, -10.654296875, -9.6201171875, -8.5859375, -7.5517578125, -6.517578125, -5.4833984375, -4.44921875, -3.4150390625, -2.380859375, -1.3466796875, -0.3125, 0.7216796875, 1.755859375, 2.7900390625, 3.82421875, 4.8583984375, 5.892578125, 6.9267578125, 7.9609375, 8.9951171875, 10.029296875, 11.0634765625, 12.09765625, 13.1318359375, 14.166015625, 15.2001953125, 16.234375, 17.2685546875, 18.302734375, 19.3369140625, 20.37109375, 21.4052734375, 22.439453125, 23.4736328125, 24.5078125, 25.5419921875, 26.576171875, 27.6103515625, 28.64453125, 29.6787109375, 30.712890625, 31.7470703125, 32.78125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 4.0, 8.0, 6.0, 8.0, 10.0, 7.0, 12.0, 13.0, 20.0, 30.0, 21.0, 13.0, 23.0, 26.0, 37.0, 34.0, 28.0, 36.0, 38.0, 40.0, 37.0, 42.0, 36.0, 37.0, 39.0, 43.0, 27.0, 40.0, 28.0, 36.0, 35.0, 22.0, 24.0, 18.0, 16.0, 16.0, 17.0, 10.0, 16.0, 8.0, 5.0, 13.0, 6.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.265625, -16.730224609375, -16.19482421875, -15.659423828125, -15.1240234375, -14.588623046875, -14.05322265625, -13.517822265625, -12.982421875, -12.447021484375, -11.91162109375, -11.376220703125, -10.8408203125, -10.305419921875, -9.77001953125, -9.234619140625, -8.69921875, -8.163818359375, -7.62841796875, -7.093017578125, -6.5576171875, -6.022216796875, -5.48681640625, -4.951416015625, -4.416015625, -3.880615234375, -3.34521484375, -2.809814453125, -2.2744140625, -1.739013671875, -1.20361328125, -0.668212890625, -0.1328125, 0.402587890625, 0.93798828125, 1.473388671875, 2.0087890625, 2.544189453125, 3.07958984375, 3.614990234375, 4.150390625, 4.685791015625, 5.22119140625, 5.756591796875, 6.2919921875, 6.827392578125, 7.36279296875, 7.898193359375, 8.43359375, 8.968994140625, 9.50439453125, 10.039794921875, 10.5751953125, 11.110595703125, 11.64599609375, 12.181396484375, 12.716796875, 13.252197265625, 13.78759765625, 14.322998046875, 14.8583984375, 15.393798828125, 15.92919921875, 16.464599609375, 17.0]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 8.0, 8.0, 16.0, 27.0, 40.0, 48.0, 80.0, 122.0, 198.0, 291.0, 455.0, 673.0, 1093.0, 1786.0, 3151.0, 5695.0, 12047.0, 29781.0, 90323.0, 284125.0, 385485.0, 150756.0, 47163.0, 17557.0, 7804.0, 3868.0, 2338.0, 1279.0, 823.0, 508.0, 324.0, 236.0, 142.0, 102.0, 60.0, 49.0, 30.0, 18.0, 12.0, 10.0, 7.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.59375, -38.4365234375, -37.279296875, -36.1220703125, -34.96484375, -33.8076171875, -32.650390625, -31.4931640625, -30.3359375, -29.1787109375, -28.021484375, -26.8642578125, -25.70703125, -24.5498046875, -23.392578125, -22.2353515625, -21.078125, -19.9208984375, -18.763671875, -17.6064453125, -16.44921875, -15.2919921875, -14.134765625, -12.9775390625, -11.8203125, -10.6630859375, -9.505859375, -8.3486328125, -7.19140625, -6.0341796875, -4.876953125, -3.7197265625, -2.5625, -1.4052734375, -0.248046875, 0.9091796875, 2.06640625, 3.2236328125, 4.380859375, 5.5380859375, 6.6953125, 7.8525390625, 9.009765625, 10.1669921875, 11.32421875, 12.4814453125, 13.638671875, 14.7958984375, 15.953125, 17.1103515625, 18.267578125, 19.4248046875, 20.58203125, 21.7392578125, 22.896484375, 24.0537109375, 25.2109375, 26.3681640625, 27.525390625, 28.6826171875, 29.83984375, 30.9970703125, 32.154296875, 33.3115234375, 34.46875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 11.0, 19.0, 33.0, 43.0, 49.0, 81.0, 106.0, 135.0, 135.0, 91.0, 83.0, 57.0, 43.0, 29.0, 18.0, 11.0, 10.0, 4.0, 8.0, 5.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003662109375, -0.0035507678985595703, -0.0034394264221191406, -0.003328084945678711, -0.0032167434692382812, -0.0031054019927978516, -0.002994060516357422, -0.002882719039916992, -0.0027713775634765625, -0.002660036087036133, -0.002548694610595703, -0.0024373531341552734, -0.0023260116577148438, -0.002214670181274414, -0.0021033287048339844, -0.0019919872283935547, -0.001880645751953125, -0.0017693042755126953, -0.0016579627990722656, -0.001546621322631836, -0.0014352798461914062, -0.0013239383697509766, -0.0012125968933105469, -0.0011012554168701172, -0.0009899139404296875, -0.0008785724639892578, -0.0007672309875488281, -0.0006558895111083984, -0.0005445480346679688, -0.00043320655822753906, -0.0003218650817871094, -0.0002105236053466797, -9.918212890625e-05, 1.2159347534179688e-05, 0.00012350082397460938, 0.00023484230041503906, 0.00034618377685546875, 0.00045752525329589844, 0.0005688667297363281, 0.0006802082061767578, 0.0007915496826171875, 0.0009028911590576172, 0.0010142326354980469, 0.0011255741119384766, 0.0012369155883789062, 0.001348257064819336, 0.0014595985412597656, 0.0015709400177001953, 0.001682281494140625, 0.0017936229705810547, 0.0019049644470214844, 0.002016305923461914, 0.0021276473999023438, 0.0022389888763427734, 0.002350330352783203, 0.002461671829223633, 0.0025730133056640625, 0.002684354782104492, 0.002795696258544922, 0.0029070377349853516, 0.0030183792114257812, 0.003129720687866211, 0.0032410621643066406, 0.0033524036407470703, 0.0034637451171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 9.0, 9.0, 15.0, 13.0, 26.0, 44.0, 58.0, 76.0, 108.0, 123.0, 246.0, 346.0, 599.0, 1040.0, 1789.0, 3489.0, 6741.0, 14972.0, 35618.0, 100705.0, 285386.0, 357986.0, 149698.0, 50719.0, 19802.0, 8915.0, 4405.0, 2296.0, 1274.0, 733.0, 471.0, 249.0, 189.0, 101.0, 81.0, 49.0, 33.0, 34.0, 25.0, 20.0, 9.0, 12.0, 6.0, 9.0, 6.0, 5.0, 4.0, 1.0, 1.0], "bins": [-36.59375, -35.582275390625, -34.57080078125, -33.559326171875, -32.5478515625, -31.536376953125, -30.52490234375, -29.513427734375, -28.501953125, -27.490478515625, -26.47900390625, -25.467529296875, -24.4560546875, -23.444580078125, -22.43310546875, -21.421630859375, -20.41015625, -19.398681640625, -18.38720703125, -17.375732421875, -16.3642578125, -15.352783203125, -14.34130859375, -13.329833984375, -12.318359375, -11.306884765625, -10.29541015625, -9.283935546875, -8.2724609375, -7.260986328125, -6.24951171875, -5.238037109375, -4.2265625, -3.215087890625, -2.20361328125, -1.192138671875, -0.1806640625, 0.830810546875, 1.84228515625, 2.853759765625, 3.865234375, 4.876708984375, 5.88818359375, 6.899658203125, 7.9111328125, 8.922607421875, 9.93408203125, 10.945556640625, 11.95703125, 12.968505859375, 13.97998046875, 14.991455078125, 16.0029296875, 17.014404296875, 18.02587890625, 19.037353515625, 20.048828125, 21.060302734375, 22.07177734375, 23.083251953125, 24.0947265625, 25.106201171875, 26.11767578125, 27.129150390625, 28.140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 11.0, 4.0, 5.0, 11.0, 17.0, 11.0, 21.0, 26.0, 36.0, 45.0, 50.0, 76.0, 99.0, 102.0, 89.0, 93.0, 62.0, 43.0, 40.0, 40.0, 25.0, 16.0, 10.0, 15.0, 10.0, 9.0, 8.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.75390625, -6.47296142578125, -6.1920166015625, -5.91107177734375, -5.630126953125, -5.34918212890625, -5.0682373046875, -4.78729248046875, -4.50634765625, -4.22540283203125, -3.9444580078125, -3.66351318359375, -3.382568359375, -3.10162353515625, -2.8206787109375, -2.53973388671875, -2.2587890625, -1.97784423828125, -1.6968994140625, -1.41595458984375, -1.135009765625, -0.85406494140625, -0.5731201171875, -0.29217529296875, -0.01123046875, 0.26971435546875, 0.5506591796875, 0.83160400390625, 1.112548828125, 1.39349365234375, 1.6744384765625, 1.95538330078125, 2.236328125, 2.51727294921875, 2.7982177734375, 3.07916259765625, 3.360107421875, 3.64105224609375, 3.9219970703125, 4.20294189453125, 4.48388671875, 4.76483154296875, 5.0457763671875, 5.32672119140625, 5.607666015625, 5.88861083984375, 6.1695556640625, 6.45050048828125, 6.7314453125, 7.01239013671875, 7.2933349609375, 7.57427978515625, 7.855224609375, 8.13616943359375, 8.4171142578125, 8.69805908203125, 8.97900390625, 9.25994873046875, 9.5408935546875, 9.82183837890625, 10.102783203125, 10.38372802734375, 10.6646728515625, 10.94561767578125, 11.2265625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 7.0, 3.0, 6.0, 8.0, 5.0, 9.0, 20.0, 17.0, 18.0, 21.0, 21.0, 23.0, 35.0, 43.0, 41.0, 45.0, 45.0, 55.0, 50.0, 45.0, 60.0, 38.0, 40.0, 55.0, 38.0, 47.0, 31.0, 35.0, 36.0, 16.0, 17.0, 15.0, 8.0, 14.0, 8.0, 5.0, 5.0, 5.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.01079559326172, -31.08550453186035, -30.160213470458984, -29.23492431640625, -28.309633255004883, -27.384342193603516, -26.45905303955078, -25.533761978149414, -24.608470916748047, -23.68317985534668, -22.757888793945312, -21.832599639892578, -20.90730857849121, -19.982017517089844, -19.05672836303711, -18.131437301635742, -17.206146240234375, -16.280855178833008, -15.355565071105957, -14.430274963378906, -13.504983901977539, -12.579692840576172, -11.654402732849121, -10.72911262512207, -9.803821563720703, -8.878530502319336, -7.953240394592285, -7.027949810028076, -6.102659225463867, -5.177368640899658, -4.252078056335449, -3.3267874717712402, -2.4014949798583984, -1.4762043952941895, -0.5509138107299805, 0.3743767738342285, 1.2996673583984375, 2.2249579429626465, 3.1502485275268555, 4.0755391120910645, 5.000829696655273, 5.926120281219482, 6.851410865783691, 7.7767014503479, 8.70199203491211, 9.627283096313477, 10.552573204040527, 11.477863311767578, 12.403154373168945, 13.328445434570312, 14.253735542297363, 15.179025650024414, 16.10431671142578, 17.02960777282715, 17.954898834228516, 18.88018798828125, 19.805479049682617, 20.730770111083984, 21.65605926513672, 22.581350326538086, 23.506641387939453, 24.43193244934082, 25.357223510742188, 26.282512664794922, 27.20780372619629]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 4.0, 5.0, 11.0, 15.0, 14.0, 18.0, 11.0, 16.0, 21.0, 28.0, 31.0, 28.0, 31.0, 23.0, 38.0, 53.0, 36.0, 32.0, 44.0, 43.0, 40.0, 49.0, 46.0, 36.0, 39.0, 28.0, 37.0, 37.0, 27.0, 27.0, 18.0, 22.0, 13.0, 8.0, 12.0, 13.0, 10.0, 9.0, 3.0, 4.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.625940322875977, -24.803417205810547, -23.98089599609375, -23.15837287902832, -22.335851669311523, -21.513328552246094, -20.690807342529297, -19.868284225463867, -19.045761108398438, -18.223237991333008, -17.40071678161621, -16.57819366455078, -15.755671501159668, -14.933149337768555, -14.110627174377441, -13.288105010986328, -12.465582847595215, -11.643060684204102, -10.820538520812988, -9.998016357421875, -9.175493240356445, -8.352971076965332, -7.530448913574219, -6.707926273345947, -5.885404109954834, -5.062881946563721, -4.240359306335449, -3.417837142944336, -2.5953147411346436, -1.7727923393249512, -0.9502701759338379, -0.1277475357055664, 0.6947746276855469, 1.5172970294952393, 2.3398194313049316, 3.162341594696045, 3.9848639965057373, 4.80738639831543, 5.629908561706543, 6.4524312019348145, 7.274953365325928, 8.0974760055542, 8.919998168945312, 9.742520332336426, 10.565042495727539, 11.387565612792969, 12.210086822509766, 13.032609939575195, 13.855132102966309, 14.677654266357422, 15.500176429748535, 16.32269859313965, 17.145221710205078, 17.967742919921875, 18.790266036987305, 19.612789154052734, 20.43531036376953, 21.25783348083496, 22.080354690551758, 22.902877807617188, 23.725399017333984, 24.547922134399414, 25.370445251464844, 26.19296646118164, 27.01548957824707]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 7.0, 13.0, 13.0, 18.0, 30.0, 37.0, 62.0, 70.0, 98.0, 178.0, 260.0, 372.0, 573.0, 820.0, 1245.0, 1940.0, 2876.0, 4783.0, 7807.0, 12727.0, 21680.0, 37594.0, 67850.0, 124283.0, 238435.0, 458588.0, 759983.0, 894242.0, 693349.0, 401915.0, 208880.0, 110298.0, 60257.0, 33669.0, 19593.0, 11341.0, 6792.0, 4294.0, 2591.0, 1657.0, 1060.0, 644.0, 442.0, 291.0, 212.0, 139.0, 83.0, 67.0, 43.0, 35.0, 26.0, 11.0, 10.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-29.046875, -28.177001953125, -27.30712890625, -26.437255859375, -25.5673828125, -24.697509765625, -23.82763671875, -22.957763671875, -22.087890625, -21.218017578125, -20.34814453125, -19.478271484375, -18.6083984375, -17.738525390625, -16.86865234375, -15.998779296875, -15.12890625, -14.259033203125, -13.38916015625, -12.519287109375, -11.6494140625, -10.779541015625, -9.90966796875, -9.039794921875, -8.169921875, -7.300048828125, -6.43017578125, -5.560302734375, -4.6904296875, -3.820556640625, -2.95068359375, -2.080810546875, -1.2109375, -0.341064453125, 0.52880859375, 1.398681640625, 2.2685546875, 3.138427734375, 4.00830078125, 4.878173828125, 5.748046875, 6.617919921875, 7.48779296875, 8.357666015625, 9.2275390625, 10.097412109375, 10.96728515625, 11.837158203125, 12.70703125, 13.576904296875, 14.44677734375, 15.316650390625, 16.1865234375, 17.056396484375, 17.92626953125, 18.796142578125, 19.666015625, 20.535888671875, 21.40576171875, 22.275634765625, 23.1455078125, 24.015380859375, 24.88525390625, 25.755126953125, 26.625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 7.0, 7.0, 8.0, 7.0, 13.0, 10.0, 17.0, 16.0, 24.0, 28.0, 23.0, 29.0, 25.0, 31.0, 38.0, 44.0, 40.0, 43.0, 50.0, 33.0, 40.0, 44.0, 52.0, 36.0, 35.0, 44.0, 27.0, 38.0, 41.0, 20.0, 21.0, 8.0, 16.0, 11.0, 11.0, 12.0, 14.0, 9.0, 9.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.625, -20.917236328125, -20.20947265625, -19.501708984375, -18.7939453125, -18.086181640625, -17.37841796875, -16.670654296875, -15.962890625, -15.255126953125, -14.54736328125, -13.839599609375, -13.1318359375, -12.424072265625, -11.71630859375, -11.008544921875, -10.30078125, -9.593017578125, -8.88525390625, -8.177490234375, -7.4697265625, -6.761962890625, -6.05419921875, -5.346435546875, -4.638671875, -3.930908203125, -3.22314453125, -2.515380859375, -1.8076171875, -1.099853515625, -0.39208984375, 0.315673828125, 1.0234375, 1.731201171875, 2.43896484375, 3.146728515625, 3.8544921875, 4.562255859375, 5.27001953125, 5.977783203125, 6.685546875, 7.393310546875, 8.10107421875, 8.808837890625, 9.5166015625, 10.224365234375, 10.93212890625, 11.639892578125, 12.34765625, 13.055419921875, 13.76318359375, 14.470947265625, 15.1787109375, 15.886474609375, 16.59423828125, 17.302001953125, 18.009765625, 18.717529296875, 19.42529296875, 20.133056640625, 20.8408203125, 21.548583984375, 22.25634765625, 22.964111328125, 23.671875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 6.0, 6.0, 9.0, 16.0, 22.0, 35.0, 51.0, 78.0, 135.0, 235.0, 315.0, 467.0, 792.0, 1193.0, 1886.0, 3226.0, 5148.0, 8970.0, 15778.0, 27826.0, 50651.0, 94034.0, 176513.0, 334544.0, 597600.0, 881239.0, 833396.0, 531283.0, 290147.0, 154001.0, 81938.0, 44177.0, 24511.0, 13771.0, 8044.0, 4711.0, 2795.0, 1717.0, 1137.0, 680.0, 420.0, 288.0, 173.0, 119.0, 85.0, 47.0, 37.0, 15.0, 10.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-35.0, -33.996826171875, -32.99365234375, -31.990478515625, -30.9873046875, -29.984130859375, -28.98095703125, -27.977783203125, -26.974609375, -25.971435546875, -24.96826171875, -23.965087890625, -22.9619140625, -21.958740234375, -20.95556640625, -19.952392578125, -18.94921875, -17.946044921875, -16.94287109375, -15.939697265625, -14.9365234375, -13.933349609375, -12.93017578125, -11.927001953125, -10.923828125, -9.920654296875, -8.91748046875, -7.914306640625, -6.9111328125, -5.907958984375, -4.90478515625, -3.901611328125, -2.8984375, -1.895263671875, -0.89208984375, 0.111083984375, 1.1142578125, 2.117431640625, 3.12060546875, 4.123779296875, 5.126953125, 6.130126953125, 7.13330078125, 8.136474609375, 9.1396484375, 10.142822265625, 11.14599609375, 12.149169921875, 13.15234375, 14.155517578125, 15.15869140625, 16.161865234375, 17.1650390625, 18.168212890625, 19.17138671875, 20.174560546875, 21.177734375, 22.180908203125, 23.18408203125, 24.187255859375, 25.1904296875, 26.193603515625, 27.19677734375, 28.199951171875, 29.203125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 4.0, 0.0, 5.0, 8.0, 5.0, 8.0, 12.0, 17.0, 14.0, 20.0, 18.0, 32.0, 35.0, 55.0, 69.0, 87.0, 89.0, 100.0, 110.0, 152.0, 156.0, 160.0, 207.0, 232.0, 241.0, 260.0, 242.0, 231.0, 228.0, 180.0, 173.0, 146.0, 137.0, 117.0, 106.0, 74.0, 64.0, 63.0, 53.0, 30.0, 38.0, 20.0, 13.0, 12.0, 11.0, 18.0, 2.0, 6.0, 2.0, 3.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.578125, -10.25830078125, -9.9384765625, -9.61865234375, -9.298828125, -8.97900390625, -8.6591796875, -8.33935546875, -8.01953125, -7.69970703125, -7.3798828125, -7.06005859375, -6.740234375, -6.42041015625, -6.1005859375, -5.78076171875, -5.4609375, -5.14111328125, -4.8212890625, -4.50146484375, -4.181640625, -3.86181640625, -3.5419921875, -3.22216796875, -2.90234375, -2.58251953125, -2.2626953125, -1.94287109375, -1.623046875, -1.30322265625, -0.9833984375, -0.66357421875, -0.34375, -0.02392578125, 0.2958984375, 0.61572265625, 0.935546875, 1.25537109375, 1.5751953125, 1.89501953125, 2.21484375, 2.53466796875, 2.8544921875, 3.17431640625, 3.494140625, 3.81396484375, 4.1337890625, 4.45361328125, 4.7734375, 5.09326171875, 5.4130859375, 5.73291015625, 6.052734375, 6.37255859375, 6.6923828125, 7.01220703125, 7.33203125, 7.65185546875, 7.9716796875, 8.29150390625, 8.611328125, 8.93115234375, 9.2509765625, 9.57080078125, 9.890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 3.0, 9.0, 7.0, 11.0, 11.0, 10.0, 18.0, 20.0, 23.0, 28.0, 40.0, 34.0, 53.0, 53.0, 55.0, 49.0, 71.0, 56.0, 64.0, 50.0, 48.0, 56.0, 47.0, 26.0, 34.0, 27.0, 20.0, 12.0, 16.0, 7.0, 12.0, 10.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.280052185058594, -32.23918533325195, -31.19831657409668, -30.157447814941406, -29.116580963134766, -28.075712203979492, -27.03484344482422, -25.993976593017578, -24.953107833862305, -23.91223907470703, -22.87137222290039, -21.830503463745117, -20.789634704589844, -19.748767852783203, -18.70789909362793, -17.667030334472656, -16.626163482666016, -15.585295677185059, -14.544427871704102, -13.503559112548828, -12.462691307067871, -11.421823501586914, -10.38095474243164, -9.340086936950684, -8.299219131469727, -7.2583513259887695, -6.217483043670654, -5.176614761352539, -4.135746955871582, -3.094879150390625, -2.0540108680725098, -1.0131425857543945, 0.0277252197265625, 1.0685932636260986, 2.1094613075256348, 3.150329351425171, 4.191197395324707, 5.232065200805664, 6.272933483123779, 7.3138017654418945, 8.354669570922852, 9.395537376403809, 10.436405181884766, 11.477273941040039, 12.518141746520996, 13.559009552001953, 14.599878311157227, 15.640746116638184, 16.68161392211914, 17.722482681274414, 18.763349533081055, 19.804218292236328, 20.84508514404297, 21.885953903198242, 22.926822662353516, 23.967689514160156, 25.00855827331543, 26.049427032470703, 27.090293884277344, 28.131162643432617, 29.17203140258789, 30.21289825439453, 31.253767013549805, 32.29463577270508, 33.33550262451172]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 8.0, 5.0, 10.0, 12.0, 9.0, 11.0, 13.0, 19.0, 21.0, 25.0, 41.0, 36.0, 42.0, 28.0, 38.0, 40.0, 35.0, 45.0, 43.0, 49.0, 44.0, 48.0, 48.0, 44.0, 35.0, 43.0, 36.0, 19.0, 29.0, 16.0, 19.0, 23.0, 11.0, 11.0, 12.0, 11.0, 8.0, 2.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.848255157470703, -27.998109817504883, -27.14796257019043, -26.29781723022461, -25.447669982910156, -24.597524642944336, -23.747379302978516, -22.897232055664062, -22.047086715698242, -21.196941375732422, -20.34679412841797, -19.49664878845215, -18.646503448486328, -17.796356201171875, -16.946210861206055, -16.096065521240234, -15.245918273925781, -14.395771980285645, -13.545625686645508, -12.695480346679688, -11.84533405303955, -10.995187759399414, -10.145042419433594, -9.294896125793457, -8.44474983215332, -7.594603538513184, -6.744457721710205, -5.894311904907227, -5.04416561126709, -4.194019317626953, -3.3438735008239746, -2.493727684020996, -1.6435813903808594, -0.7934353351593018, 0.05671072006225586, 0.9068567752838135, 1.757002830505371, 2.607149124145508, 3.4572949409484863, 4.307440757751465, 5.157587051391602, 6.007733345031738, 6.857879161834717, 7.708024978637695, 8.558171272277832, 9.408317565917969, 10.258462905883789, 11.108609199523926, 11.958755493164062, 12.8089017868042, 13.659048080444336, 14.509193420410156, 15.359339714050293, 16.20948600769043, 17.05963134765625, 17.909778594970703, 18.759923934936523, 19.610069274902344, 20.460216522216797, 21.310361862182617, 22.160507202148438, 23.01065444946289, 23.86079978942871, 24.71094512939453, 25.561092376708984]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 3.0, 1.0, 7.0, 13.0, 16.0, 53.0, 61.0, 90.0, 111.0, 192.0, 306.0, 535.0, 781.0, 1214.0, 1933.0, 3098.0, 4689.0, 7582.0, 11648.0, 18359.0, 29639.0, 46593.0, 72918.0, 107820.0, 145534.0, 161365.0, 141340.0, 103597.0, 68489.0, 44444.0, 27919.0, 17599.0, 10846.0, 7118.0, 4500.0, 2978.0, 1757.0, 1244.0, 799.0, 492.0, 332.0, 188.0, 132.0, 81.0, 51.0, 33.0, 29.0, 17.0, 8.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-15.4921875, -15.0289306640625, -14.565673828125, -14.1024169921875, -13.63916015625, -13.1759033203125, -12.712646484375, -12.2493896484375, -11.7861328125, -11.3228759765625, -10.859619140625, -10.3963623046875, -9.93310546875, -9.4698486328125, -9.006591796875, -8.5433349609375, -8.080078125, -7.6168212890625, -7.153564453125, -6.6903076171875, -6.22705078125, -5.7637939453125, -5.300537109375, -4.8372802734375, -4.3740234375, -3.9107666015625, -3.447509765625, -2.9842529296875, -2.52099609375, -2.0577392578125, -1.594482421875, -1.1312255859375, -0.66796875, -0.2047119140625, 0.258544921875, 0.7218017578125, 1.18505859375, 1.6483154296875, 2.111572265625, 2.5748291015625, 3.0380859375, 3.5013427734375, 3.964599609375, 4.4278564453125, 4.89111328125, 5.3543701171875, 5.817626953125, 6.2808837890625, 6.744140625, 7.2073974609375, 7.670654296875, 8.1339111328125, 8.59716796875, 9.0604248046875, 9.523681640625, 9.9869384765625, 10.4501953125, 10.9134521484375, 11.376708984375, 11.8399658203125, 12.30322265625, 12.7664794921875, 13.229736328125, 13.6929931640625, 14.15625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 9.0, 4.0, 3.0, 7.0, 8.0, 8.0, 11.0, 9.0, 19.0, 16.0, 24.0, 29.0, 33.0, 26.0, 34.0, 40.0, 34.0, 38.0, 38.0, 45.0, 37.0, 35.0, 54.0, 53.0, 35.0, 37.0, 45.0, 37.0, 32.0, 27.0, 24.0, 18.0, 21.0, 20.0, 19.0, 16.0, 12.0, 9.0, 10.0, 8.0, 2.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.734375, -23.920654296875, -23.10693359375, -22.293212890625, -21.4794921875, -20.665771484375, -19.85205078125, -19.038330078125, -18.224609375, -17.410888671875, -16.59716796875, -15.783447265625, -14.9697265625, -14.156005859375, -13.34228515625, -12.528564453125, -11.71484375, -10.901123046875, -10.08740234375, -9.273681640625, -8.4599609375, -7.646240234375, -6.83251953125, -6.018798828125, -5.205078125, -4.391357421875, -3.57763671875, -2.763916015625, -1.9501953125, -1.136474609375, -0.32275390625, 0.490966796875, 1.3046875, 2.118408203125, 2.93212890625, 3.745849609375, 4.5595703125, 5.373291015625, 6.18701171875, 7.000732421875, 7.814453125, 8.628173828125, 9.44189453125, 10.255615234375, 11.0693359375, 11.883056640625, 12.69677734375, 13.510498046875, 14.32421875, 15.137939453125, 15.95166015625, 16.765380859375, 17.5791015625, 18.392822265625, 19.20654296875, 20.020263671875, 20.833984375, 21.647705078125, 22.46142578125, 23.275146484375, 24.0888671875, 24.902587890625, 25.71630859375, 26.530029296875, 27.34375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 6.0, 14.0, 13.0, 22.0, 37.0, 42.0, 88.0, 115.0, 156.0, 265.0, 413.0, 685.0, 1118.0, 1773.0, 2980.0, 4989.0, 8827.0, 15687.0, 28470.0, 54186.0, 101993.0, 178774.0, 233048.0, 184461.0, 105581.0, 56126.0, 29975.0, 16250.0, 9302.0, 5223.0, 3057.0, 1822.0, 1138.0, 689.0, 419.0, 292.0, 177.0, 110.0, 74.0, 45.0, 37.0, 21.0, 16.0, 16.0, 12.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-22.515625, -21.801513671875, -21.08740234375, -20.373291015625, -19.6591796875, -18.945068359375, -18.23095703125, -17.516845703125, -16.802734375, -16.088623046875, -15.37451171875, -14.660400390625, -13.9462890625, -13.232177734375, -12.51806640625, -11.803955078125, -11.08984375, -10.375732421875, -9.66162109375, -8.947509765625, -8.2333984375, -7.519287109375, -6.80517578125, -6.091064453125, -5.376953125, -4.662841796875, -3.94873046875, -3.234619140625, -2.5205078125, -1.806396484375, -1.09228515625, -0.378173828125, 0.3359375, 1.050048828125, 1.76416015625, 2.478271484375, 3.1923828125, 3.906494140625, 4.62060546875, 5.334716796875, 6.048828125, 6.762939453125, 7.47705078125, 8.191162109375, 8.9052734375, 9.619384765625, 10.33349609375, 11.047607421875, 11.76171875, 12.475830078125, 13.18994140625, 13.904052734375, 14.6181640625, 15.332275390625, 16.04638671875, 16.760498046875, 17.474609375, 18.188720703125, 18.90283203125, 19.616943359375, 20.3310546875, 21.045166015625, 21.75927734375, 22.473388671875, 23.1875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 2.0, 5.0, 3.0, 10.0, 4.0, 11.0, 13.0, 11.0, 11.0, 17.0, 19.0, 25.0, 14.0, 26.0, 27.0, 30.0, 35.0, 33.0, 49.0, 31.0, 37.0, 29.0, 28.0, 35.0, 36.0, 42.0, 50.0, 40.0, 30.0, 38.0, 39.0, 26.0, 29.0, 16.0, 24.0, 17.0, 11.0, 15.0, 14.0, 9.0, 13.0, 11.0, 4.0, 6.0, 11.0, 5.0, 3.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.3046875, -14.8265380859375, -14.348388671875, -13.8702392578125, -13.39208984375, -12.9139404296875, -12.435791015625, -11.9576416015625, -11.4794921875, -11.0013427734375, -10.523193359375, -10.0450439453125, -9.56689453125, -9.0887451171875, -8.610595703125, -8.1324462890625, -7.654296875, -7.1761474609375, -6.697998046875, -6.2198486328125, -5.74169921875, -5.2635498046875, -4.785400390625, -4.3072509765625, -3.8291015625, -3.3509521484375, -2.872802734375, -2.3946533203125, -1.91650390625, -1.4383544921875, -0.960205078125, -0.4820556640625, -0.00390625, 0.4742431640625, 0.952392578125, 1.4305419921875, 1.90869140625, 2.3868408203125, 2.864990234375, 3.3431396484375, 3.8212890625, 4.2994384765625, 4.777587890625, 5.2557373046875, 5.73388671875, 6.2120361328125, 6.690185546875, 7.1683349609375, 7.646484375, 8.1246337890625, 8.602783203125, 9.0809326171875, 9.55908203125, 10.0372314453125, 10.515380859375, 10.9935302734375, 11.4716796875, 11.9498291015625, 12.427978515625, 12.9061279296875, 13.38427734375, 13.8624267578125, 14.340576171875, 14.8187255859375, 15.296875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 6.0, 11.0, 14.0, 9.0, 19.0, 26.0, 37.0, 54.0, 79.0, 115.0, 175.0, 198.0, 302.0, 388.0, 591.0, 846.0, 1273.0, 1882.0, 2853.0, 4518.0, 6802.0, 10974.0, 17866.0, 29681.0, 50517.0, 87119.0, 148839.0, 212241.0, 186842.0, 116349.0, 66468.0, 39000.0, 23234.0, 14269.0, 8703.0, 5455.0, 3585.0, 2333.0, 1529.0, 1038.0, 683.0, 504.0, 340.0, 225.0, 154.0, 126.0, 81.0, 54.0, 50.0, 36.0, 22.0, 17.0, 7.0, 6.0, 5.0, 10.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-5.51171875, -5.32647705078125, -5.1412353515625, -4.95599365234375, -4.770751953125, -4.58551025390625, -4.4002685546875, -4.21502685546875, -4.02978515625, -3.84454345703125, -3.6593017578125, -3.47406005859375, -3.288818359375, -3.10357666015625, -2.9183349609375, -2.73309326171875, -2.5478515625, -2.36260986328125, -2.1773681640625, -1.99212646484375, -1.806884765625, -1.62164306640625, -1.4364013671875, -1.25115966796875, -1.06591796875, -0.88067626953125, -0.6954345703125, -0.51019287109375, -0.324951171875, -0.13970947265625, 0.0455322265625, 0.23077392578125, 0.416015625, 0.60125732421875, 0.7864990234375, 0.97174072265625, 1.156982421875, 1.34222412109375, 1.5274658203125, 1.71270751953125, 1.89794921875, 2.08319091796875, 2.2684326171875, 2.45367431640625, 2.638916015625, 2.82415771484375, 3.0093994140625, 3.19464111328125, 3.3798828125, 3.56512451171875, 3.7503662109375, 3.93560791015625, 4.120849609375, 4.30609130859375, 4.4913330078125, 4.67657470703125, 4.86181640625, 5.04705810546875, 5.2322998046875, 5.41754150390625, 5.602783203125, 5.78802490234375, 5.9732666015625, 6.15850830078125, 6.34375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 12.0, 4.0, 8.0, 3.0, 13.0, 6.0, 13.0, 17.0, 10.0, 24.0, 21.0, 32.0, 28.0, 40.0, 48.0, 56.0, 42.0, 64.0, 52.0, 59.0, 44.0, 46.0, 64.0, 41.0, 32.0, 40.0, 24.0, 22.0, 19.0, 21.0, 19.0, 13.0, 16.0, 13.0, 2.0, 9.0, 3.0, 9.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0005884170532226562, -0.0005707666277885437, -0.0005531162023544312, -0.0005354657769203186, -0.0005178153514862061, -0.0005001649260520935, -0.00048251450061798096, -0.0004648640751838684, -0.00044721364974975586, -0.0004295632243156433, -0.00041191279888153076, -0.0003942623734474182, -0.00037661194801330566, -0.0003589615225791931, -0.00034131109714508057, -0.000323660671710968, -0.00030601024627685547, -0.0002883598208427429, -0.00027070939540863037, -0.0002530589699745178, -0.00023540854454040527, -0.00021775811910629272, -0.00020010769367218018, -0.00018245726823806763, -0.00016480684280395508, -0.00014715641736984253, -0.00012950599193572998, -0.00011185556650161743, -9.420514106750488e-05, -7.655471563339233e-05, -5.8904290199279785e-05, -4.1253864765167236e-05, -2.3603439331054688e-05, -5.953013896942139e-06, 1.169741153717041e-05, 2.934783697128296e-05, 4.699826240539551e-05, 6.464868783950806e-05, 8.22991132736206e-05, 9.994953870773315e-05, 0.0001175999641418457, 0.00013525038957595825, 0.0001529008150100708, 0.00017055124044418335, 0.0001882016658782959, 0.00020585209131240845, 0.000223502516746521, 0.00024115294218063354, 0.0002588033676147461, 0.00027645379304885864, 0.0002941042184829712, 0.00031175464391708374, 0.0003294050693511963, 0.00034705549478530884, 0.0003647059202194214, 0.00038235634565353394, 0.0004000067710876465, 0.00041765719652175903, 0.0004353076219558716, 0.00045295804738998413, 0.0004706084728240967, 0.00048825889825820923, 0.0005059093236923218, 0.0005235597491264343, 0.0005412101745605469]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 15.0, 21.0, 15.0, 30.0, 55.0, 67.0, 90.0, 114.0, 175.0, 256.0, 346.0, 594.0, 811.0, 1188.0, 1754.0, 2934.0, 4276.0, 6834.0, 10904.0, 18161.0, 30621.0, 52054.0, 90856.0, 152621.0, 207515.0, 183408.0, 116539.0, 67110.0, 38762.0, 22808.0, 13721.0, 8447.0, 5307.0, 3329.0, 2270.0, 1459.0, 941.0, 650.0, 423.0, 330.0, 237.0, 148.0, 114.0, 74.0, 49.0, 33.0, 22.0, 23.0, 11.0, 8.0, 12.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.27734375, -7.0479736328125, -6.818603515625, -6.5892333984375, -6.35986328125, -6.1304931640625, -5.901123046875, -5.6717529296875, -5.4423828125, -5.2130126953125, -4.983642578125, -4.7542724609375, -4.52490234375, -4.2955322265625, -4.066162109375, -3.8367919921875, -3.607421875, -3.3780517578125, -3.148681640625, -2.9193115234375, -2.68994140625, -2.4605712890625, -2.231201171875, -2.0018310546875, -1.7724609375, -1.5430908203125, -1.313720703125, -1.0843505859375, -0.85498046875, -0.6256103515625, -0.396240234375, -0.1668701171875, 0.0625, 0.2918701171875, 0.521240234375, 0.7506103515625, 0.97998046875, 1.2093505859375, 1.438720703125, 1.6680908203125, 1.8974609375, 2.1268310546875, 2.356201171875, 2.5855712890625, 2.81494140625, 3.0443115234375, 3.273681640625, 3.5030517578125, 3.732421875, 3.9617919921875, 4.191162109375, 4.4205322265625, 4.64990234375, 4.8792724609375, 5.108642578125, 5.3380126953125, 5.5673828125, 5.7967529296875, 6.026123046875, 6.2554931640625, 6.48486328125, 6.7142333984375, 6.943603515625, 7.1729736328125, 7.40234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 14.0, 19.0, 27.0, 30.0, 46.0, 45.0, 73.0, 86.0, 91.0, 113.0, 75.0, 78.0, 70.0, 57.0, 33.0, 34.0, 27.0, 19.0, 11.0, 11.0, 12.0, 6.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.8828125, -3.75189208984375, -3.6209716796875, -3.49005126953125, -3.359130859375, -3.22821044921875, -3.0972900390625, -2.96636962890625, -2.83544921875, -2.70452880859375, -2.5736083984375, -2.44268798828125, -2.311767578125, -2.18084716796875, -2.0499267578125, -1.91900634765625, -1.7880859375, -1.65716552734375, -1.5262451171875, -1.39532470703125, -1.264404296875, -1.13348388671875, -1.0025634765625, -0.87164306640625, -0.74072265625, -0.60980224609375, -0.4788818359375, -0.34796142578125, -0.217041015625, -0.08612060546875, 0.0447998046875, 0.17572021484375, 0.306640625, 0.43756103515625, 0.5684814453125, 0.69940185546875, 0.830322265625, 0.96124267578125, 1.0921630859375, 1.22308349609375, 1.35400390625, 1.48492431640625, 1.6158447265625, 1.74676513671875, 1.877685546875, 2.00860595703125, 2.1395263671875, 2.27044677734375, 2.4013671875, 2.53228759765625, 2.6632080078125, 2.79412841796875, 2.925048828125, 3.05596923828125, 3.1868896484375, 3.31781005859375, 3.44873046875, 3.57965087890625, 3.7105712890625, 3.84149169921875, 3.972412109375, 4.10333251953125, 4.2342529296875, 4.36517333984375, 4.49609375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 5.0, 9.0, 6.0, 12.0, 13.0, 11.0, 17.0, 18.0, 24.0, 30.0, 35.0, 36.0, 51.0, 54.0, 51.0, 58.0, 74.0, 54.0, 67.0, 56.0, 47.0, 42.0, 46.0, 29.0, 31.0, 28.0, 24.0, 16.0, 16.0, 8.0, 5.0, 6.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.29232406616211, -32.246097564697266, -31.199871063232422, -30.153644561767578, -29.107419967651367, -28.061193466186523, -27.01496696472168, -25.968740463256836, -24.922515869140625, -23.87628936767578, -22.830062866210938, -21.783836364746094, -20.737611770629883, -19.69138526916504, -18.645158767700195, -17.59893226623535, -16.552705764770508, -15.506479263305664, -14.460253715515137, -13.414027214050293, -12.367801666259766, -11.321575164794922, -10.275348663330078, -9.229122161865234, -8.182896614074707, -7.1366705894470215, -6.090444564819336, -5.044218063354492, -3.9979920387268066, -2.951766014099121, -1.9055395126342773, -0.8593134880065918, 0.18691253662109375, 1.2331386804580688, 2.279364824295044, 3.3255910873413086, 4.371817111968994, 5.41804313659668, 6.464269638061523, 7.510495662689209, 8.556721687316895, 9.602948188781738, 10.649173736572266, 11.69540023803711, 12.741626739501953, 13.78785228729248, 14.834078788757324, 15.880304336547852, 16.926530838012695, 17.97275733947754, 19.018983840942383, 20.065208435058594, 21.111434936523438, 22.15766143798828, 23.203887939453125, 24.25011444091797, 25.296340942382812, 26.342567443847656, 27.3887939453125, 28.435020446777344, 29.481245040893555, 30.5274715423584, 31.573698043823242, 32.61992263793945, 33.6661491394043]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 10.0, 10.0, 7.0, 11.0, 12.0, 16.0, 18.0, 18.0, 29.0, 30.0, 44.0, 28.0, 37.0, 35.0, 39.0, 43.0, 35.0, 42.0, 49.0, 42.0, 46.0, 45.0, 45.0, 42.0, 35.0, 44.0, 29.0, 19.0, 20.0, 25.0, 11.0, 20.0, 12.0, 12.0, 12.0, 10.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-28.941328048706055, -28.097658157348633, -27.253990173339844, -26.410320281982422, -25.566650390625, -24.722980499267578, -23.879310607910156, -23.035642623901367, -22.191972732543945, -21.348302841186523, -20.504634857177734, -19.660964965820312, -18.81729507446289, -17.97362518310547, -17.129955291748047, -16.286287307739258, -15.442617416381836, -14.598947525024414, -13.755278587341309, -12.911609649658203, -12.067939758300781, -11.22426986694336, -10.380600929260254, -9.536931991577148, -8.693262100219727, -7.849592685699463, -7.005923271179199, -6.1622538566589355, -5.318584442138672, -4.474915027618408, -3.6312456130981445, -2.787576198577881, -1.9439048767089844, -1.1002354621887207, -0.25656604766845703, 0.5871033668518066, 1.4307727813720703, 2.274442195892334, 3.1181116104125977, 3.9617810249328613, 4.805450439453125, 5.649119853973389, 6.492789268493652, 7.336458683013916, 8.18012809753418, 9.023797988891602, 9.867466926574707, 10.711135864257812, 11.554805755615234, 12.398475646972656, 13.242144584655762, 14.085813522338867, 14.929483413696289, 15.773153305053711, 16.6168212890625, 17.460491180419922, 18.304161071777344, 19.147830963134766, 19.991500854492188, 20.835168838500977, 21.6788387298584, 22.52250862121582, 23.36617660522461, 24.20984649658203, 25.053516387939453]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 10.0, 31.0, 41.0, 64.0, 81.0, 140.0, 221.0, 298.0, 517.0, 824.0, 1264.0, 2048.0, 3138.0, 4888.0, 7478.0, 11596.0, 17943.0, 27152.0, 40854.0, 59706.0, 82850.0, 107325.0, 124913.0, 129558.0, 117406.0, 94327.0, 69951.0, 48720.0, 33441.0, 21640.0, 14190.0, 9296.0, 5907.0, 3851.0, 2511.0, 1636.0, 980.0, 610.0, 412.0, 273.0, 156.0, 133.0, 61.0, 37.0, 27.0, 12.0, 12.0, 7.0, 10.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.359375, -21.6435546875, -20.927734375, -20.2119140625, -19.49609375, -18.7802734375, -18.064453125, -17.3486328125, -16.6328125, -15.9169921875, -15.201171875, -14.4853515625, -13.76953125, -13.0537109375, -12.337890625, -11.6220703125, -10.90625, -10.1904296875, -9.474609375, -8.7587890625, -8.04296875, -7.3271484375, -6.611328125, -5.8955078125, -5.1796875, -4.4638671875, -3.748046875, -3.0322265625, -2.31640625, -1.6005859375, -0.884765625, -0.1689453125, 0.546875, 1.2626953125, 1.978515625, 2.6943359375, 3.41015625, 4.1259765625, 4.841796875, 5.5576171875, 6.2734375, 6.9892578125, 7.705078125, 8.4208984375, 9.13671875, 9.8525390625, 10.568359375, 11.2841796875, 12.0, 12.7158203125, 13.431640625, 14.1474609375, 14.86328125, 15.5791015625, 16.294921875, 17.0107421875, 17.7265625, 18.4423828125, 19.158203125, 19.8740234375, 20.58984375, 21.3056640625, 22.021484375, 22.7373046875, 23.453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 8.0, 8.0, 6.0, 11.0, 7.0, 12.0, 13.0, 18.0, 23.0, 15.0, 27.0, 26.0, 23.0, 34.0, 33.0, 47.0, 44.0, 31.0, 43.0, 39.0, 38.0, 52.0, 45.0, 34.0, 45.0, 30.0, 43.0, 33.0, 30.0, 27.0, 17.0, 22.0, 31.0, 21.0, 14.0, 11.0, 12.0, 4.0, 2.0, 3.0, 5.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-26.453125, -25.636962890625, -24.82080078125, -24.004638671875, -23.1884765625, -22.372314453125, -21.55615234375, -20.739990234375, -19.923828125, -19.107666015625, -18.29150390625, -17.475341796875, -16.6591796875, -15.843017578125, -15.02685546875, -14.210693359375, -13.39453125, -12.578369140625, -11.76220703125, -10.946044921875, -10.1298828125, -9.313720703125, -8.49755859375, -7.681396484375, -6.865234375, -6.049072265625, -5.23291015625, -4.416748046875, -3.6005859375, -2.784423828125, -1.96826171875, -1.152099609375, -0.3359375, 0.480224609375, 1.29638671875, 2.112548828125, 2.9287109375, 3.744873046875, 4.56103515625, 5.377197265625, 6.193359375, 7.009521484375, 7.82568359375, 8.641845703125, 9.4580078125, 10.274169921875, 11.09033203125, 11.906494140625, 12.72265625, 13.538818359375, 14.35498046875, 15.171142578125, 15.9873046875, 16.803466796875, 17.61962890625, 18.435791015625, 19.251953125, 20.068115234375, 20.88427734375, 21.700439453125, 22.5166015625, 23.332763671875, 24.14892578125, 24.965087890625, 25.78125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 9.0, 4.0, 21.0, 27.0, 38.0, 53.0, 83.0, 108.0, 197.0, 250.0, 426.0, 574.0, 885.0, 1315.0, 2014.0, 3099.0, 4745.0, 7186.0, 11013.0, 16603.0, 24671.0, 36195.0, 52228.0, 72580.0, 94656.0, 113493.0, 123825.0, 118280.0, 102098.0, 79359.0, 57822.0, 41108.0, 28162.0, 18901.0, 12445.0, 8134.0, 5379.0, 3566.0, 2437.0, 1549.0, 1008.0, 680.0, 439.0, 297.0, 198.0, 138.0, 82.0, 55.0, 37.0, 38.0, 22.0, 13.0, 6.0, 4.0, 2.0, 2.0, 3.0], "bins": [-24.859375, -24.120849609375, -23.38232421875, -22.643798828125, -21.9052734375, -21.166748046875, -20.42822265625, -19.689697265625, -18.951171875, -18.212646484375, -17.47412109375, -16.735595703125, -15.9970703125, -15.258544921875, -14.52001953125, -13.781494140625, -13.04296875, -12.304443359375, -11.56591796875, -10.827392578125, -10.0888671875, -9.350341796875, -8.61181640625, -7.873291015625, -7.134765625, -6.396240234375, -5.65771484375, -4.919189453125, -4.1806640625, -3.442138671875, -2.70361328125, -1.965087890625, -1.2265625, -0.488037109375, 0.25048828125, 0.989013671875, 1.7275390625, 2.466064453125, 3.20458984375, 3.943115234375, 4.681640625, 5.420166015625, 6.15869140625, 6.897216796875, 7.6357421875, 8.374267578125, 9.11279296875, 9.851318359375, 10.58984375, 11.328369140625, 12.06689453125, 12.805419921875, 13.5439453125, 14.282470703125, 15.02099609375, 15.759521484375, 16.498046875, 17.236572265625, 17.97509765625, 18.713623046875, 19.4521484375, 20.190673828125, 20.92919921875, 21.667724609375, 22.40625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 5.0, 6.0, 2.0, 6.0, 5.0, 1.0, 7.0, 16.0, 13.0, 14.0, 12.0, 15.0, 14.0, 24.0, 30.0, 21.0, 24.0, 20.0, 32.0, 31.0, 25.0, 37.0, 34.0, 36.0, 29.0, 29.0, 26.0, 49.0, 41.0, 34.0, 29.0, 32.0, 24.0, 28.0, 29.0, 24.0, 25.0, 23.0, 20.0, 16.0, 22.0, 16.0, 12.0, 19.0, 12.0, 8.0, 8.0, 9.0, 8.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.421875, -12.95166015625, -12.4814453125, -12.01123046875, -11.541015625, -11.07080078125, -10.6005859375, -10.13037109375, -9.66015625, -9.18994140625, -8.7197265625, -8.24951171875, -7.779296875, -7.30908203125, -6.8388671875, -6.36865234375, -5.8984375, -5.42822265625, -4.9580078125, -4.48779296875, -4.017578125, -3.54736328125, -3.0771484375, -2.60693359375, -2.13671875, -1.66650390625, -1.1962890625, -0.72607421875, -0.255859375, 0.21435546875, 0.6845703125, 1.15478515625, 1.625, 2.09521484375, 2.5654296875, 3.03564453125, 3.505859375, 3.97607421875, 4.4462890625, 4.91650390625, 5.38671875, 5.85693359375, 6.3271484375, 6.79736328125, 7.267578125, 7.73779296875, 8.2080078125, 8.67822265625, 9.1484375, 9.61865234375, 10.0888671875, 10.55908203125, 11.029296875, 11.49951171875, 11.9697265625, 12.43994140625, 12.91015625, 13.38037109375, 13.8505859375, 14.32080078125, 14.791015625, 15.26123046875, 15.7314453125, 16.20166015625, 16.671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 6.0, 19.0, 28.0, 36.0, 50.0, 75.0, 76.0, 163.0, 226.0, 327.0, 476.0, 739.0, 1212.0, 1730.0, 2922.0, 4570.0, 7553.0, 12372.0, 20568.0, 35916.0, 62108.0, 106695.0, 165496.0, 198060.0, 166544.0, 107582.0, 62913.0, 36303.0, 21015.0, 12447.0, 7506.0, 4539.0, 2822.0, 1857.0, 1269.0, 759.0, 507.0, 352.0, 208.0, 150.0, 96.0, 79.0, 61.0, 36.0, 29.0, 16.0, 9.0, 10.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-15.8515625, -15.3485107421875, -14.845458984375, -14.3424072265625, -13.83935546875, -13.3363037109375, -12.833251953125, -12.3302001953125, -11.8271484375, -11.3240966796875, -10.821044921875, -10.3179931640625, -9.81494140625, -9.3118896484375, -8.808837890625, -8.3057861328125, -7.802734375, -7.2996826171875, -6.796630859375, -6.2935791015625, -5.79052734375, -5.2874755859375, -4.784423828125, -4.2813720703125, -3.7783203125, -3.2752685546875, -2.772216796875, -2.2691650390625, -1.76611328125, -1.2630615234375, -0.760009765625, -0.2569580078125, 0.24609375, 0.7491455078125, 1.252197265625, 1.7552490234375, 2.25830078125, 2.7613525390625, 3.264404296875, 3.7674560546875, 4.2705078125, 4.7735595703125, 5.276611328125, 5.7796630859375, 6.28271484375, 6.7857666015625, 7.288818359375, 7.7918701171875, 8.294921875, 8.7979736328125, 9.301025390625, 9.8040771484375, 10.30712890625, 10.8101806640625, 11.313232421875, 11.8162841796875, 12.3193359375, 12.8223876953125, 13.325439453125, 13.8284912109375, 14.33154296875, 14.8345947265625, 15.337646484375, 15.8406982421875, 16.34375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 10.0, 4.0, 11.0, 8.0, 11.0, 19.0, 16.0, 19.0, 34.0, 23.0, 35.0, 37.0, 56.0, 68.0, 58.0, 76.0, 69.0, 62.0, 66.0, 62.0, 47.0, 39.0, 36.0, 23.0, 20.0, 19.0, 21.0, 10.0, 10.0, 9.0, 4.0, 9.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018014907836914062, -0.0017462968826293945, -0.0016911029815673828, -0.001635909080505371, -0.0015807151794433594, -0.0015255212783813477, -0.001470327377319336, -0.0014151334762573242, -0.0013599395751953125, -0.0013047456741333008, -0.001249551773071289, -0.0011943578720092773, -0.0011391639709472656, -0.001083970069885254, -0.0010287761688232422, -0.0009735822677612305, -0.0009183883666992188, -0.000863194465637207, -0.0008080005645751953, -0.0007528066635131836, -0.0006976127624511719, -0.0006424188613891602, -0.0005872249603271484, -0.0005320310592651367, -0.000476837158203125, -0.0004216432571411133, -0.00036644935607910156, -0.00031125545501708984, -0.0002560615539550781, -0.0002008676528930664, -0.0001456737518310547, -9.047985076904297e-05, -3.528594970703125e-05, 1.990795135498047e-05, 7.510185241699219e-05, 0.0001302957534790039, 0.00018548965454101562, 0.00024068355560302734, 0.00029587745666503906, 0.0003510713577270508, 0.0004062652587890625, 0.0004614591598510742, 0.0005166530609130859, 0.0005718469619750977, 0.0006270408630371094, 0.0006822347640991211, 0.0007374286651611328, 0.0007926225662231445, 0.0008478164672851562, 0.000903010368347168, 0.0009582042694091797, 0.0010133981704711914, 0.0010685920715332031, 0.0011237859725952148, 0.0011789798736572266, 0.0012341737747192383, 0.00128936767578125, 0.0013445615768432617, 0.0013997554779052734, 0.0014549493789672852, 0.0015101432800292969, 0.0015653371810913086, 0.0016205310821533203, 0.001675724983215332, 0.0017309188842773438]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 6.0, 10.0, 12.0, 18.0, 20.0, 38.0, 47.0, 62.0, 103.0, 143.0, 230.0, 353.0, 505.0, 781.0, 1192.0, 1808.0, 3048.0, 5173.0, 8470.0, 14556.0, 25827.0, 45556.0, 79502.0, 131580.0, 184062.0, 191367.0, 143936.0, 89211.0, 51105.0, 29025.0, 16311.0, 9698.0, 5567.0, 3312.0, 2073.0, 1312.0, 863.0, 540.0, 361.0, 215.0, 192.0, 116.0, 85.0, 54.0, 34.0, 27.0, 15.0, 10.0, 8.0, 10.0, 4.0, 1.0, 4.0, 3.0], "bins": [-17.09375, -16.6068115234375, -16.119873046875, -15.6329345703125, -15.14599609375, -14.6590576171875, -14.172119140625, -13.6851806640625, -13.1982421875, -12.7113037109375, -12.224365234375, -11.7374267578125, -11.25048828125, -10.7635498046875, -10.276611328125, -9.7896728515625, -9.302734375, -8.8157958984375, -8.328857421875, -7.8419189453125, -7.35498046875, -6.8680419921875, -6.381103515625, -5.8941650390625, -5.4072265625, -4.9202880859375, -4.433349609375, -3.9464111328125, -3.45947265625, -2.9725341796875, -2.485595703125, -1.9986572265625, -1.51171875, -1.0247802734375, -0.537841796875, -0.0509033203125, 0.43603515625, 0.9229736328125, 1.409912109375, 1.8968505859375, 2.3837890625, 2.8707275390625, 3.357666015625, 3.8446044921875, 4.33154296875, 4.8184814453125, 5.305419921875, 5.7923583984375, 6.279296875, 6.7662353515625, 7.253173828125, 7.7401123046875, 8.22705078125, 8.7139892578125, 9.200927734375, 9.6878662109375, 10.1748046875, 10.6617431640625, 11.148681640625, 11.6356201171875, 12.12255859375, 12.6094970703125, 13.096435546875, 13.5833740234375, 14.0703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 1.0, 7.0, 10.0, 16.0, 12.0, 7.0, 27.0, 23.0, 23.0, 33.0, 48.0, 40.0, 56.0, 48.0, 61.0, 47.0, 67.0, 56.0, 50.0, 45.0, 42.0, 47.0, 45.0, 36.0, 27.0, 31.0, 18.0, 20.0, 17.0, 5.0, 7.0, 9.0, 8.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.43359375, -7.2098388671875, -6.986083984375, -6.7623291015625, -6.53857421875, -6.3148193359375, -6.091064453125, -5.8673095703125, -5.6435546875, -5.4197998046875, -5.196044921875, -4.9722900390625, -4.74853515625, -4.5247802734375, -4.301025390625, -4.0772705078125, -3.853515625, -3.6297607421875, -3.406005859375, -3.1822509765625, -2.95849609375, -2.7347412109375, -2.510986328125, -2.2872314453125, -2.0634765625, -1.8397216796875, -1.615966796875, -1.3922119140625, -1.16845703125, -0.9447021484375, -0.720947265625, -0.4971923828125, -0.2734375, -0.0496826171875, 0.174072265625, 0.3978271484375, 0.62158203125, 0.8453369140625, 1.069091796875, 1.2928466796875, 1.5166015625, 1.7403564453125, 1.964111328125, 2.1878662109375, 2.41162109375, 2.6353759765625, 2.859130859375, 3.0828857421875, 3.306640625, 3.5303955078125, 3.754150390625, 3.9779052734375, 4.20166015625, 4.4254150390625, 4.649169921875, 4.8729248046875, 5.0966796875, 5.3204345703125, 5.544189453125, 5.7679443359375, 5.99169921875, 6.2154541015625, 6.439208984375, 6.6629638671875, 6.88671875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 8.0, 13.0, 10.0, 13.0, 11.0, 12.0, 25.0, 31.0, 24.0, 34.0, 45.0, 37.0, 55.0, 50.0, 44.0, 62.0, 44.0, 64.0, 60.0, 44.0, 62.0, 36.0, 36.0, 39.0, 27.0, 21.0, 18.0, 10.0, 11.0, 12.0, 10.0, 13.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.07898712158203, -34.102783203125, -33.12657928466797, -32.15037536621094, -31.17417335510254, -30.19797134399414, -29.22176742553711, -28.245563507080078, -27.26936149597168, -26.29315757751465, -25.31695556640625, -24.34075164794922, -23.364547729492188, -22.38834571838379, -21.412141799926758, -20.43593978881836, -19.459735870361328, -18.483531951904297, -17.5073299407959, -16.531126022338867, -15.554923057556152, -14.578720092773438, -13.602516174316406, -12.626313209533691, -11.650108337402344, -10.673905372619629, -9.697701454162598, -8.721498489379883, -7.745295524597168, -6.769092082977295, -5.792888641357422, -4.816685676574707, -3.840482711791992, -2.8642795085906982, -1.8880761861801147, -0.9118728637695312, 0.0643303394317627, 1.0405335426330566, 2.0167369842529297, 2.9929399490356445, 3.9691433906555176, 4.945346832275391, 5.9215497970581055, 6.8977532386779785, 7.873956680297852, 8.850159645080566, 9.826362609863281, 10.802566528320312, 11.778769493103027, 12.754972457885742, 13.731176376342773, 14.707379341125488, 15.683582305908203, 16.659786224365234, 17.635990142822266, 18.612192153930664, 19.588396072387695, 20.564599990844727, 21.540802001953125, 22.517005920410156, 23.493209838867188, 24.469411849975586, 25.445615768432617, 26.421817779541016, 27.398021697998047]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 4.0, 7.0, 12.0, 5.0, 7.0, 11.0, 14.0, 23.0, 19.0, 27.0, 19.0, 46.0, 40.0, 36.0, 44.0, 36.0, 50.0, 45.0, 53.0, 29.0, 55.0, 49.0, 52.0, 40.0, 26.0, 33.0, 37.0, 33.0, 28.0, 14.0, 16.0, 20.0, 20.0, 12.0, 10.0, 8.0, 6.0, 2.0, 5.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.11524200439453, -27.210716247558594, -26.306190490722656, -25.40166473388672, -24.497140884399414, -23.592615127563477, -22.68808937072754, -21.7835636138916, -20.879039764404297, -19.97451400756836, -19.069988250732422, -18.165462493896484, -17.26093864440918, -16.356412887573242, -15.451887130737305, -14.547361373901367, -13.64283561706543, -12.738309860229492, -11.833785057067871, -10.929259300231934, -10.024734497070312, -9.120208740234375, -8.215682983398438, -7.311157703399658, -6.406632423400879, -5.5021071434021, -4.59758186340332, -3.693056106567383, -2.7885308265686035, -1.8840055465698242, -0.9794797897338867, -0.07495450973510742, 0.8295688629150391, 1.734094262123108, 2.6386196613311768, 3.543145179748535, 4.4476704597473145, 5.352195739746094, 6.256721496582031, 7.1612467765808105, 8.06577205657959, 8.970297813415527, 9.874822616577148, 10.779348373413086, 11.683874130249023, 12.588398933410645, 13.492924690246582, 14.397449493408203, 15.30197525024414, 16.206501007080078, 17.111026763916016, 18.015552520751953, 18.920076370239258, 19.824602127075195, 20.729127883911133, 21.63365364074707, 22.538177490234375, 23.442703247070312, 24.34722900390625, 25.251754760742188, 26.156278610229492, 27.06080436706543, 27.965330123901367, 28.869855880737305, 29.774381637573242]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 8.0, 8.0, 17.0, 33.0, 43.0, 67.0, 98.0, 159.0, 249.0, 473.0, 725.0, 1252.0, 2067.0, 3714.0, 6613.0, 12529.0, 24275.0, 48454.0, 104671.0, 242856.0, 578258.0, 1071087.0, 1070192.0, 578315.0, 243804.0, 104971.0, 48566.0, 23868.0, 12156.0, 6477.0, 3557.0, 1982.0, 1131.0, 635.0, 353.0, 233.0, 145.0, 90.0, 50.0, 38.0, 19.0, 21.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-38.28125, -37.12109375, -35.9609375, -34.80078125, -33.640625, -32.48046875, -31.3203125, -30.16015625, -29.0, -27.83984375, -26.6796875, -25.51953125, -24.359375, -23.19921875, -22.0390625, -20.87890625, -19.71875, -18.55859375, -17.3984375, -16.23828125, -15.078125, -13.91796875, -12.7578125, -11.59765625, -10.4375, -9.27734375, -8.1171875, -6.95703125, -5.796875, -4.63671875, -3.4765625, -2.31640625, -1.15625, 0.00390625, 1.1640625, 2.32421875, 3.484375, 4.64453125, 5.8046875, 6.96484375, 8.125, 9.28515625, 10.4453125, 11.60546875, 12.765625, 13.92578125, 15.0859375, 16.24609375, 17.40625, 18.56640625, 19.7265625, 20.88671875, 22.046875, 23.20703125, 24.3671875, 25.52734375, 26.6875, 27.84765625, 29.0078125, 30.16796875, 31.328125, 32.48828125, 33.6484375, 34.80859375, 35.96875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 5.0, 6.0, 7.0, 9.0, 8.0, 13.0, 18.0, 26.0, 20.0, 27.0, 27.0, 28.0, 38.0, 23.0, 32.0, 39.0, 35.0, 42.0, 63.0, 54.0, 39.0, 49.0, 43.0, 40.0, 31.0, 36.0, 37.0, 32.0, 24.0, 32.0, 14.0, 15.0, 16.0, 15.0, 14.0, 11.0, 14.0, 6.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.421875, -22.67822265625, -21.9345703125, -21.19091796875, -20.447265625, -19.70361328125, -18.9599609375, -18.21630859375, -17.47265625, -16.72900390625, -15.9853515625, -15.24169921875, -14.498046875, -13.75439453125, -13.0107421875, -12.26708984375, -11.5234375, -10.77978515625, -10.0361328125, -9.29248046875, -8.548828125, -7.80517578125, -7.0615234375, -6.31787109375, -5.57421875, -4.83056640625, -4.0869140625, -3.34326171875, -2.599609375, -1.85595703125, -1.1123046875, -0.36865234375, 0.375, 1.11865234375, 1.8623046875, 2.60595703125, 3.349609375, 4.09326171875, 4.8369140625, 5.58056640625, 6.32421875, 7.06787109375, 7.8115234375, 8.55517578125, 9.298828125, 10.04248046875, 10.7861328125, 11.52978515625, 12.2734375, 13.01708984375, 13.7607421875, 14.50439453125, 15.248046875, 15.99169921875, 16.7353515625, 17.47900390625, 18.22265625, 18.96630859375, 19.7099609375, 20.45361328125, 21.197265625, 21.94091796875, 22.6845703125, 23.42822265625, 24.171875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 7.0, 17.0, 29.0, 33.0, 48.0, 80.0, 99.0, 165.0, 260.0, 386.0, 597.0, 924.0, 1589.0, 2446.0, 3959.0, 6652.0, 11240.0, 19858.0, 34548.0, 62489.0, 116482.0, 218598.0, 403444.0, 684918.0, 888257.0, 741117.0, 453210.0, 246968.0, 131644.0, 71543.0, 38813.0, 21966.0, 12710.0, 7436.0, 4383.0, 2734.0, 1720.0, 1060.0, 658.0, 415.0, 242.0, 190.0, 116.0, 80.0, 57.0, 35.0, 29.0, 12.0, 6.0, 11.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-30.71875, -29.71484375, -28.7109375, -27.70703125, -26.703125, -25.69921875, -24.6953125, -23.69140625, -22.6875, -21.68359375, -20.6796875, -19.67578125, -18.671875, -17.66796875, -16.6640625, -15.66015625, -14.65625, -13.65234375, -12.6484375, -11.64453125, -10.640625, -9.63671875, -8.6328125, -7.62890625, -6.625, -5.62109375, -4.6171875, -3.61328125, -2.609375, -1.60546875, -0.6015625, 0.40234375, 1.40625, 2.41015625, 3.4140625, 4.41796875, 5.421875, 6.42578125, 7.4296875, 8.43359375, 9.4375, 10.44140625, 11.4453125, 12.44921875, 13.453125, 14.45703125, 15.4609375, 16.46484375, 17.46875, 18.47265625, 19.4765625, 20.48046875, 21.484375, 22.48828125, 23.4921875, 24.49609375, 25.5, 26.50390625, 27.5078125, 28.51171875, 29.515625, 30.51953125, 31.5234375, 32.52734375, 33.53125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 3.0, 10.0, 12.0, 19.0, 20.0, 26.0, 27.0, 55.0, 55.0, 74.0, 89.0, 97.0, 130.0, 190.0, 189.0, 215.0, 236.0, 269.0, 236.0, 291.0, 267.0, 243.0, 241.0, 161.0, 165.0, 140.0, 134.0, 96.0, 76.0, 55.0, 49.0, 37.0, 34.0, 31.0, 17.0, 21.0, 13.0, 9.0, 9.0, 8.0, 5.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.578125, -12.2022705078125, -11.826416015625, -11.4505615234375, -11.07470703125, -10.6988525390625, -10.322998046875, -9.9471435546875, -9.5712890625, -9.1954345703125, -8.819580078125, -8.4437255859375, -8.06787109375, -7.6920166015625, -7.316162109375, -6.9403076171875, -6.564453125, -6.1885986328125, -5.812744140625, -5.4368896484375, -5.06103515625, -4.6851806640625, -4.309326171875, -3.9334716796875, -3.5576171875, -3.1817626953125, -2.805908203125, -2.4300537109375, -2.05419921875, -1.6783447265625, -1.302490234375, -0.9266357421875, -0.55078125, -0.1749267578125, 0.200927734375, 0.5767822265625, 0.95263671875, 1.3284912109375, 1.704345703125, 2.0802001953125, 2.4560546875, 2.8319091796875, 3.207763671875, 3.5836181640625, 3.95947265625, 4.3353271484375, 4.711181640625, 5.0870361328125, 5.462890625, 5.8387451171875, 6.214599609375, 6.5904541015625, 6.96630859375, 7.3421630859375, 7.718017578125, 8.0938720703125, 8.4697265625, 8.8455810546875, 9.221435546875, 9.5972900390625, 9.97314453125, 10.3489990234375, 10.724853515625, 11.1007080078125, 11.4765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 4.0, 7.0, 5.0, 13.0, 11.0, 11.0, 11.0, 12.0, 18.0, 28.0, 25.0, 32.0, 26.0, 39.0, 40.0, 42.0, 57.0, 44.0, 60.0, 61.0, 43.0, 48.0, 31.0, 43.0, 39.0, 46.0, 30.0, 24.0, 15.0, 23.0, 18.0, 19.0, 13.0, 14.0, 10.0, 9.0, 2.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.190847396850586, -29.326860427856445, -28.462871551513672, -27.59888458251953, -26.73489761352539, -25.870908737182617, -25.006921768188477, -24.142932891845703, -23.278945922851562, -22.414958953857422, -21.55097007751465, -20.686983108520508, -19.822996139526367, -18.959007263183594, -18.095020294189453, -17.231033325195312, -16.367046356201172, -15.503058433532715, -14.639071464538574, -13.775083541870117, -12.91109561920166, -12.047107696533203, -11.183120727539062, -10.319132804870605, -9.455144882202148, -8.591156959533691, -7.727169513702393, -6.863182067871094, -5.999194145202637, -5.135206699371338, -4.271219253540039, -3.407231330871582, -2.543243408203125, -1.679255723953247, -0.8152681589126587, 0.04871940612792969, 0.9127070903778076, 1.7766947746276855, 2.6406822204589844, 3.5046701431274414, 4.36865758895874, 5.232645034790039, 6.096632957458496, 6.960620403289795, 7.824607849121094, 8.68859577178955, 9.552583694458008, 10.416570663452148, 11.280558586120605, 12.144546508789062, 13.008533477783203, 13.87252140045166, 14.736509323120117, 15.600496292114258, 16.46448516845703, 17.328472137451172, 18.192459106445312, 19.056446075439453, 19.920434951782227, 20.784421920776367, 21.648408889770508, 22.51239776611328, 23.376384735107422, 24.240371704101562, 25.104360580444336]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 4.0, 12.0, 6.0, 10.0, 13.0, 18.0, 18.0, 17.0, 29.0, 29.0, 21.0, 36.0, 39.0, 35.0, 43.0, 30.0, 46.0, 43.0, 34.0, 46.0, 42.0, 34.0, 51.0, 30.0, 44.0, 36.0, 32.0, 22.0, 24.0, 18.0, 24.0, 20.0, 9.0, 18.0, 9.0, 9.0, 11.0, 8.0, 3.0, 7.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.226667404174805, -26.397836685180664, -25.56900405883789, -24.74017333984375, -23.91134262084961, -23.082509994506836, -22.253679275512695, -21.424846649169922, -20.59601593017578, -19.76718521118164, -18.938352584838867, -18.109521865844727, -17.280689239501953, -16.451858520507812, -15.623027801513672, -14.794196128845215, -13.965364456176758, -13.1365327835083, -12.307701110839844, -11.478870391845703, -10.650038719177246, -9.821207046508789, -8.992376327514648, -8.163544654846191, -7.334712982177734, -6.505881309509277, -5.6770501136779785, -4.84821891784668, -4.019387245178223, -3.1905555725097656, -2.361724376678467, -1.532893180847168, -0.7040634155273438, 0.12476801872253418, 0.9535994529724121, 1.78243088722229, 2.611262321472168, 3.440093994140625, 4.268925189971924, 5.097756385803223, 5.92658805847168, 6.755419731140137, 7.5842509269714355, 8.413082122802734, 9.241913795471191, 10.070745468139648, 10.899576187133789, 11.728407859802246, 12.557239532470703, 13.38607120513916, 14.214902877807617, 15.043733596801758, 15.872565269470215, 16.701396942138672, 17.530227661132812, 18.359058380126953, 19.187891006469727, 20.016721725463867, 20.84555435180664, 21.67438507080078, 22.503215789794922, 23.332048416137695, 24.160879135131836, 24.98971176147461, 25.81854248046875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 0.0, 6.0, 4.0, 6.0, 26.0, 23.0, 37.0, 59.0, 67.0, 123.0, 201.0, 299.0, 465.0, 730.0, 1112.0, 1729.0, 2608.0, 4036.0, 6531.0, 9884.0, 15115.0, 23893.0, 35885.0, 54803.0, 80902.0, 112115.0, 139688.0, 145950.0, 126753.0, 94682.0, 65279.0, 43953.0, 28962.0, 18501.0, 12237.0, 7736.0, 5010.0, 3201.0, 2092.0, 1368.0, 844.0, 599.0, 372.0, 233.0, 171.0, 108.0, 63.0, 35.0, 22.0, 15.0, 8.0, 9.0, 8.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.859375, -11.4796142578125, -11.099853515625, -10.7200927734375, -10.34033203125, -9.9605712890625, -9.580810546875, -9.2010498046875, -8.8212890625, -8.4415283203125, -8.061767578125, -7.6820068359375, -7.30224609375, -6.9224853515625, -6.542724609375, -6.1629638671875, -5.783203125, -5.4034423828125, -5.023681640625, -4.6439208984375, -4.26416015625, -3.8843994140625, -3.504638671875, -3.1248779296875, -2.7451171875, -2.3653564453125, -1.985595703125, -1.6058349609375, -1.22607421875, -0.8463134765625, -0.466552734375, -0.0867919921875, 0.29296875, 0.6727294921875, 1.052490234375, 1.4322509765625, 1.81201171875, 2.1917724609375, 2.571533203125, 2.9512939453125, 3.3310546875, 3.7108154296875, 4.090576171875, 4.4703369140625, 4.85009765625, 5.2298583984375, 5.609619140625, 5.9893798828125, 6.369140625, 6.7489013671875, 7.128662109375, 7.5084228515625, 7.88818359375, 8.2679443359375, 8.647705078125, 9.0274658203125, 9.4072265625, 9.7869873046875, 10.166748046875, 10.5465087890625, 10.92626953125, 11.3060302734375, 11.685791015625, 12.0655517578125, 12.4453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 0.0, 3.0, 3.0, 5.0, 13.0, 6.0, 10.0, 12.0, 12.0, 13.0, 17.0, 20.0, 21.0, 27.0, 35.0, 28.0, 31.0, 39.0, 38.0, 36.0, 32.0, 31.0, 49.0, 43.0, 49.0, 46.0, 37.0, 43.0, 44.0, 38.0, 38.0, 19.0, 27.0, 20.0, 17.0, 20.0, 14.0, 15.0, 6.0, 12.0, 10.0, 7.0, 3.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 5.0], "bins": [-30.671875, -29.820068359375, -28.96826171875, -28.116455078125, -27.2646484375, -26.412841796875, -25.56103515625, -24.709228515625, -23.857421875, -23.005615234375, -22.15380859375, -21.302001953125, -20.4501953125, -19.598388671875, -18.74658203125, -17.894775390625, -17.04296875, -16.191162109375, -15.33935546875, -14.487548828125, -13.6357421875, -12.783935546875, -11.93212890625, -11.080322265625, -10.228515625, -9.376708984375, -8.52490234375, -7.673095703125, -6.8212890625, -5.969482421875, -5.11767578125, -4.265869140625, -3.4140625, -2.562255859375, -1.71044921875, -0.858642578125, -0.0068359375, 0.844970703125, 1.69677734375, 2.548583984375, 3.400390625, 4.252197265625, 5.10400390625, 5.955810546875, 6.8076171875, 7.659423828125, 8.51123046875, 9.363037109375, 10.21484375, 11.066650390625, 11.91845703125, 12.770263671875, 13.6220703125, 14.473876953125, 15.32568359375, 16.177490234375, 17.029296875, 17.881103515625, 18.73291015625, 19.584716796875, 20.4365234375, 21.288330078125, 22.14013671875, 22.991943359375, 23.84375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 2.0, 5.0, 7.0, 14.0, 17.0, 23.0, 22.0, 46.0, 46.0, 97.0, 117.0, 187.0, 227.0, 348.0, 544.0, 813.0, 1238.0, 1991.0, 2982.0, 4706.0, 7807.0, 12802.0, 20791.0, 34093.0, 56425.0, 90852.0, 136564.0, 173405.0, 167349.0, 124520.0, 81333.0, 50010.0, 30072.0, 18676.0, 11300.0, 6842.0, 4454.0, 2742.0, 1703.0, 1178.0, 701.0, 454.0, 337.0, 236.0, 149.0, 105.0, 72.0, 50.0, 26.0, 22.0, 22.0, 14.0, 7.0, 8.0, 5.0, 2.0, 3.0, 0.0, 2.0, 4.0], "bins": [-14.9453125, -14.4764404296875, -14.007568359375, -13.5386962890625, -13.06982421875, -12.6009521484375, -12.132080078125, -11.6632080078125, -11.1943359375, -10.7254638671875, -10.256591796875, -9.7877197265625, -9.31884765625, -8.8499755859375, -8.381103515625, -7.9122314453125, -7.443359375, -6.9744873046875, -6.505615234375, -6.0367431640625, -5.56787109375, -5.0989990234375, -4.630126953125, -4.1612548828125, -3.6923828125, -3.2235107421875, -2.754638671875, -2.2857666015625, -1.81689453125, -1.3480224609375, -0.879150390625, -0.4102783203125, 0.05859375, 0.5274658203125, 0.996337890625, 1.4652099609375, 1.93408203125, 2.4029541015625, 2.871826171875, 3.3406982421875, 3.8095703125, 4.2784423828125, 4.747314453125, 5.2161865234375, 5.68505859375, 6.1539306640625, 6.622802734375, 7.0916748046875, 7.560546875, 8.0294189453125, 8.498291015625, 8.9671630859375, 9.43603515625, 9.9049072265625, 10.373779296875, 10.8426513671875, 11.3115234375, 11.7803955078125, 12.249267578125, 12.7181396484375, 13.18701171875, 13.6558837890625, 14.124755859375, 14.5936279296875, 15.0625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 7.0, 4.0, 8.0, 9.0, 7.0, 13.0, 18.0, 14.0, 13.0, 16.0, 18.0, 19.0, 21.0, 17.0, 31.0, 33.0, 26.0, 30.0, 34.0, 30.0, 35.0, 32.0, 35.0, 34.0, 43.0, 34.0, 29.0, 26.0, 34.0, 45.0, 39.0, 26.0, 25.0, 24.0, 26.0, 19.0, 13.0, 18.0, 18.0, 10.0, 12.0, 8.0, 9.0, 10.0, 5.0, 8.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 4.0], "bins": [-15.0625, -14.6107177734375, -14.158935546875, -13.7071533203125, -13.25537109375, -12.8035888671875, -12.351806640625, -11.9000244140625, -11.4482421875, -10.9964599609375, -10.544677734375, -10.0928955078125, -9.64111328125, -9.1893310546875, -8.737548828125, -8.2857666015625, -7.833984375, -7.3822021484375, -6.930419921875, -6.4786376953125, -6.02685546875, -5.5750732421875, -5.123291015625, -4.6715087890625, -4.2197265625, -3.7679443359375, -3.316162109375, -2.8643798828125, -2.41259765625, -1.9608154296875, -1.509033203125, -1.0572509765625, -0.60546875, -0.1536865234375, 0.298095703125, 0.7498779296875, 1.20166015625, 1.6534423828125, 2.105224609375, 2.5570068359375, 3.0087890625, 3.4605712890625, 3.912353515625, 4.3641357421875, 4.81591796875, 5.2677001953125, 5.719482421875, 6.1712646484375, 6.623046875, 7.0748291015625, 7.526611328125, 7.9783935546875, 8.43017578125, 8.8819580078125, 9.333740234375, 9.7855224609375, 10.2373046875, 10.6890869140625, 11.140869140625, 11.5926513671875, 12.04443359375, 12.4962158203125, 12.947998046875, 13.3997802734375, 13.8515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 12.0, 6.0, 24.0, 19.0, 25.0, 46.0, 47.0, 89.0, 140.0, 244.0, 288.0, 468.0, 775.0, 1274.0, 2142.0, 3972.0, 7513.0, 15506.0, 35021.0, 85195.0, 202755.0, 322757.0, 210494.0, 89111.0, 36788.0, 16117.0, 7791.0, 4152.0, 2237.0, 1276.0, 835.0, 491.0, 317.0, 188.0, 126.0, 103.0, 75.0, 39.0, 30.0, 26.0, 13.0, 12.0, 8.0, 5.0, 0.0, 6.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-8.9140625, -8.6558837890625, -8.397705078125, -8.1395263671875, -7.88134765625, -7.6231689453125, -7.364990234375, -7.1068115234375, -6.8486328125, -6.5904541015625, -6.332275390625, -6.0740966796875, -5.81591796875, -5.5577392578125, -5.299560546875, -5.0413818359375, -4.783203125, -4.5250244140625, -4.266845703125, -4.0086669921875, -3.75048828125, -3.4923095703125, -3.234130859375, -2.9759521484375, -2.7177734375, -2.4595947265625, -2.201416015625, -1.9432373046875, -1.68505859375, -1.4268798828125, -1.168701171875, -0.9105224609375, -0.65234375, -0.3941650390625, -0.135986328125, 0.1221923828125, 0.38037109375, 0.6385498046875, 0.896728515625, 1.1549072265625, 1.4130859375, 1.6712646484375, 1.929443359375, 2.1876220703125, 2.44580078125, 2.7039794921875, 2.962158203125, 3.2203369140625, 3.478515625, 3.7366943359375, 3.994873046875, 4.2530517578125, 4.51123046875, 4.7694091796875, 5.027587890625, 5.2857666015625, 5.5439453125, 5.8021240234375, 6.060302734375, 6.3184814453125, 6.57666015625, 6.8348388671875, 7.093017578125, 7.3511962890625, 7.609375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 11.0, 15.0, 15.0, 18.0, 23.0, 44.0, 41.0, 36.0, 61.0, 58.0, 69.0, 68.0, 77.0, 64.0, 59.0, 52.0, 47.0, 45.0, 34.0, 25.0, 24.0, 12.0, 10.0, 20.0, 8.0, 9.0, 8.0, 5.0, 2.0, 1.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00060272216796875, -0.0005843937397003174, -0.0005660653114318848, -0.0005477368831634521, -0.0005294084548950195, -0.0005110800266265869, -0.0004927515983581543, -0.0004744231700897217, -0.00045609474182128906, -0.00043776631355285645, -0.00041943788528442383, -0.0004011094570159912, -0.0003827810287475586, -0.000364452600479126, -0.00034612417221069336, -0.00032779574394226074, -0.0003094673156738281, -0.0002911388874053955, -0.0002728104591369629, -0.0002544820308685303, -0.00023615360260009766, -0.00021782517433166504, -0.00019949674606323242, -0.0001811683177947998, -0.0001628398895263672, -0.00014451146125793457, -0.00012618303298950195, -0.00010785460472106934, -8.952617645263672e-05, -7.11977481842041e-05, -5.2869319915771484e-05, -3.454089164733887e-05, -1.621246337890625e-05, 2.115964889526367e-06, 2.0444393157958984e-05, 3.87728214263916e-05, 5.710124969482422e-05, 7.542967796325684e-05, 9.375810623168945e-05, 0.00011208653450012207, 0.0001304149627685547, 0.0001487433910369873, 0.00016707181930541992, 0.00018540024757385254, 0.00020372867584228516, 0.00022205710411071777, 0.0002403855323791504, 0.000258713960647583, 0.0002770423889160156, 0.00029537081718444824, 0.00031369924545288086, 0.0003320276737213135, 0.0003503561019897461, 0.0003686845302581787, 0.00038701295852661133, 0.00040534138679504395, 0.00042366981506347656, 0.0004419982433319092, 0.0004603266716003418, 0.0004786550998687744, 0.000496983528137207, 0.0005153119564056396, 0.0005336403846740723, 0.0005519688129425049, 0.0005702972412109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 1.0, 5.0, 7.0, 10.0, 15.0, 18.0, 29.0, 36.0, 55.0, 84.0, 110.0, 175.0, 213.0, 321.0, 519.0, 782.0, 1316.0, 2124.0, 3543.0, 6270.0, 11387.0, 22677.0, 46269.0, 97274.0, 190581.0, 265014.0, 197563.0, 101822.0, 48752.0, 23519.0, 11859.0, 6563.0, 3651.0, 2177.0, 1340.0, 832.0, 508.0, 367.0, 232.0, 158.0, 115.0, 72.0, 53.0, 44.0, 29.0, 18.0, 12.0, 16.0, 8.0, 3.0, 0.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-8.2421875, -7.98883056640625, -7.7354736328125, -7.48211669921875, -7.228759765625, -6.97540283203125, -6.7220458984375, -6.46868896484375, -6.21533203125, -5.96197509765625, -5.7086181640625, -5.45526123046875, -5.201904296875, -4.94854736328125, -4.6951904296875, -4.44183349609375, -4.1884765625, -3.93511962890625, -3.6817626953125, -3.42840576171875, -3.175048828125, -2.92169189453125, -2.6683349609375, -2.41497802734375, -2.16162109375, -1.90826416015625, -1.6549072265625, -1.40155029296875, -1.148193359375, -0.89483642578125, -0.6414794921875, -0.38812255859375, -0.134765625, 0.11859130859375, 0.3719482421875, 0.62530517578125, 0.878662109375, 1.13201904296875, 1.3853759765625, 1.63873291015625, 1.89208984375, 2.14544677734375, 2.3988037109375, 2.65216064453125, 2.905517578125, 3.15887451171875, 3.4122314453125, 3.66558837890625, 3.9189453125, 4.17230224609375, 4.4256591796875, 4.67901611328125, 4.932373046875, 5.18572998046875, 5.4390869140625, 5.69244384765625, 5.94580078125, 6.19915771484375, 6.4525146484375, 6.70587158203125, 6.959228515625, 7.21258544921875, 7.4659423828125, 7.71929931640625, 7.97265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 10.0, 14.0, 18.0, 26.0, 35.0, 43.0, 68.0, 84.0, 78.0, 104.0, 121.0, 86.0, 76.0, 60.0, 47.0, 28.0, 22.0, 18.0, 7.0, 9.0, 11.0, 8.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.451171875, -3.335845947265625, -3.22052001953125, -3.105194091796875, -2.9898681640625, -2.874542236328125, -2.75921630859375, -2.643890380859375, -2.528564453125, -2.413238525390625, -2.29791259765625, -2.182586669921875, -2.0672607421875, -1.951934814453125, -1.83660888671875, -1.721282958984375, -1.60595703125, -1.490631103515625, -1.37530517578125, -1.259979248046875, -1.1446533203125, -1.029327392578125, -0.91400146484375, -0.798675537109375, -0.683349609375, -0.568023681640625, -0.45269775390625, -0.337371826171875, -0.2220458984375, -0.106719970703125, 0.00860595703125, 0.123931884765625, 0.2392578125, 0.354583740234375, 0.46990966796875, 0.585235595703125, 0.7005615234375, 0.815887451171875, 0.93121337890625, 1.046539306640625, 1.161865234375, 1.277191162109375, 1.39251708984375, 1.507843017578125, 1.6231689453125, 1.738494873046875, 1.85382080078125, 1.969146728515625, 2.08447265625, 2.199798583984375, 2.31512451171875, 2.430450439453125, 2.5457763671875, 2.661102294921875, 2.77642822265625, 2.891754150390625, 3.007080078125, 3.122406005859375, 3.23773193359375, 3.353057861328125, 3.4683837890625, 3.583709716796875, 3.69903564453125, 3.814361572265625, 3.9296875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 3.0, 10.0, 11.0, 6.0, 5.0, 9.0, 16.0, 15.0, 13.0, 13.0, 26.0, 30.0, 34.0, 34.0, 52.0, 44.0, 53.0, 40.0, 46.0, 71.0, 65.0, 41.0, 38.0, 47.0, 48.0, 35.0, 31.0, 28.0, 26.0, 14.0, 14.0, 15.0, 19.0, 14.0, 6.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.694002151489258, -30.791574478149414, -29.88914680480957, -28.986719131469727, -28.084291458129883, -27.18186378479004, -26.279436111450195, -25.37700843811035, -24.474580764770508, -23.572153091430664, -22.66972541809082, -21.767297744750977, -20.864870071411133, -19.96244239807129, -19.060014724731445, -18.1575870513916, -17.255159378051758, -16.352731704711914, -15.45030403137207, -14.547876358032227, -13.645448684692383, -12.743021011352539, -11.840593338012695, -10.938165664672852, -10.035737991333008, -9.133310317993164, -8.23088264465332, -7.328454971313477, -6.426027297973633, -5.523599624633789, -4.621171951293945, -3.7187442779541016, -2.816316604614258, -1.913888931274414, -1.0114612579345703, -0.10903358459472656, 0.7933940887451172, 1.695821762084961, 2.5982494354248047, 3.5006771087646484, 4.403104782104492, 5.305532455444336, 6.20796012878418, 7.110387802124023, 8.012815475463867, 8.915243148803711, 9.817670822143555, 10.720098495483398, 11.622526168823242, 12.524953842163086, 13.42738151550293, 14.329809188842773, 15.232236862182617, 16.13466453552246, 17.037092208862305, 17.93951988220215, 18.841947555541992, 19.744375228881836, 20.64680290222168, 21.549230575561523, 22.451658248901367, 23.35408592224121, 24.256513595581055, 25.1589412689209, 26.061368942260742]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 6.0, 2.0, 5.0, 5.0, 10.0, 10.0, 6.0, 12.0, 16.0, 20.0, 19.0, 26.0, 23.0, 30.0, 22.0, 32.0, 40.0, 39.0, 39.0, 41.0, 50.0, 37.0, 34.0, 44.0, 46.0, 36.0, 43.0, 36.0, 31.0, 40.0, 22.0, 22.0, 30.0, 21.0, 20.0, 13.0, 17.0, 6.0, 12.0, 12.0, 5.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-27.143665313720703, -26.327356338500977, -25.511049270629883, -24.694740295410156, -23.878433227539062, -23.062124252319336, -22.24581527709961, -21.429508209228516, -20.61319923400879, -19.796890258789062, -18.98058319091797, -18.164274215698242, -17.347965240478516, -16.531658172607422, -15.715349197387695, -14.899041175842285, -14.082733154296875, -13.266425132751465, -12.450117111206055, -11.633808135986328, -10.817500114440918, -10.001192092895508, -9.184883117675781, -8.368575096130371, -7.552267074584961, -6.735959053039551, -5.919650554656982, -5.103342056274414, -4.287034034729004, -3.4707260131835938, -2.6544175148010254, -1.838109016418457, -1.0218009948730469, -0.20549273490905762, 0.6108155250549316, 1.427123785018921, 2.24343204498291, 3.0597400665283203, 3.8760485649108887, 4.692357063293457, 5.508665084838867, 6.324973106384277, 7.141281604766846, 7.957590103149414, 8.773898124694824, 9.590206146240234, 10.406515121459961, 11.222823143005371, 12.039131164550781, 12.855439186096191, 13.671747207641602, 14.488056182861328, 15.304364204406738, 16.12067222595215, 16.936981201171875, 17.75328826904297, 18.569597244262695, 19.385906219482422, 20.202213287353516, 21.018522262573242, 21.83483123779297, 22.651138305664062, 23.46744728088379, 24.283756256103516, 25.10006332397461]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 9.0, 11.0, 13.0, 25.0, 54.0, 88.0, 121.0, 203.0, 299.0, 421.0, 703.0, 1098.0, 1724.0, 2577.0, 4027.0, 6127.0, 9359.0, 14524.0, 21688.0, 32774.0, 48272.0, 68588.0, 91370.0, 112651.0, 125655.0, 123659.0, 107670.0, 84395.0, 62137.0, 43224.0, 29043.0, 19441.0, 12804.0, 8273.0, 5508.0, 3551.0, 2266.0, 1470.0, 958.0, 633.0, 401.0, 260.0, 186.0, 112.0, 64.0, 56.0, 28.0, 20.0, 14.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.453125, -20.7578125, -20.0625, -19.3671875, -18.671875, -17.9765625, -17.28125, -16.5859375, -15.890625, -15.1953125, -14.5, -13.8046875, -13.109375, -12.4140625, -11.71875, -11.0234375, -10.328125, -9.6328125, -8.9375, -8.2421875, -7.546875, -6.8515625, -6.15625, -5.4609375, -4.765625, -4.0703125, -3.375, -2.6796875, -1.984375, -1.2890625, -0.59375, 0.1015625, 0.796875, 1.4921875, 2.1875, 2.8828125, 3.578125, 4.2734375, 4.96875, 5.6640625, 6.359375, 7.0546875, 7.75, 8.4453125, 9.140625, 9.8359375, 10.53125, 11.2265625, 11.921875, 12.6171875, 13.3125, 14.0078125, 14.703125, 15.3984375, 16.09375, 16.7890625, 17.484375, 18.1796875, 18.875, 19.5703125, 20.265625, 20.9609375, 21.65625, 22.3515625, 23.046875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 6.0, 3.0, 5.0, 13.0, 7.0, 13.0, 18.0, 20.0, 16.0, 25.0, 35.0, 33.0, 21.0, 35.0, 40.0, 30.0, 35.0, 49.0, 44.0, 47.0, 47.0, 47.0, 43.0, 33.0, 35.0, 34.0, 34.0, 29.0, 28.0, 26.0, 20.0, 23.0, 15.0, 14.0, 11.0, 12.0, 8.0, 9.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-25.703125, -24.867431640625, -24.03173828125, -23.196044921875, -22.3603515625, -21.524658203125, -20.68896484375, -19.853271484375, -19.017578125, -18.181884765625, -17.34619140625, -16.510498046875, -15.6748046875, -14.839111328125, -14.00341796875, -13.167724609375, -12.33203125, -11.496337890625, -10.66064453125, -9.824951171875, -8.9892578125, -8.153564453125, -7.31787109375, -6.482177734375, -5.646484375, -4.810791015625, -3.97509765625, -3.139404296875, -2.3037109375, -1.468017578125, -0.63232421875, 0.203369140625, 1.0390625, 1.874755859375, 2.71044921875, 3.546142578125, 4.3818359375, 5.217529296875, 6.05322265625, 6.888916015625, 7.724609375, 8.560302734375, 9.39599609375, 10.231689453125, 11.0673828125, 11.903076171875, 12.73876953125, 13.574462890625, 14.41015625, 15.245849609375, 16.08154296875, 16.917236328125, 17.7529296875, 18.588623046875, 19.42431640625, 20.260009765625, 21.095703125, 21.931396484375, 22.76708984375, 23.602783203125, 24.4384765625, 25.274169921875, 26.10986328125, 26.945556640625, 27.78125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 13.0, 16.0, 34.0, 44.0, 74.0, 100.0, 144.0, 192.0, 319.0, 459.0, 688.0, 1076.0, 1629.0, 2419.0, 3812.0, 6004.0, 9512.0, 14689.0, 23024.0, 35279.0, 53812.0, 78933.0, 106410.0, 130111.0, 139212.0, 126937.0, 100434.0, 72690.0, 49209.0, 32618.0, 20729.0, 13567.0, 8594.0, 5491.0, 3481.0, 2285.0, 1538.0, 956.0, 643.0, 440.0, 313.0, 190.0, 145.0, 94.0, 78.0, 40.0, 22.0, 17.0, 15.0, 9.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-23.984375, -23.1953125, -22.40625, -21.6171875, -20.828125, -20.0390625, -19.25, -18.4609375, -17.671875, -16.8828125, -16.09375, -15.3046875, -14.515625, -13.7265625, -12.9375, -12.1484375, -11.359375, -10.5703125, -9.78125, -8.9921875, -8.203125, -7.4140625, -6.625, -5.8359375, -5.046875, -4.2578125, -3.46875, -2.6796875, -1.890625, -1.1015625, -0.3125, 0.4765625, 1.265625, 2.0546875, 2.84375, 3.6328125, 4.421875, 5.2109375, 6.0, 6.7890625, 7.578125, 8.3671875, 9.15625, 9.9453125, 10.734375, 11.5234375, 12.3125, 13.1015625, 13.890625, 14.6796875, 15.46875, 16.2578125, 17.046875, 17.8359375, 18.625, 19.4140625, 20.203125, 20.9921875, 21.78125, 22.5703125, 23.359375, 24.1484375, 24.9375, 25.7265625, 26.515625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 6.0, 14.0, 10.0, 15.0, 20.0, 14.0, 21.0, 21.0, 23.0, 27.0, 38.0, 28.0, 34.0, 27.0, 33.0, 38.0, 39.0, 42.0, 48.0, 44.0, 48.0, 37.0, 34.0, 33.0, 30.0, 28.0, 33.0, 29.0, 21.0, 34.0, 21.0, 22.0, 9.0, 15.0, 12.0, 9.0, 5.0, 5.0, 3.0, 5.0, 3.0, 5.0, 4.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.703125, -18.15625, -17.609375, -17.0625, -16.515625, -15.96875, -15.421875, -14.875, -14.328125, -13.78125, -13.234375, -12.6875, -12.140625, -11.59375, -11.046875, -10.5, -9.953125, -9.40625, -8.859375, -8.3125, -7.765625, -7.21875, -6.671875, -6.125, -5.578125, -5.03125, -4.484375, -3.9375, -3.390625, -2.84375, -2.296875, -1.75, -1.203125, -0.65625, -0.109375, 0.4375, 0.984375, 1.53125, 2.078125, 2.625, 3.171875, 3.71875, 4.265625, 4.8125, 5.359375, 5.90625, 6.453125, 7.0, 7.546875, 8.09375, 8.640625, 9.1875, 9.734375, 10.28125, 10.828125, 11.375, 11.921875, 12.46875, 13.015625, 13.5625, 14.109375, 14.65625, 15.203125, 15.75, 16.296875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 8.0, 15.0, 15.0, 19.0, 40.0, 54.0, 70.0, 126.0, 149.0, 232.0, 370.0, 533.0, 909.0, 1462.0, 2574.0, 4585.0, 8752.0, 17386.0, 37891.0, 86254.0, 189116.0, 289284.0, 217560.0, 102987.0, 44876.0, 20696.0, 10049.0, 5141.0, 2826.0, 1696.0, 1068.0, 620.0, 374.0, 266.0, 168.0, 121.0, 72.0, 58.0, 35.0, 24.0, 24.0, 14.0, 8.0, 4.0, 3.0, 12.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.203125, -19.520751953125, -18.83837890625, -18.156005859375, -17.4736328125, -16.791259765625, -16.10888671875, -15.426513671875, -14.744140625, -14.061767578125, -13.37939453125, -12.697021484375, -12.0146484375, -11.332275390625, -10.64990234375, -9.967529296875, -9.28515625, -8.602783203125, -7.92041015625, -7.238037109375, -6.5556640625, -5.873291015625, -5.19091796875, -4.508544921875, -3.826171875, -3.143798828125, -2.46142578125, -1.779052734375, -1.0966796875, -0.414306640625, 0.26806640625, 0.950439453125, 1.6328125, 2.315185546875, 2.99755859375, 3.679931640625, 4.3623046875, 5.044677734375, 5.72705078125, 6.409423828125, 7.091796875, 7.774169921875, 8.45654296875, 9.138916015625, 9.8212890625, 10.503662109375, 11.18603515625, 11.868408203125, 12.55078125, 13.233154296875, 13.91552734375, 14.597900390625, 15.2802734375, 15.962646484375, 16.64501953125, 17.327392578125, 18.009765625, 18.692138671875, 19.37451171875, 20.056884765625, 20.7392578125, 21.421630859375, 22.10400390625, 22.786376953125, 23.46875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 10.0, 8.0, 14.0, 9.0, 9.0, 18.0, 17.0, 33.0, 32.0, 50.0, 54.0, 55.0, 56.0, 60.0, 72.0, 70.0, 63.0, 58.0, 57.0, 50.0, 36.0, 30.0, 24.0, 23.0, 17.0, 15.0, 4.0, 9.0, 6.0, 4.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013790130615234375, -0.001329660415649414, -0.0012803077697753906, -0.0012309551239013672, -0.0011816024780273438, -0.0011322498321533203, -0.0010828971862792969, -0.0010335445404052734, -0.00098419189453125, -0.0009348392486572266, -0.0008854866027832031, -0.0008361339569091797, -0.0007867813110351562, -0.0007374286651611328, -0.0006880760192871094, -0.0006387233734130859, -0.0005893707275390625, -0.0005400180816650391, -0.0004906654357910156, -0.0004413127899169922, -0.00039196014404296875, -0.0003426074981689453, -0.0002932548522949219, -0.00024390220642089844, -0.000194549560546875, -0.00014519691467285156, -9.584426879882812e-05, -4.649162292480469e-05, 2.86102294921875e-06, 5.221366882324219e-05, 0.00010156631469726562, 0.00015091896057128906, 0.0002002716064453125, 0.00024962425231933594, 0.0002989768981933594, 0.0003483295440673828, 0.00039768218994140625, 0.0004470348358154297, 0.0004963874816894531, 0.0005457401275634766, 0.0005950927734375, 0.0006444454193115234, 0.0006937980651855469, 0.0007431507110595703, 0.0007925033569335938, 0.0008418560028076172, 0.0008912086486816406, 0.0009405612945556641, 0.0009899139404296875, 0.001039266586303711, 0.0010886192321777344, 0.0011379718780517578, 0.0011873245239257812, 0.0012366771697998047, 0.0012860298156738281, 0.0013353824615478516, 0.001384735107421875, 0.0014340877532958984, 0.0014834403991699219, 0.0015327930450439453, 0.0015821456909179688, 0.0016314983367919922, 0.0016808509826660156, 0.001730203628540039, 0.0017795562744140625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 8.0, 4.0, 16.0, 14.0, 25.0, 24.0, 35.0, 57.0, 74.0, 132.0, 157.0, 237.0, 375.0, 583.0, 933.0, 1490.0, 2501.0, 4356.0, 7365.0, 13831.0, 26200.0, 51618.0, 101228.0, 180098.0, 233411.0, 191809.0, 111108.0, 56640.0, 28978.0, 15117.0, 8416.0, 4656.0, 2644.0, 1577.0, 985.0, 601.0, 384.0, 281.0, 179.0, 112.0, 77.0, 63.0, 44.0, 30.0, 25.0, 12.0, 10.0, 6.0, 11.0, 8.0, 3.0, 0.0, 0.0, 4.0, 3.0, 1.0], "bins": [-17.34375, -16.811279296875, -16.27880859375, -15.746337890625, -15.2138671875, -14.681396484375, -14.14892578125, -13.616455078125, -13.083984375, -12.551513671875, -12.01904296875, -11.486572265625, -10.9541015625, -10.421630859375, -9.88916015625, -9.356689453125, -8.82421875, -8.291748046875, -7.75927734375, -7.226806640625, -6.6943359375, -6.161865234375, -5.62939453125, -5.096923828125, -4.564453125, -4.031982421875, -3.49951171875, -2.967041015625, -2.4345703125, -1.902099609375, -1.36962890625, -0.837158203125, -0.3046875, 0.227783203125, 0.76025390625, 1.292724609375, 1.8251953125, 2.357666015625, 2.89013671875, 3.422607421875, 3.955078125, 4.487548828125, 5.02001953125, 5.552490234375, 6.0849609375, 6.617431640625, 7.14990234375, 7.682373046875, 8.21484375, 8.747314453125, 9.27978515625, 9.812255859375, 10.3447265625, 10.877197265625, 11.40966796875, 11.942138671875, 12.474609375, 13.007080078125, 13.53955078125, 14.072021484375, 14.6044921875, 15.136962890625, 15.66943359375, 16.201904296875, 16.734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 2.0, 5.0, 4.0, 8.0, 9.0, 10.0, 13.0, 16.0, 10.0, 18.0, 22.0, 27.0, 46.0, 30.0, 53.0, 55.0, 44.0, 66.0, 55.0, 54.0, 50.0, 48.0, 56.0, 50.0, 39.0, 47.0, 28.0, 28.0, 15.0, 18.0, 19.0, 11.0, 9.0, 10.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-7.640625, -7.43414306640625, -7.2276611328125, -7.02117919921875, -6.814697265625, -6.60821533203125, -6.4017333984375, -6.19525146484375, -5.98876953125, -5.78228759765625, -5.5758056640625, -5.36932373046875, -5.162841796875, -4.95635986328125, -4.7498779296875, -4.54339599609375, -4.3369140625, -4.13043212890625, -3.9239501953125, -3.71746826171875, -3.510986328125, -3.30450439453125, -3.0980224609375, -2.89154052734375, -2.68505859375, -2.47857666015625, -2.2720947265625, -2.06561279296875, -1.859130859375, -1.65264892578125, -1.4461669921875, -1.23968505859375, -1.033203125, -0.82672119140625, -0.6202392578125, -0.41375732421875, -0.207275390625, -0.00079345703125, 0.2056884765625, 0.41217041015625, 0.61865234375, 0.82513427734375, 1.0316162109375, 1.23809814453125, 1.444580078125, 1.65106201171875, 1.8575439453125, 2.06402587890625, 2.2705078125, 2.47698974609375, 2.6834716796875, 2.88995361328125, 3.096435546875, 3.30291748046875, 3.5093994140625, 3.71588134765625, 3.92236328125, 4.12884521484375, 4.3353271484375, 4.54180908203125, 4.748291015625, 4.95477294921875, 5.1612548828125, 5.36773681640625, 5.57421875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 6.0, 9.0, 7.0, 9.0, 7.0, 12.0, 15.0, 20.0, 26.0, 29.0, 25.0, 33.0, 41.0, 43.0, 52.0, 37.0, 47.0, 49.0, 66.0, 53.0, 68.0, 41.0, 47.0, 37.0, 31.0, 26.0, 29.0, 29.0, 19.0, 12.0, 10.0, 11.0, 7.0, 9.0, 10.0, 5.0, 6.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.415931701660156, -30.511384963989258, -29.60683822631836, -28.702293395996094, -27.797746658325195, -26.893199920654297, -25.9886531829834, -25.0841064453125, -24.179561614990234, -23.275014877319336, -22.370468139648438, -21.465923309326172, -20.561376571655273, -19.656829833984375, -18.752283096313477, -17.847736358642578, -16.94318962097168, -16.03864288330078, -15.1340970993042, -14.2295503616333, -13.325004577636719, -12.42045783996582, -11.515911102294922, -10.611364364624023, -9.706818580627441, -8.802271842956543, -7.897726058959961, -6.9931793212890625, -6.088633060455322, -5.184086799621582, -4.279540061950684, -3.3749938011169434, -2.4704456329345703, -1.5658992528915405, -0.6613528728485107, 0.2431936264038086, 1.1477398872375488, 2.052286148071289, 2.9568328857421875, 3.8613791465759277, 4.765925407409668, 5.670471668243408, 6.575017929077148, 7.479564666748047, 8.384111404418945, 9.288657188415527, 10.193203926086426, 11.097749710083008, 12.002296447753906, 12.906843185424805, 13.811388969421387, 14.715935707092285, 15.620481491088867, 16.525028228759766, 17.429574966430664, 18.334121704101562, 19.238666534423828, 20.143213272094727, 21.047760009765625, 21.95230484008789, 22.85685157775879, 23.761398315429688, 24.665945053100586, 25.570491790771484, 26.475038528442383]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 9.0, 8.0, 12.0, 9.0, 15.0, 11.0, 13.0, 15.0, 22.0, 16.0, 27.0, 26.0, 28.0, 31.0, 28.0, 36.0, 47.0, 51.0, 45.0, 49.0, 49.0, 42.0, 38.0, 38.0, 35.0, 26.0, 31.0, 33.0, 29.0, 20.0, 20.0, 22.0, 12.0, 20.0, 12.0, 21.0, 14.0, 4.0, 5.0, 7.0, 10.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.35444450378418, -24.535263061523438, -23.716081619262695, -22.896900177001953, -22.077720642089844, -21.2585391998291, -20.43935775756836, -19.620176315307617, -18.800994873046875, -17.981813430786133, -17.16263198852539, -16.34345245361328, -15.524271011352539, -14.705089569091797, -13.885908126831055, -13.066726684570312, -12.247547149658203, -11.428365707397461, -10.609185218811035, -9.790003776550293, -8.970823287963867, -8.151641845703125, -7.332460403442383, -6.513279438018799, -5.694098472595215, -4.874917507171631, -4.055736541748047, -3.2365550994873047, -2.4173741340637207, -1.5981931686401367, -0.7790117263793945, 0.04016923904418945, 0.8593502044677734, 1.678531289100647, 2.4977123737335205, 3.3168935775756836, 4.136074542999268, 4.955255508422852, 5.774436950683594, 6.593617916107178, 7.412798881530762, 8.231980323791504, 9.05116081237793, 9.870342254638672, 10.689523696899414, 11.50870418548584, 12.327885627746582, 13.147066116333008, 13.96624755859375, 14.785429000854492, 15.604609489440918, 16.423789978027344, 17.242971420288086, 18.062152862548828, 18.88133430480957, 19.700515747070312, 20.519695281982422, 21.338876724243164, 22.158058166503906, 22.977237701416016, 23.796419143676758, 24.6156005859375, 25.434782028198242, 26.253963470458984, 27.073144912719727]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 6.0, 12.0, 17.0, 25.0, 34.0, 71.0, 82.0, 121.0, 225.0, 336.0, 531.0, 820.0, 1416.0, 2274.0, 3745.0, 6217.0, 10769.0, 18359.0, 33212.0, 59825.0, 114175.0, 225603.0, 453964.0, 789933.0, 948465.0, 714992.0, 392864.0, 195404.0, 99669.0, 52873.0, 28931.0, 16475.0, 9486.0, 5371.0, 3200.0, 1908.0, 1138.0, 700.0, 398.0, 243.0, 160.0, 91.0, 63.0, 28.0, 22.0, 19.0, 4.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.84375, -31.860107421875, -30.87646484375, -29.892822265625, -28.9091796875, -27.925537109375, -26.94189453125, -25.958251953125, -24.974609375, -23.990966796875, -23.00732421875, -22.023681640625, -21.0400390625, -20.056396484375, -19.07275390625, -18.089111328125, -17.10546875, -16.121826171875, -15.13818359375, -14.154541015625, -13.1708984375, -12.187255859375, -11.20361328125, -10.219970703125, -9.236328125, -8.252685546875, -7.26904296875, -6.285400390625, -5.3017578125, -4.318115234375, -3.33447265625, -2.350830078125, -1.3671875, -0.383544921875, 0.60009765625, 1.583740234375, 2.5673828125, 3.551025390625, 4.53466796875, 5.518310546875, 6.501953125, 7.485595703125, 8.46923828125, 9.452880859375, 10.4365234375, 11.420166015625, 12.40380859375, 13.387451171875, 14.37109375, 15.354736328125, 16.33837890625, 17.322021484375, 18.3056640625, 19.289306640625, 20.27294921875, 21.256591796875, 22.240234375, 23.223876953125, 24.20751953125, 25.191162109375, 26.1748046875, 27.158447265625, 28.14208984375, 29.125732421875, 30.109375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 8.0, 6.0, 6.0, 8.0, 8.0, 19.0, 15.0, 12.0, 12.0, 18.0, 16.0, 26.0, 35.0, 27.0, 23.0, 36.0, 34.0, 53.0, 44.0, 51.0, 48.0, 46.0, 39.0, 49.0, 31.0, 38.0, 32.0, 31.0, 35.0, 22.0, 23.0, 26.0, 17.0, 13.0, 15.0, 14.0, 22.0, 11.0, 4.0, 13.0, 4.0, 4.0, 0.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.828125, -22.114990234375, -21.40185546875, -20.688720703125, -19.9755859375, -19.262451171875, -18.54931640625, -17.836181640625, -17.123046875, -16.409912109375, -15.69677734375, -14.983642578125, -14.2705078125, -13.557373046875, -12.84423828125, -12.131103515625, -11.41796875, -10.704833984375, -9.99169921875, -9.278564453125, -8.5654296875, -7.852294921875, -7.13916015625, -6.426025390625, -5.712890625, -4.999755859375, -4.28662109375, -3.573486328125, -2.8603515625, -2.147216796875, -1.43408203125, -0.720947265625, -0.0078125, 0.705322265625, 1.41845703125, 2.131591796875, 2.8447265625, 3.557861328125, 4.27099609375, 4.984130859375, 5.697265625, 6.410400390625, 7.12353515625, 7.836669921875, 8.5498046875, 9.262939453125, 9.97607421875, 10.689208984375, 11.40234375, 12.115478515625, 12.82861328125, 13.541748046875, 14.2548828125, 14.968017578125, 15.68115234375, 16.394287109375, 17.107421875, 17.820556640625, 18.53369140625, 19.246826171875, 19.9599609375, 20.673095703125, 21.38623046875, 22.099365234375, 22.8125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 2.0, 15.0, 7.0, 11.0, 27.0, 21.0, 50.0, 66.0, 84.0, 153.0, 201.0, 332.0, 480.0, 701.0, 1046.0, 1632.0, 2616.0, 3975.0, 6402.0, 9684.0, 16181.0, 25825.0, 42442.0, 70098.0, 118415.0, 200598.0, 333587.0, 523481.0, 702865.0, 713671.0, 543660.0, 350630.0, 211338.0, 123562.0, 73826.0, 44341.0, 26840.0, 16545.0, 10393.0, 6543.0, 4195.0, 2719.0, 1749.0, 1120.0, 710.0, 504.0, 321.0, 202.0, 126.0, 103.0, 57.0, 50.0, 36.0, 10.0, 14.0, 8.0, 9.0, 8.0, 4.0, 5.0], "bins": [-29.109375, -28.228515625, -27.34765625, -26.466796875, -25.5859375, -24.705078125, -23.82421875, -22.943359375, -22.0625, -21.181640625, -20.30078125, -19.419921875, -18.5390625, -17.658203125, -16.77734375, -15.896484375, -15.015625, -14.134765625, -13.25390625, -12.373046875, -11.4921875, -10.611328125, -9.73046875, -8.849609375, -7.96875, -7.087890625, -6.20703125, -5.326171875, -4.4453125, -3.564453125, -2.68359375, -1.802734375, -0.921875, -0.041015625, 0.83984375, 1.720703125, 2.6015625, 3.482421875, 4.36328125, 5.244140625, 6.125, 7.005859375, 7.88671875, 8.767578125, 9.6484375, 10.529296875, 11.41015625, 12.291015625, 13.171875, 14.052734375, 14.93359375, 15.814453125, 16.6953125, 17.576171875, 18.45703125, 19.337890625, 20.21875, 21.099609375, 21.98046875, 22.861328125, 23.7421875, 24.623046875, 25.50390625, 26.384765625, 27.265625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 8.0, 9.0, 2.0, 10.0, 16.0, 17.0, 34.0, 40.0, 46.0, 56.0, 75.0, 96.0, 119.0, 141.0, 159.0, 178.0, 226.0, 226.0, 255.0, 278.0, 265.0, 255.0, 239.0, 213.0, 172.0, 195.0, 145.0, 127.0, 98.0, 80.0, 67.0, 46.0, 46.0, 33.0, 25.0, 23.0, 16.0, 9.0, 10.0, 6.0, 7.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.625, -12.234375, -11.84375, -11.453125, -11.0625, -10.671875, -10.28125, -9.890625, -9.5, -9.109375, -8.71875, -8.328125, -7.9375, -7.546875, -7.15625, -6.765625, -6.375, -5.984375, -5.59375, -5.203125, -4.8125, -4.421875, -4.03125, -3.640625, -3.25, -2.859375, -2.46875, -2.078125, -1.6875, -1.296875, -0.90625, -0.515625, -0.125, 0.265625, 0.65625, 1.046875, 1.4375, 1.828125, 2.21875, 2.609375, 3.0, 3.390625, 3.78125, 4.171875, 4.5625, 4.953125, 5.34375, 5.734375, 6.125, 6.515625, 6.90625, 7.296875, 7.6875, 8.078125, 8.46875, 8.859375, 9.25, 9.640625, 10.03125, 10.421875, 10.8125, 11.203125, 11.59375, 11.984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 4.0, 6.0, 6.0, 7.0, 3.0, 7.0, 7.0, 6.0, 10.0, 19.0, 12.0, 27.0, 30.0, 29.0, 30.0, 36.0, 43.0, 40.0, 55.0, 45.0, 44.0, 52.0, 47.0, 42.0, 46.0, 38.0, 48.0, 42.0, 34.0, 26.0, 25.0, 34.0, 21.0, 9.0, 8.0, 14.0, 9.0, 10.0, 5.0, 9.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-33.33519744873047, -32.44449996948242, -31.553802490234375, -30.663105010986328, -29.77240753173828, -28.881710052490234, -27.991012573242188, -27.10031509399414, -26.209617614746094, -25.318920135498047, -24.42822265625, -23.537525177001953, -22.646827697753906, -21.75613021850586, -20.865432739257812, -19.974735260009766, -19.08403778076172, -18.193340301513672, -17.302642822265625, -16.411945343017578, -15.521247863769531, -14.630550384521484, -13.739852905273438, -12.84915542602539, -11.958457946777344, -11.067760467529297, -10.17706298828125, -9.286365509033203, -8.395668029785156, -7.504970550537109, -6.6142730712890625, -5.723575592041016, -4.832878112792969, -3.942180633544922, -3.051483154296875, -2.160785675048828, -1.2700881958007812, -0.3793907165527344, 0.5113067626953125, 1.4020042419433594, 2.2927017211914062, 3.183399200439453, 4.0740966796875, 4.964794158935547, 5.855491638183594, 6.746189117431641, 7.6368865966796875, 8.527584075927734, 9.418281555175781, 10.308979034423828, 11.199676513671875, 12.090373992919922, 12.981071472167969, 13.871768951416016, 14.762466430664062, 15.65316390991211, 16.543861389160156, 17.434558868408203, 18.32525634765625, 19.215953826904297, 20.106651306152344, 20.99734878540039, 21.888046264648438, 22.778743743896484, 23.66944122314453]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 9.0, 8.0, 8.0, 12.0, 11.0, 16.0, 9.0, 17.0, 22.0, 17.0, 21.0, 29.0, 37.0, 29.0, 28.0, 31.0, 48.0, 40.0, 30.0, 34.0, 43.0, 41.0, 47.0, 29.0, 34.0, 40.0, 32.0, 20.0, 29.0, 23.0, 25.0, 24.0, 24.0, 17.0, 20.0, 9.0, 18.0, 10.0, 8.0, 4.0, 11.0, 8.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.274375915527344, -22.53460121154785, -21.794824600219727, -21.055049896240234, -20.315275192260742, -19.57550048828125, -18.835723876953125, -18.095949172973633, -17.35617446899414, -16.61639976501465, -15.87662410736084, -15.136848449707031, -14.397073745727539, -13.65729808807373, -12.917522430419922, -12.17774772644043, -11.437971115112305, -10.698195457458496, -9.958420753479004, -9.218645095825195, -8.478870391845703, -7.7390947341918945, -6.999319076538086, -6.2595438957214355, -5.519768714904785, -4.779993534088135, -4.040218353271484, -3.300442695617676, -2.5606675148010254, -1.820892333984375, -1.0811166763305664, -0.341341495513916, 0.3984336853027344, 1.1382089853286743, 1.8779842853546143, 2.6177597045898438, 3.357534885406494, 4.0973100662231445, 4.837085723876953, 5.5768609046936035, 6.316636085510254, 7.056411266326904, 7.796186447143555, 8.535962104797363, 9.275737762451172, 10.015512466430664, 10.755288124084473, 11.495063781738281, 12.234838485717773, 12.974614143371582, 13.714388847351074, 14.454164505004883, 15.193939208984375, 15.933714866638184, 16.673490524291992, 17.413265228271484, 18.15304183959961, 18.8928165435791, 19.632593154907227, 20.37236785888672, 21.11214256286621, 21.851917266845703, 22.591693878173828, 23.33146858215332, 24.071243286132812]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 10.0, 19.0, 11.0, 25.0, 51.0, 68.0, 101.0, 177.0, 273.0, 400.0, 618.0, 1016.0, 1601.0, 2580.0, 4141.0, 6637.0, 10542.0, 17087.0, 27272.0, 43356.0, 67980.0, 102120.0, 138992.0, 159713.0, 146857.0, 111537.0, 75244.0, 48654.0, 30487.0, 19077.0, 12001.0, 7464.0, 4709.0, 2797.0, 1831.0, 1121.0, 727.0, 445.0, 288.0, 199.0, 119.0, 70.0, 47.0, 28.0, 29.0, 20.0, 7.0, 9.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.7674560546875, -10.363037109375, -9.9586181640625, -9.55419921875, -9.1497802734375, -8.745361328125, -8.3409423828125, -7.9365234375, -7.5321044921875, -7.127685546875, -6.7232666015625, -6.31884765625, -5.9144287109375, -5.510009765625, -5.1055908203125, -4.701171875, -4.2967529296875, -3.892333984375, -3.4879150390625, -3.08349609375, -2.6790771484375, -2.274658203125, -1.8702392578125, -1.4658203125, -1.0614013671875, -0.656982421875, -0.2525634765625, 0.15185546875, 0.5562744140625, 0.960693359375, 1.3651123046875, 1.76953125, 2.1739501953125, 2.578369140625, 2.9827880859375, 3.38720703125, 3.7916259765625, 4.196044921875, 4.6004638671875, 5.0048828125, 5.4093017578125, 5.813720703125, 6.2181396484375, 6.62255859375, 7.0269775390625, 7.431396484375, 7.8358154296875, 8.240234375, 8.6446533203125, 9.049072265625, 9.4534912109375, 9.85791015625, 10.2623291015625, 10.666748046875, 11.0711669921875, 11.4755859375, 11.8800048828125, 12.284423828125, 12.6888427734375, 13.09326171875, 13.4976806640625, 13.902099609375, 14.3065185546875, 14.7109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 10.0, 10.0, 9.0, 5.0, 12.0, 13.0, 8.0, 12.0, 25.0, 26.0, 24.0, 27.0, 25.0, 29.0, 40.0, 40.0, 39.0, 38.0, 36.0, 42.0, 41.0, 41.0, 42.0, 35.0, 45.0, 35.0, 40.0, 21.0, 23.0, 32.0, 28.0, 21.0, 19.0, 21.0, 8.0, 10.0, 13.0, 10.0, 9.0, 13.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0], "bins": [-29.71875, -28.905029296875, -28.09130859375, -27.277587890625, -26.4638671875, -25.650146484375, -24.83642578125, -24.022705078125, -23.208984375, -22.395263671875, -21.58154296875, -20.767822265625, -19.9541015625, -19.140380859375, -18.32666015625, -17.512939453125, -16.69921875, -15.885498046875, -15.07177734375, -14.258056640625, -13.4443359375, -12.630615234375, -11.81689453125, -11.003173828125, -10.189453125, -9.375732421875, -8.56201171875, -7.748291015625, -6.9345703125, -6.120849609375, -5.30712890625, -4.493408203125, -3.6796875, -2.865966796875, -2.05224609375, -1.238525390625, -0.4248046875, 0.388916015625, 1.20263671875, 2.016357421875, 2.830078125, 3.643798828125, 4.45751953125, 5.271240234375, 6.0849609375, 6.898681640625, 7.71240234375, 8.526123046875, 9.33984375, 10.153564453125, 10.96728515625, 11.781005859375, 12.5947265625, 13.408447265625, 14.22216796875, 15.035888671875, 15.849609375, 16.663330078125, 17.47705078125, 18.290771484375, 19.1044921875, 19.918212890625, 20.73193359375, 21.545654296875, 22.359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 9.0, 8.0, 13.0, 14.0, 20.0, 45.0, 49.0, 64.0, 93.0, 171.0, 248.0, 328.0, 541.0, 827.0, 1294.0, 1997.0, 3181.0, 5215.0, 8431.0, 14443.0, 24424.0, 41279.0, 71432.0, 116887.0, 171987.0, 192564.0, 152674.0, 97504.0, 58389.0, 34047.0, 19883.0, 11770.0, 7115.0, 4221.0, 2651.0, 1650.0, 1047.0, 719.0, 445.0, 295.0, 180.0, 118.0, 84.0, 56.0, 45.0, 37.0, 20.0, 18.0, 12.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-16.984375, -16.458740234375, -15.93310546875, -15.407470703125, -14.8818359375, -14.356201171875, -13.83056640625, -13.304931640625, -12.779296875, -12.253662109375, -11.72802734375, -11.202392578125, -10.6767578125, -10.151123046875, -9.62548828125, -9.099853515625, -8.57421875, -8.048583984375, -7.52294921875, -6.997314453125, -6.4716796875, -5.946044921875, -5.42041015625, -4.894775390625, -4.369140625, -3.843505859375, -3.31787109375, -2.792236328125, -2.2666015625, -1.740966796875, -1.21533203125, -0.689697265625, -0.1640625, 0.361572265625, 0.88720703125, 1.412841796875, 1.9384765625, 2.464111328125, 2.98974609375, 3.515380859375, 4.041015625, 4.566650390625, 5.09228515625, 5.617919921875, 6.1435546875, 6.669189453125, 7.19482421875, 7.720458984375, 8.24609375, 8.771728515625, 9.29736328125, 9.822998046875, 10.3486328125, 10.874267578125, 11.39990234375, 11.925537109375, 12.451171875, 12.976806640625, 13.50244140625, 14.028076171875, 14.5537109375, 15.079345703125, 15.60498046875, 16.130615234375, 16.65625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 3.0, 8.0, 5.0, 7.0, 5.0, 11.0, 15.0, 12.0, 16.0, 19.0, 20.0, 17.0, 17.0, 28.0, 37.0, 42.0, 32.0, 30.0, 36.0, 27.0, 42.0, 38.0, 40.0, 41.0, 58.0, 34.0, 44.0, 34.0, 42.0, 24.0, 35.0, 29.0, 18.0, 15.0, 18.0, 21.0, 11.0, 12.0, 14.0, 10.0, 6.0, 5.0, 7.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.90625, -16.3946533203125, -15.883056640625, -15.3714599609375, -14.85986328125, -14.3482666015625, -13.836669921875, -13.3250732421875, -12.8134765625, -12.3018798828125, -11.790283203125, -11.2786865234375, -10.76708984375, -10.2554931640625, -9.743896484375, -9.2322998046875, -8.720703125, -8.2091064453125, -7.697509765625, -7.1859130859375, -6.67431640625, -6.1627197265625, -5.651123046875, -5.1395263671875, -4.6279296875, -4.1163330078125, -3.604736328125, -3.0931396484375, -2.58154296875, -2.0699462890625, -1.558349609375, -1.0467529296875, -0.53515625, -0.0235595703125, 0.488037109375, 0.9996337890625, 1.51123046875, 2.0228271484375, 2.534423828125, 3.0460205078125, 3.5576171875, 4.0692138671875, 4.580810546875, 5.0924072265625, 5.60400390625, 6.1156005859375, 6.627197265625, 7.1387939453125, 7.650390625, 8.1619873046875, 8.673583984375, 9.1851806640625, 9.69677734375, 10.2083740234375, 10.719970703125, 11.2315673828125, 11.7431640625, 12.2547607421875, 12.766357421875, 13.2779541015625, 13.78955078125, 14.3011474609375, 14.812744140625, 15.3243408203125, 15.8359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 13.0, 19.0, 25.0, 28.0, 71.0, 92.0, 120.0, 211.0, 333.0, 516.0, 844.0, 1394.0, 2418.0, 4168.0, 8059.0, 15101.0, 29692.0, 62501.0, 130676.0, 240026.0, 256506.0, 150569.0, 72337.0, 35051.0, 17347.0, 8973.0, 4712.0, 2603.0, 1615.0, 1001.0, 551.0, 375.0, 224.0, 130.0, 85.0, 62.0, 29.0, 23.0, 17.0, 14.0, 10.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.31640625, -7.10186767578125, -6.8873291015625, -6.67279052734375, -6.458251953125, -6.24371337890625, -6.0291748046875, -5.81463623046875, -5.60009765625, -5.38555908203125, -5.1710205078125, -4.95648193359375, -4.741943359375, -4.52740478515625, -4.3128662109375, -4.09832763671875, -3.8837890625, -3.66925048828125, -3.4547119140625, -3.24017333984375, -3.025634765625, -2.81109619140625, -2.5965576171875, -2.38201904296875, -2.16748046875, -1.95294189453125, -1.7384033203125, -1.52386474609375, -1.309326171875, -1.09478759765625, -0.8802490234375, -0.66571044921875, -0.451171875, -0.23663330078125, -0.0220947265625, 0.19244384765625, 0.406982421875, 0.62152099609375, 0.8360595703125, 1.05059814453125, 1.26513671875, 1.47967529296875, 1.6942138671875, 1.90875244140625, 2.123291015625, 2.33782958984375, 2.5523681640625, 2.76690673828125, 2.9814453125, 3.19598388671875, 3.4105224609375, 3.62506103515625, 3.839599609375, 4.05413818359375, 4.2686767578125, 4.48321533203125, 4.69775390625, 4.91229248046875, 5.1268310546875, 5.34136962890625, 5.555908203125, 5.77044677734375, 5.9849853515625, 6.19952392578125, 6.4140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 3.0, 4.0, 12.0, 11.0, 10.0, 15.0, 16.0, 21.0, 21.0, 28.0, 46.0, 48.0, 47.0, 61.0, 57.0, 54.0, 67.0, 68.0, 56.0, 51.0, 59.0, 45.0, 36.0, 37.0, 31.0, 15.0, 17.0, 9.0, 12.0, 8.0, 7.0, 8.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0006165504455566406, -0.0006001628935337067, -0.0005837753415107727, -0.0005673877894878387, -0.0005510002374649048, -0.0005346126854419708, -0.0005182251334190369, -0.0005018375813961029, -0.00048545002937316895, -0.000469062477350235, -0.000452674925327301, -0.00043628737330436707, -0.0004198998212814331, -0.00040351226925849915, -0.0003871247172355652, -0.0003707371652126312, -0.00035434961318969727, -0.0003379620611667633, -0.00032157450914382935, -0.0003051869571208954, -0.0002887994050979614, -0.00027241185307502747, -0.0002560243010520935, -0.00023963674902915955, -0.00022324919700622559, -0.00020686164498329163, -0.00019047409296035767, -0.0001740865409374237, -0.00015769898891448975, -0.00014131143689155579, -0.00012492388486862183, -0.00010853633284568787, -9.21487808227539e-05, -7.576122879981995e-05, -5.9373676776885986e-05, -4.2986124753952026e-05, -2.6598572731018066e-05, -1.0211020708084106e-05, 6.1765313148498535e-06, 2.2564083337783813e-05, 3.8951635360717773e-05, 5.5339187383651733e-05, 7.17267394065857e-05, 8.811429142951965e-05, 0.00010450184345245361, 0.00012088939547538757, 0.00013727694749832153, 0.0001536644995212555, 0.00017005205154418945, 0.0001864396035671234, 0.00020282715559005737, 0.00021921470761299133, 0.0002356022596359253, 0.00025198981165885925, 0.0002683773636817932, 0.00028476491570472717, 0.00030115246772766113, 0.0003175400197505951, 0.00033392757177352905, 0.000350315123796463, 0.00036670267581939697, 0.00038309022784233093, 0.0003994777798652649, 0.00041586533188819885, 0.0004322528839111328]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 6.0, 7.0, 7.0, 13.0, 27.0, 34.0, 48.0, 83.0, 140.0, 203.0, 334.0, 481.0, 769.0, 1213.0, 2042.0, 3150.0, 5270.0, 8754.0, 15216.0, 26394.0, 48525.0, 87760.0, 150156.0, 206534.0, 194142.0, 129848.0, 73299.0, 39640.0, 22172.0, 12744.0, 7445.0, 4576.0, 2856.0, 1675.0, 1104.0, 697.0, 418.0, 290.0, 170.0, 128.0, 66.0, 44.0, 34.0, 18.0, 8.0, 4.0, 10.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.91796875, -5.7054443359375, -5.492919921875, -5.2803955078125, -5.06787109375, -4.8553466796875, -4.642822265625, -4.4302978515625, -4.2177734375, -4.0052490234375, -3.792724609375, -3.5802001953125, -3.36767578125, -3.1551513671875, -2.942626953125, -2.7301025390625, -2.517578125, -2.3050537109375, -2.092529296875, -1.8800048828125, -1.66748046875, -1.4549560546875, -1.242431640625, -1.0299072265625, -0.8173828125, -0.6048583984375, -0.392333984375, -0.1798095703125, 0.03271484375, 0.2452392578125, 0.457763671875, 0.6702880859375, 0.8828125, 1.0953369140625, 1.307861328125, 1.5203857421875, 1.73291015625, 1.9454345703125, 2.157958984375, 2.3704833984375, 2.5830078125, 2.7955322265625, 3.008056640625, 3.2205810546875, 3.43310546875, 3.6456298828125, 3.858154296875, 4.0706787109375, 4.283203125, 4.4957275390625, 4.708251953125, 4.9207763671875, 5.13330078125, 5.3458251953125, 5.558349609375, 5.7708740234375, 5.9833984375, 6.1959228515625, 6.408447265625, 6.6209716796875, 6.83349609375, 7.0460205078125, 7.258544921875, 7.4710693359375, 7.68359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 3.0, 5.0, 7.0, 11.0, 7.0, 8.0, 14.0, 14.0, 25.0, 28.0, 27.0, 26.0, 36.0, 52.0, 48.0, 47.0, 52.0, 53.0, 55.0, 58.0, 51.0, 51.0, 53.0, 39.0, 27.0, 41.0, 37.0, 26.0, 14.0, 28.0, 8.0, 5.0, 8.0, 6.0, 4.0, 6.0, 5.0, 2.0, 4.0, 0.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.296875, -2.2323150634765625, -2.167755126953125, -2.1031951904296875, -2.03863525390625, -1.9740753173828125, -1.909515380859375, -1.8449554443359375, -1.7803955078125, -1.7158355712890625, -1.651275634765625, -1.5867156982421875, -1.52215576171875, -1.4575958251953125, -1.393035888671875, -1.3284759521484375, -1.263916015625, -1.1993560791015625, -1.134796142578125, -1.0702362060546875, -1.00567626953125, -0.9411163330078125, -0.876556396484375, -0.8119964599609375, -0.7474365234375, -0.6828765869140625, -0.618316650390625, -0.5537567138671875, -0.48919677734375, -0.4246368408203125, -0.360076904296875, -0.2955169677734375, -0.23095703125, -0.1663970947265625, -0.101837158203125, -0.0372772216796875, 0.02728271484375, 0.0918426513671875, 0.156402587890625, 0.2209625244140625, 0.2855224609375, 0.3500823974609375, 0.414642333984375, 0.4792022705078125, 0.54376220703125, 0.6083221435546875, 0.672882080078125, 0.7374420166015625, 0.802001953125, 0.8665618896484375, 0.931121826171875, 0.9956817626953125, 1.06024169921875, 1.1248016357421875, 1.189361572265625, 1.2539215087890625, 1.3184814453125, 1.3830413818359375, 1.447601318359375, 1.5121612548828125, 1.57672119140625, 1.6412811279296875, 1.705841064453125, 1.7704010009765625, 1.8349609375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 4.0, 5.0, 4.0, 5.0, 5.0, 5.0, 5.0, 7.0, 9.0, 9.0, 17.0, 15.0, 16.0, 29.0, 32.0, 46.0, 29.0, 33.0, 37.0, 48.0, 44.0, 47.0, 51.0, 40.0, 36.0, 48.0, 44.0, 37.0, 50.0, 42.0, 38.0, 17.0, 23.0, 22.0, 15.0, 19.0, 10.0, 10.0, 15.0, 5.0, 4.0, 7.0, 5.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-30.283309936523438, -29.434499740600586, -28.5856876373291, -27.73687744140625, -26.8880672454834, -26.039255142211914, -25.190444946289062, -24.341632843017578, -23.492822647094727, -22.644012451171875, -21.79520034790039, -20.94639015197754, -20.097579956054688, -19.248767852783203, -18.39995765686035, -17.5511474609375, -16.702335357666016, -15.853524208068848, -15.004714012145996, -14.155902862548828, -13.30709171295166, -12.458280563354492, -11.60947036743164, -10.760659217834473, -9.911849975585938, -9.06303882598877, -8.214228630065918, -7.36541748046875, -6.516606330871582, -5.667795658111572, -4.8189849853515625, -3.9701738357543945, -3.1213626861572266, -2.2725517749786377, -1.4237409830093384, -0.5749301910400391, 0.2738807201385498, 1.1226916313171387, 1.9715023040771484, 2.8203134536743164, 3.669124126434326, 4.517934799194336, 5.366745948791504, 6.215556621551514, 7.064367294311523, 7.913178443908691, 8.76198959350586, 9.610799789428711, 10.459610939025879, 11.308422088623047, 12.157232284545898, 13.006043434143066, 13.854854583740234, 14.703664779663086, 15.552475929260254, 16.401287078857422, 17.250097274780273, 18.098907470703125, 18.94771957397461, 19.79652976989746, 20.645339965820312, 21.494152069091797, 22.34296226501465, 23.1917724609375, 24.040584564208984]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 9.0, 9.0, 9.0, 14.0, 14.0, 9.0, 16.0, 17.0, 24.0, 23.0, 22.0, 36.0, 33.0, 28.0, 30.0, 48.0, 34.0, 37.0, 36.0, 38.0, 47.0, 49.0, 33.0, 33.0, 37.0, 28.0, 28.0, 25.0, 22.0, 25.0, 29.0, 21.0, 20.0, 15.0, 8.0, 18.0, 8.0, 11.0, 8.0, 10.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.505081176757812, -22.764629364013672, -22.02417755126953, -21.28372573852539, -20.54327392578125, -19.80282211303711, -19.06237030029297, -18.321916580200195, -17.581464767456055, -16.841012954711914, -16.100561141967773, -15.360109329223633, -14.619656562805176, -13.879204750061035, -13.138752937316895, -12.398300170898438, -11.657849311828613, -10.917397499084473, -10.176945686340332, -9.436492919921875, -8.696041107177734, -7.955589294433594, -7.215137481689453, -6.474685192108154, -5.734233379364014, -4.993781566619873, -4.253329277038574, -3.5128774642944336, -2.772425413131714, -2.031973361968994, -1.2915215492248535, -0.5510692596435547, 0.18938255310058594, 0.9298345446586609, 1.6702865362167358, 2.410738468170166, 3.1511905193328857, 3.8916425704956055, 4.632094383239746, 5.372546672821045, 6.1129984855651855, 6.853450298309326, 7.593902587890625, 8.334354400634766, 9.074806213378906, 9.815258026123047, 10.555709838867188, 11.296162605285645, 12.036614418029785, 12.777066230773926, 13.517518043518066, 14.257970809936523, 14.998422622680664, 15.738874435424805, 16.479326248168945, 17.219778060913086, 17.960229873657227, 18.700681686401367, 19.441133499145508, 20.18158531188965, 20.92203712463379, 21.662490844726562, 22.402942657470703, 23.143394470214844, 23.883846282958984]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 8.0, 7.0, 14.0, 17.0, 35.0, 75.0, 89.0, 165.0, 197.0, 314.0, 562.0, 781.0, 1269.0, 1949.0, 3098.0, 4678.0, 7389.0, 11126.0, 17075.0, 25770.0, 38388.0, 55518.0, 76083.0, 99117.0, 118152.0, 125218.0, 117204.0, 98708.0, 76438.0, 55907.0, 38621.0, 25850.0, 17051.0, 11317.0, 7237.0, 4770.0, 2993.0, 1907.0, 1256.0, 831.0, 511.0, 307.0, 217.0, 107.0, 91.0, 46.0, 32.0, 25.0, 21.0, 8.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.71875, -21.029296875, -20.33984375, -19.650390625, -18.9609375, -18.271484375, -17.58203125, -16.892578125, -16.203125, -15.513671875, -14.82421875, -14.134765625, -13.4453125, -12.755859375, -12.06640625, -11.376953125, -10.6875, -9.998046875, -9.30859375, -8.619140625, -7.9296875, -7.240234375, -6.55078125, -5.861328125, -5.171875, -4.482421875, -3.79296875, -3.103515625, -2.4140625, -1.724609375, -1.03515625, -0.345703125, 0.34375, 1.033203125, 1.72265625, 2.412109375, 3.1015625, 3.791015625, 4.48046875, 5.169921875, 5.859375, 6.548828125, 7.23828125, 7.927734375, 8.6171875, 9.306640625, 9.99609375, 10.685546875, 11.375, 12.064453125, 12.75390625, 13.443359375, 14.1328125, 14.822265625, 15.51171875, 16.201171875, 16.890625, 17.580078125, 18.26953125, 18.958984375, 19.6484375, 20.337890625, 21.02734375, 21.716796875, 22.40625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 7.0, 7.0, 8.0, 10.0, 12.0, 13.0, 6.0, 18.0, 19.0, 18.0, 17.0, 29.0, 18.0, 33.0, 29.0, 29.0, 30.0, 40.0, 37.0, 54.0, 48.0, 37.0, 35.0, 41.0, 46.0, 31.0, 27.0, 25.0, 33.0, 38.0, 35.0, 24.0, 24.0, 18.0, 13.0, 13.0, 19.0, 9.0, 8.0, 5.0, 11.0, 7.0, 4.0, 5.0, 4.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.75, -23.971435546875, -23.19287109375, -22.414306640625, -21.6357421875, -20.857177734375, -20.07861328125, -19.300048828125, -18.521484375, -17.742919921875, -16.96435546875, -16.185791015625, -15.4072265625, -14.628662109375, -13.85009765625, -13.071533203125, -12.29296875, -11.514404296875, -10.73583984375, -9.957275390625, -9.1787109375, -8.400146484375, -7.62158203125, -6.843017578125, -6.064453125, -5.285888671875, -4.50732421875, -3.728759765625, -2.9501953125, -2.171630859375, -1.39306640625, -0.614501953125, 0.1640625, 0.942626953125, 1.72119140625, 2.499755859375, 3.2783203125, 4.056884765625, 4.83544921875, 5.614013671875, 6.392578125, 7.171142578125, 7.94970703125, 8.728271484375, 9.5068359375, 10.285400390625, 11.06396484375, 11.842529296875, 12.62109375, 13.399658203125, 14.17822265625, 14.956787109375, 15.7353515625, 16.513916015625, 17.29248046875, 18.071044921875, 18.849609375, 19.628173828125, 20.40673828125, 21.185302734375, 21.9638671875, 22.742431640625, 23.52099609375, 24.299560546875, 25.078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 6.0, 28.0, 25.0, 50.0, 58.0, 133.0, 171.0, 244.0, 407.0, 581.0, 955.0, 1365.0, 2157.0, 3447.0, 5215.0, 8039.0, 12681.0, 19462.0, 29628.0, 44375.0, 63620.0, 87563.0, 110439.0, 126369.0, 127265.0, 113232.0, 89830.0, 66389.0, 46456.0, 30855.0, 20357.0, 13135.0, 8460.0, 5598.0, 3647.0, 2113.0, 1499.0, 955.0, 624.0, 367.0, 259.0, 178.0, 105.0, 68.0, 45.0, 41.0, 22.0, 14.0, 7.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-23.40625, -22.676025390625, -21.94580078125, -21.215576171875, -20.4853515625, -19.755126953125, -19.02490234375, -18.294677734375, -17.564453125, -16.834228515625, -16.10400390625, -15.373779296875, -14.6435546875, -13.913330078125, -13.18310546875, -12.452880859375, -11.72265625, -10.992431640625, -10.26220703125, -9.531982421875, -8.8017578125, -8.071533203125, -7.34130859375, -6.611083984375, -5.880859375, -5.150634765625, -4.42041015625, -3.690185546875, -2.9599609375, -2.229736328125, -1.49951171875, -0.769287109375, -0.0390625, 0.691162109375, 1.42138671875, 2.151611328125, 2.8818359375, 3.612060546875, 4.34228515625, 5.072509765625, 5.802734375, 6.532958984375, 7.26318359375, 7.993408203125, 8.7236328125, 9.453857421875, 10.18408203125, 10.914306640625, 11.64453125, 12.374755859375, 13.10498046875, 13.835205078125, 14.5654296875, 15.295654296875, 16.02587890625, 16.756103515625, 17.486328125, 18.216552734375, 18.94677734375, 19.677001953125, 20.4072265625, 21.137451171875, 21.86767578125, 22.597900390625, 23.328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 7.0, 8.0, 3.0, 16.0, 16.0, 18.0, 16.0, 22.0, 22.0, 25.0, 38.0, 29.0, 46.0, 26.0, 44.0, 40.0, 48.0, 48.0, 39.0, 38.0, 48.0, 40.0, 34.0, 36.0, 32.0, 29.0, 27.0, 32.0, 35.0, 27.0, 14.0, 19.0, 10.0, 14.0, 8.0, 13.0, 9.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.359375, -14.8349609375, -14.310546875, -13.7861328125, -13.26171875, -12.7373046875, -12.212890625, -11.6884765625, -11.1640625, -10.6396484375, -10.115234375, -9.5908203125, -9.06640625, -8.5419921875, -8.017578125, -7.4931640625, -6.96875, -6.4443359375, -5.919921875, -5.3955078125, -4.87109375, -4.3466796875, -3.822265625, -3.2978515625, -2.7734375, -2.2490234375, -1.724609375, -1.2001953125, -0.67578125, -0.1513671875, 0.373046875, 0.8974609375, 1.421875, 1.9462890625, 2.470703125, 2.9951171875, 3.51953125, 4.0439453125, 4.568359375, 5.0927734375, 5.6171875, 6.1416015625, 6.666015625, 7.1904296875, 7.71484375, 8.2392578125, 8.763671875, 9.2880859375, 9.8125, 10.3369140625, 10.861328125, 11.3857421875, 11.91015625, 12.4345703125, 12.958984375, 13.4833984375, 14.0078125, 14.5322265625, 15.056640625, 15.5810546875, 16.10546875, 16.6298828125, 17.154296875, 17.6787109375, 18.203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 5.0, 3.0, 9.0, 18.0, 19.0, 22.0, 50.0, 44.0, 73.0, 105.0, 160.0, 235.0, 336.0, 469.0, 669.0, 1001.0, 1500.0, 2508.0, 4193.0, 7597.0, 15223.0, 31920.0, 71926.0, 149806.0, 242106.0, 238305.0, 146105.0, 69274.0, 31545.0, 14793.0, 7393.0, 4150.0, 2362.0, 1490.0, 1010.0, 673.0, 416.0, 324.0, 211.0, 152.0, 92.0, 80.0, 67.0, 33.0, 31.0, 14.0, 14.0, 10.0, 5.0, 4.0, 3.0, 1.0, 3.0, 6.0], "bins": [-17.65625, -17.1514892578125, -16.646728515625, -16.1419677734375, -15.63720703125, -15.1324462890625, -14.627685546875, -14.1229248046875, -13.6181640625, -13.1134033203125, -12.608642578125, -12.1038818359375, -11.59912109375, -11.0943603515625, -10.589599609375, -10.0848388671875, -9.580078125, -9.0753173828125, -8.570556640625, -8.0657958984375, -7.56103515625, -7.0562744140625, -6.551513671875, -6.0467529296875, -5.5419921875, -5.0372314453125, -4.532470703125, -4.0277099609375, -3.52294921875, -3.0181884765625, -2.513427734375, -2.0086669921875, -1.50390625, -0.9991455078125, -0.494384765625, 0.0103759765625, 0.51513671875, 1.0198974609375, 1.524658203125, 2.0294189453125, 2.5341796875, 3.0389404296875, 3.543701171875, 4.0484619140625, 4.55322265625, 5.0579833984375, 5.562744140625, 6.0675048828125, 6.572265625, 7.0770263671875, 7.581787109375, 8.0865478515625, 8.59130859375, 9.0960693359375, 9.600830078125, 10.1055908203125, 10.6103515625, 11.1151123046875, 11.619873046875, 12.1246337890625, 12.62939453125, 13.1341552734375, 13.638916015625, 14.1436767578125, 14.6484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 10.0, 4.0, 9.0, 8.0, 21.0, 38.0, 51.0, 49.0, 72.0, 77.0, 108.0, 108.0, 95.0, 89.0, 73.0, 52.0, 33.0, 27.0, 17.0, 19.0, 10.0, 3.0, 9.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002086639404296875, -0.0020223259925842285, -0.001958012580871582, -0.0018936991691589355, -0.001829385757446289, -0.0017650723457336426, -0.001700758934020996, -0.0016364455223083496, -0.0015721321105957031, -0.0015078186988830566, -0.0014435052871704102, -0.0013791918754577637, -0.0013148784637451172, -0.0012505650520324707, -0.0011862516403198242, -0.0011219382286071777, -0.0010576248168945312, -0.0009933114051818848, -0.0009289979934692383, -0.0008646845817565918, -0.0008003711700439453, -0.0007360577583312988, -0.0006717443466186523, -0.0006074309349060059, -0.0005431175231933594, -0.0004788041114807129, -0.0004144906997680664, -0.0003501772880554199, -0.00028586387634277344, -0.00022155046463012695, -0.00015723705291748047, -9.292364120483398e-05, -2.86102294921875e-05, 3.5703182220458984e-05, 0.00010001659393310547, 0.00016433000564575195, 0.00022864341735839844, 0.0002929568290710449, 0.0003572702407836914, 0.0004215836524963379, 0.0004858970642089844, 0.0005502104759216309, 0.0006145238876342773, 0.0006788372993469238, 0.0007431507110595703, 0.0008074641227722168, 0.0008717775344848633, 0.0009360909461975098, 0.0010004043579101562, 0.0010647177696228027, 0.0011290311813354492, 0.0011933445930480957, 0.0012576580047607422, 0.0013219714164733887, 0.0013862848281860352, 0.0014505982398986816, 0.0015149116516113281, 0.0015792250633239746, 0.001643538475036621, 0.0017078518867492676, 0.001772165298461914, 0.0018364787101745605, 0.001900792121887207, 0.0019651055335998535, 0.0020294189453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 6.0, 10.0, 7.0, 13.0, 17.0, 29.0, 30.0, 41.0, 63.0, 112.0, 143.0, 176.0, 252.0, 374.0, 520.0, 809.0, 1229.0, 1995.0, 3305.0, 5887.0, 11133.0, 22627.0, 48383.0, 102751.0, 190985.0, 248802.0, 198567.0, 108388.0, 50934.0, 23922.0, 11579.0, 5986.0, 3456.0, 2031.0, 1239.0, 804.0, 541.0, 404.0, 288.0, 200.0, 135.0, 128.0, 85.0, 44.0, 36.0, 23.0, 23.0, 11.0, 8.0, 5.0, 5.0, 8.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -15.931396484375, -15.40966796875, -14.887939453125, -14.3662109375, -13.844482421875, -13.32275390625, -12.801025390625, -12.279296875, -11.757568359375, -11.23583984375, -10.714111328125, -10.1923828125, -9.670654296875, -9.14892578125, -8.627197265625, -8.10546875, -7.583740234375, -7.06201171875, -6.540283203125, -6.0185546875, -5.496826171875, -4.97509765625, -4.453369140625, -3.931640625, -3.409912109375, -2.88818359375, -2.366455078125, -1.8447265625, -1.322998046875, -0.80126953125, -0.279541015625, 0.2421875, 0.763916015625, 1.28564453125, 1.807373046875, 2.3291015625, 2.850830078125, 3.37255859375, 3.894287109375, 4.416015625, 4.937744140625, 5.45947265625, 5.981201171875, 6.5029296875, 7.024658203125, 7.54638671875, 8.068115234375, 8.58984375, 9.111572265625, 9.63330078125, 10.155029296875, 10.6767578125, 11.198486328125, 11.72021484375, 12.241943359375, 12.763671875, 13.285400390625, 13.80712890625, 14.328857421875, 14.8505859375, 15.372314453125, 15.89404296875, 16.415771484375, 16.9375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 12.0, 13.0, 23.0, 18.0, 38.0, 25.0, 53.0, 47.0, 79.0, 69.0, 81.0, 79.0, 82.0, 79.0, 58.0, 40.0, 46.0, 30.0, 23.0, 15.0, 18.0, 8.0, 12.0, 3.0, 5.0, 9.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.2109375, -6.99395751953125, -6.7769775390625, -6.55999755859375, -6.343017578125, -6.12603759765625, -5.9090576171875, -5.69207763671875, -5.47509765625, -5.25811767578125, -5.0411376953125, -4.82415771484375, -4.607177734375, -4.39019775390625, -4.1732177734375, -3.95623779296875, -3.7392578125, -3.52227783203125, -3.3052978515625, -3.08831787109375, -2.871337890625, -2.65435791015625, -2.4373779296875, -2.22039794921875, -2.00341796875, -1.78643798828125, -1.5694580078125, -1.35247802734375, -1.135498046875, -0.91851806640625, -0.7015380859375, -0.48455810546875, -0.267578125, -0.05059814453125, 0.1663818359375, 0.38336181640625, 0.600341796875, 0.81732177734375, 1.0343017578125, 1.25128173828125, 1.46826171875, 1.68524169921875, 1.9022216796875, 2.11920166015625, 2.336181640625, 2.55316162109375, 2.7701416015625, 2.98712158203125, 3.2041015625, 3.42108154296875, 3.6380615234375, 3.85504150390625, 4.072021484375, 4.28900146484375, 4.5059814453125, 4.72296142578125, 4.93994140625, 5.15692138671875, 5.3739013671875, 5.59088134765625, 5.807861328125, 6.02484130859375, 6.2418212890625, 6.45880126953125, 6.67578125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 3.0, 8.0, 8.0, 9.0, 12.0, 18.0, 16.0, 21.0, 18.0, 32.0, 35.0, 24.0, 38.0, 42.0, 42.0, 41.0, 43.0, 44.0, 57.0, 48.0, 44.0, 43.0, 37.0, 35.0, 32.0, 35.0, 36.0, 22.0, 17.0, 20.0, 22.0, 14.0, 11.0, 7.0, 7.0, 5.0, 6.0, 2.0, 6.0, 4.0, 1.0, 3.0, 3.0, 5.0, 2.0, 2.0], "bins": [-29.546329498291016, -28.719093322753906, -27.89185905456543, -27.06462287902832, -26.237388610839844, -25.410152435302734, -24.582916259765625, -23.75568199157715, -22.92844581604004, -22.10120964050293, -21.273975372314453, -20.446739196777344, -19.619504928588867, -18.792268753051758, -17.96503448486328, -17.137798309326172, -16.310562133789062, -15.48332691192627, -14.656091690063477, -13.828855514526367, -13.001620292663574, -12.174385070800781, -11.347149848937988, -10.519914627075195, -9.692680358886719, -8.865445137023926, -8.038209915161133, -7.210974216461182, -6.3837385177612305, -5.5565032958984375, -4.7292680740356445, -3.9020323753356934, -3.074796676635742, -2.24756121635437, -1.4203258752822876, -0.5930905342102051, 0.234144926071167, 1.061380386352539, 1.888615608215332, 2.715851306915283, 3.543086528778076, 4.370321750640869, 5.19755744934082, 6.024792671203613, 6.852027893066406, 7.679263591766357, 8.506498336791992, 9.333734512329102, 10.160969734191895, 10.988204956054688, 11.81544017791748, 12.642675399780273, 13.469911575317383, 14.297146797180176, 15.124382019042969, 15.951618194580078, 16.778852462768555, 17.606088638305664, 18.43332290649414, 19.26055908203125, 20.087793350219727, 20.915029525756836, 21.742263793945312, 22.569499969482422, 23.39673614501953]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 4.0, 4.0, 4.0, 7.0, 7.0, 6.0, 9.0, 15.0, 9.0, 22.0, 16.0, 22.0, 26.0, 34.0, 27.0, 38.0, 28.0, 29.0, 26.0, 40.0, 33.0, 47.0, 32.0, 49.0, 42.0, 40.0, 36.0, 25.0, 36.0, 31.0, 24.0, 32.0, 31.0, 19.0, 27.0, 17.0, 15.0, 14.0, 18.0, 15.0, 5.0, 11.0, 6.0, 5.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.621994018554688, -23.85186767578125, -23.081741333007812, -22.311614990234375, -21.541488647460938, -20.7713623046875, -20.001235961914062, -19.231111526489258, -18.46098518371582, -17.690858840942383, -16.920732498168945, -16.150606155395508, -15.380480766296387, -14.61035442352295, -13.840228080749512, -13.07010269165039, -12.299975395202637, -11.5298490524292, -10.759722709655762, -9.98959732055664, -9.219470977783203, -8.449344635009766, -7.679218292236328, -6.909092426300049, -6.138966083526611, -5.368839740753174, -4.5987138748168945, -3.828587532043457, -3.0584614276885986, -2.2883353233337402, -1.5182089805603027, -0.7480831146240234, 0.022043228149414062, 0.7921693921089172, 1.5622955560684204, 2.3324217796325684, 3.1025478839874268, 3.872673988342285, 4.642800331115723, 5.412926197052002, 6.1830525398254395, 6.953178882598877, 7.723304748535156, 8.493431091308594, 9.263557434082031, 10.033683776855469, 10.803810119628906, 11.573935508728027, 12.344061851501465, 13.114188194274902, 13.88431453704834, 14.654439926147461, 15.424566268920898, 16.194692611694336, 16.964818954467773, 17.73494529724121, 18.50507164001465, 19.275197982788086, 20.045324325561523, 20.81545066833496, 21.5855770111084, 22.355701446533203, 23.12582778930664, 23.895954132080078, 24.666080474853516]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 13.0, 25.0, 45.0, 76.0, 134.0, 218.0, 324.0, 560.0, 897.0, 1610.0, 2750.0, 4810.0, 8204.0, 14979.0, 28084.0, 53127.0, 106015.0, 223524.0, 474716.0, 867551.0, 1022275.0, 702164.0, 350060.0, 163565.0, 79462.0, 41099.0, 21337.0, 11663.0, 6528.0, 3640.0, 2015.0, 1215.0, 670.0, 370.0, 213.0, 149.0, 88.0, 37.0, 26.0, 15.0, 8.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.625, -35.49072265625, -34.3564453125, -33.22216796875, -32.087890625, -30.95361328125, -29.8193359375, -28.68505859375, -27.55078125, -26.41650390625, -25.2822265625, -24.14794921875, -23.013671875, -21.87939453125, -20.7451171875, -19.61083984375, -18.4765625, -17.34228515625, -16.2080078125, -15.07373046875, -13.939453125, -12.80517578125, -11.6708984375, -10.53662109375, -9.40234375, -8.26806640625, -7.1337890625, -5.99951171875, -4.865234375, -3.73095703125, -2.5966796875, -1.46240234375, -0.328125, 0.80615234375, 1.9404296875, 3.07470703125, 4.208984375, 5.34326171875, 6.4775390625, 7.61181640625, 8.74609375, 9.88037109375, 11.0146484375, 12.14892578125, 13.283203125, 14.41748046875, 15.5517578125, 16.68603515625, 17.8203125, 18.95458984375, 20.0888671875, 21.22314453125, 22.357421875, 23.49169921875, 24.6259765625, 25.76025390625, 26.89453125, 28.02880859375, 29.1630859375, 30.29736328125, 31.431640625, 32.56591796875, 33.7001953125, 34.83447265625, 35.96875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 3.0, 8.0, 4.0, 11.0, 7.0, 6.0, 15.0, 15.0, 17.0, 15.0, 21.0, 40.0, 23.0, 29.0, 30.0, 34.0, 24.0, 32.0, 29.0, 41.0, 42.0, 48.0, 43.0, 47.0, 38.0, 38.0, 31.0, 23.0, 19.0, 29.0, 35.0, 32.0, 24.0, 23.0, 19.0, 11.0, 18.0, 15.0, 12.0, 7.0, 8.0, 5.0, 6.0, 2.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-20.40625, -19.74609375, -19.0859375, -18.42578125, -17.765625, -17.10546875, -16.4453125, -15.78515625, -15.125, -14.46484375, -13.8046875, -13.14453125, -12.484375, -11.82421875, -11.1640625, -10.50390625, -9.84375, -9.18359375, -8.5234375, -7.86328125, -7.203125, -6.54296875, -5.8828125, -5.22265625, -4.5625, -3.90234375, -3.2421875, -2.58203125, -1.921875, -1.26171875, -0.6015625, 0.05859375, 0.71875, 1.37890625, 2.0390625, 2.69921875, 3.359375, 4.01953125, 4.6796875, 5.33984375, 6.0, 6.66015625, 7.3203125, 7.98046875, 8.640625, 9.30078125, 9.9609375, 10.62109375, 11.28125, 11.94140625, 12.6015625, 13.26171875, 13.921875, 14.58203125, 15.2421875, 15.90234375, 16.5625, 17.22265625, 17.8828125, 18.54296875, 19.203125, 19.86328125, 20.5234375, 21.18359375, 21.84375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 10.0, 13.0, 12.0, 25.0, 38.0, 71.0, 95.0, 135.0, 236.0, 376.0, 681.0, 1054.0, 1696.0, 2879.0, 4846.0, 8379.0, 14710.0, 26459.0, 47453.0, 88429.0, 164897.0, 304341.0, 531601.0, 788315.0, 828457.0, 601629.0, 354198.0, 192865.0, 103204.0, 55818.0, 30667.0, 17133.0, 9804.0, 5637.0, 3229.0, 1916.0, 1133.0, 713.0, 434.0, 253.0, 172.0, 88.0, 66.0, 43.0, 29.0, 17.0, 17.0, 7.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-36.75, -35.640625, -34.53125, -33.421875, -32.3125, -31.203125, -30.09375, -28.984375, -27.875, -26.765625, -25.65625, -24.546875, -23.4375, -22.328125, -21.21875, -20.109375, -19.0, -17.890625, -16.78125, -15.671875, -14.5625, -13.453125, -12.34375, -11.234375, -10.125, -9.015625, -7.90625, -6.796875, -5.6875, -4.578125, -3.46875, -2.359375, -1.25, -0.140625, 0.96875, 2.078125, 3.1875, 4.296875, 5.40625, 6.515625, 7.625, 8.734375, 9.84375, 10.953125, 12.0625, 13.171875, 14.28125, 15.390625, 16.5, 17.609375, 18.71875, 19.828125, 20.9375, 22.046875, 23.15625, 24.265625, 25.375, 26.484375, 27.59375, 28.703125, 29.8125, 30.921875, 32.03125, 33.140625, 34.25]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 13.0, 18.0, 28.0, 28.0, 38.0, 62.0, 56.0, 89.0, 123.0, 120.0, 171.0, 204.0, 236.0, 242.0, 250.0, 281.0, 299.0, 293.0, 305.0, 243.0, 197.0, 155.0, 135.0, 125.0, 77.0, 72.0, 54.0, 39.0, 29.0, 27.0, 18.0, 18.0, 9.0, 2.0, 10.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.609375, -10.152587890625, -9.69580078125, -9.239013671875, -8.7822265625, -8.325439453125, -7.86865234375, -7.411865234375, -6.955078125, -6.498291015625, -6.04150390625, -5.584716796875, -5.1279296875, -4.671142578125, -4.21435546875, -3.757568359375, -3.30078125, -2.843994140625, -2.38720703125, -1.930419921875, -1.4736328125, -1.016845703125, -0.56005859375, -0.103271484375, 0.353515625, 0.810302734375, 1.26708984375, 1.723876953125, 2.1806640625, 2.637451171875, 3.09423828125, 3.551025390625, 4.0078125, 4.464599609375, 4.92138671875, 5.378173828125, 5.8349609375, 6.291748046875, 6.74853515625, 7.205322265625, 7.662109375, 8.118896484375, 8.57568359375, 9.032470703125, 9.4892578125, 9.946044921875, 10.40283203125, 10.859619140625, 11.31640625, 11.773193359375, 12.22998046875, 12.686767578125, 13.1435546875, 13.600341796875, 14.05712890625, 14.513916015625, 14.970703125, 15.427490234375, 15.88427734375, 16.341064453125, 16.7978515625, 17.254638671875, 17.71142578125, 18.168212890625, 18.625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 5.0, 5.0, 6.0, 8.0, 10.0, 11.0, 21.0, 14.0, 29.0, 24.0, 31.0, 21.0, 23.0, 42.0, 33.0, 51.0, 48.0, 48.0, 54.0, 49.0, 58.0, 51.0, 33.0, 45.0, 31.0, 28.0, 34.0, 28.0, 34.0, 23.0, 10.0, 17.0, 8.0, 17.0, 16.0, 10.0, 4.0, 6.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-32.16241455078125, -31.269439697265625, -30.37646484375, -29.483489990234375, -28.590517044067383, -27.697542190551758, -26.804567337036133, -25.911592483520508, -25.018619537353516, -24.12564468383789, -23.232669830322266, -22.33969497680664, -21.44672203063965, -20.553747177124023, -19.6607723236084, -18.767797470092773, -17.87482261657715, -16.981847763061523, -16.0888729095459, -15.19589900970459, -14.302925109863281, -13.409950256347656, -12.516975402832031, -11.624000549316406, -10.731026649475098, -9.838051795959473, -8.945077896118164, -8.052103042602539, -7.159128665924072, -6.2661542892456055, -5.3731794357299805, -4.480205059051514, -3.587228775024414, -2.6942543983459473, -1.8012797832489014, -0.9083051681518555, -0.015330791473388672, 0.8776435852050781, 1.7706184387207031, 2.66359281539917, 3.5565671920776367, 4.4495415687561035, 5.34251594543457, 6.235490798950195, 7.128465175628662, 8.021439552307129, 8.914414405822754, 9.807388305664062, 10.700363159179688, 11.593338012695312, 12.486311912536621, 13.379286766052246, 14.272260665893555, 15.16523551940918, 16.058210372924805, 16.95118522644043, 17.844158172607422, 18.737133026123047, 19.630107879638672, 20.523082733154297, 21.41605567932129, 22.309030532836914, 23.20200538635254, 24.094980239868164, 24.98795509338379]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 0.0, 5.0, 6.0, 3.0, 4.0, 7.0, 5.0, 13.0, 7.0, 13.0, 14.0, 13.0, 28.0, 26.0, 30.0, 36.0, 40.0, 30.0, 25.0, 36.0, 29.0, 37.0, 42.0, 49.0, 42.0, 49.0, 37.0, 33.0, 44.0, 35.0, 36.0, 24.0, 33.0, 32.0, 18.0, 20.0, 14.0, 17.0, 12.0, 13.0, 10.0, 8.0, 10.0, 8.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.61370277404785, -22.778467178344727, -21.9432315826416, -21.10799789428711, -20.272762298583984, -19.43752670288086, -18.602291107177734, -17.76705551147461, -16.931819915771484, -16.09658432006836, -15.26134967803955, -14.426114082336426, -13.590879440307617, -12.755643844604492, -11.920408248901367, -11.085172653198242, -10.24993896484375, -9.414703369140625, -8.579468727111816, -7.744233131408691, -6.908998012542725, -6.073762893676758, -5.238527297973633, -4.403292179107666, -3.568057060241699, -2.7328219413757324, -1.8975865840911865, -1.0623512268066406, -0.22711610794067383, 0.608119010925293, 1.443354606628418, 2.2785897254943848, 3.1138229370117188, 3.9490580558776855, 4.784293174743652, 5.619528770446777, 6.454763889312744, 7.289999008178711, 8.125234603881836, 8.960470199584961, 9.79570484161377, 10.630940437316895, 11.466175079345703, 12.301410675048828, 13.136646270751953, 13.971880912780762, 14.807116508483887, 15.642351150512695, 16.47758674621582, 17.312822341918945, 18.14805793762207, 18.983291625976562, 19.818527221679688, 20.653762817382812, 21.488998413085938, 22.324234008789062, 23.159469604492188, 23.994705200195312, 24.829940795898438, 25.665176391601562, 26.500410079956055, 27.33564567565918, 28.170881271362305, 29.00611686706543, 29.841350555419922]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 11.0, 19.0, 22.0, 41.0, 41.0, 67.0, 116.0, 156.0, 272.0, 420.0, 570.0, 875.0, 1251.0, 1784.0, 2739.0, 4041.0, 6054.0, 9018.0, 13178.0, 19951.0, 29334.0, 43731.0, 63971.0, 88842.0, 116367.0, 134585.0, 132679.0, 111202.0, 83746.0, 59069.0, 40788.0, 27303.0, 18468.0, 12361.0, 8207.0, 5670.0, 3762.0, 2552.0, 1703.0, 1184.0, 790.0, 559.0, 370.0, 218.0, 158.0, 104.0, 84.0, 40.0, 37.0, 19.0, 11.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.3671875, -9.0430908203125, -8.718994140625, -8.3948974609375, -8.07080078125, -7.7467041015625, -7.422607421875, -7.0985107421875, -6.7744140625, -6.4503173828125, -6.126220703125, -5.8021240234375, -5.47802734375, -5.1539306640625, -4.829833984375, -4.5057373046875, -4.181640625, -3.8575439453125, -3.533447265625, -3.2093505859375, -2.88525390625, -2.5611572265625, -2.237060546875, -1.9129638671875, -1.5888671875, -1.2647705078125, -0.940673828125, -0.6165771484375, -0.29248046875, 0.0316162109375, 0.355712890625, 0.6798095703125, 1.00390625, 1.3280029296875, 1.652099609375, 1.9761962890625, 2.30029296875, 2.6243896484375, 2.948486328125, 3.2725830078125, 3.5966796875, 3.9207763671875, 4.244873046875, 4.5689697265625, 4.89306640625, 5.2171630859375, 5.541259765625, 5.8653564453125, 6.189453125, 6.5135498046875, 6.837646484375, 7.1617431640625, 7.48583984375, 7.8099365234375, 8.134033203125, 8.4581298828125, 8.7822265625, 9.1063232421875, 9.430419921875, 9.7545166015625, 10.07861328125, 10.4027099609375, 10.726806640625, 11.0509033203125, 11.375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 3.0, 3.0, 6.0, 7.0, 6.0, 14.0, 9.0, 7.0, 12.0, 19.0, 14.0, 22.0, 20.0, 31.0, 33.0, 40.0, 33.0, 45.0, 39.0, 38.0, 45.0, 45.0, 45.0, 42.0, 37.0, 45.0, 28.0, 40.0, 43.0, 30.0, 33.0, 24.0, 27.0, 28.0, 14.0, 8.0, 13.0, 14.0, 7.0, 8.0, 6.0, 9.0, 10.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.578125, -24.677490234375, -23.77685546875, -22.876220703125, -21.9755859375, -21.074951171875, -20.17431640625, -19.273681640625, -18.373046875, -17.472412109375, -16.57177734375, -15.671142578125, -14.7705078125, -13.869873046875, -12.96923828125, -12.068603515625, -11.16796875, -10.267333984375, -9.36669921875, -8.466064453125, -7.5654296875, -6.664794921875, -5.76416015625, -4.863525390625, -3.962890625, -3.062255859375, -2.16162109375, -1.260986328125, -0.3603515625, 0.540283203125, 1.44091796875, 2.341552734375, 3.2421875, 4.142822265625, 5.04345703125, 5.944091796875, 6.8447265625, 7.745361328125, 8.64599609375, 9.546630859375, 10.447265625, 11.347900390625, 12.24853515625, 13.149169921875, 14.0498046875, 14.950439453125, 15.85107421875, 16.751708984375, 17.65234375, 18.552978515625, 19.45361328125, 20.354248046875, 21.2548828125, 22.155517578125, 23.05615234375, 23.956787109375, 24.857421875, 25.758056640625, 26.65869140625, 27.559326171875, 28.4599609375, 29.360595703125, 30.26123046875, 31.161865234375, 32.0625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 7.0, 13.0, 23.0, 33.0, 46.0, 90.0, 131.0, 181.0, 284.0, 391.0, 583.0, 914.0, 1409.0, 2213.0, 3342.0, 5312.0, 8400.0, 13573.0, 21740.0, 35161.0, 55777.0, 86254.0, 127057.0, 162845.0, 162274.0, 126809.0, 85596.0, 54770.0, 34874.0, 21464.0, 13436.0, 8529.0, 5471.0, 3341.0, 2105.0, 1401.0, 914.0, 602.0, 392.0, 289.0, 170.0, 116.0, 86.0, 40.0, 34.0, 21.0, 19.0, 10.0, 3.0, 8.0, 4.0, 0.0, 3.0, 1.0, 1.0], "bins": [-14.4296875, -13.9923095703125, -13.554931640625, -13.1175537109375, -12.68017578125, -12.2427978515625, -11.805419921875, -11.3680419921875, -10.9306640625, -10.4932861328125, -10.055908203125, -9.6185302734375, -9.18115234375, -8.7437744140625, -8.306396484375, -7.8690185546875, -7.431640625, -6.9942626953125, -6.556884765625, -6.1195068359375, -5.68212890625, -5.2447509765625, -4.807373046875, -4.3699951171875, -3.9326171875, -3.4952392578125, -3.057861328125, -2.6204833984375, -2.18310546875, -1.7457275390625, -1.308349609375, -0.8709716796875, -0.43359375, 0.0037841796875, 0.441162109375, 0.8785400390625, 1.31591796875, 1.7532958984375, 2.190673828125, 2.6280517578125, 3.0654296875, 3.5028076171875, 3.940185546875, 4.3775634765625, 4.81494140625, 5.2523193359375, 5.689697265625, 6.1270751953125, 6.564453125, 7.0018310546875, 7.439208984375, 7.8765869140625, 8.31396484375, 8.7513427734375, 9.188720703125, 9.6260986328125, 10.0634765625, 10.5008544921875, 10.938232421875, 11.3756103515625, 11.81298828125, 12.2503662109375, 12.687744140625, 13.1251220703125, 13.5625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 1.0, 5.0, 6.0, 6.0, 6.0, 13.0, 13.0, 18.0, 21.0, 19.0, 21.0, 16.0, 32.0, 30.0, 17.0, 30.0, 38.0, 32.0, 47.0, 41.0, 37.0, 39.0, 36.0, 37.0, 45.0, 43.0, 33.0, 37.0, 41.0, 25.0, 24.0, 21.0, 22.0, 19.0, 18.0, 22.0, 17.0, 21.0, 8.0, 11.0, 3.0, 6.0, 9.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.625, -15.108154296875, -14.59130859375, -14.074462890625, -13.5576171875, -13.040771484375, -12.52392578125, -12.007080078125, -11.490234375, -10.973388671875, -10.45654296875, -9.939697265625, -9.4228515625, -8.906005859375, -8.38916015625, -7.872314453125, -7.35546875, -6.838623046875, -6.32177734375, -5.804931640625, -5.2880859375, -4.771240234375, -4.25439453125, -3.737548828125, -3.220703125, -2.703857421875, -2.18701171875, -1.670166015625, -1.1533203125, -0.636474609375, -0.11962890625, 0.397216796875, 0.9140625, 1.430908203125, 1.94775390625, 2.464599609375, 2.9814453125, 3.498291015625, 4.01513671875, 4.531982421875, 5.048828125, 5.565673828125, 6.08251953125, 6.599365234375, 7.1162109375, 7.633056640625, 8.14990234375, 8.666748046875, 9.18359375, 9.700439453125, 10.21728515625, 10.734130859375, 11.2509765625, 11.767822265625, 12.28466796875, 12.801513671875, 13.318359375, 13.835205078125, 14.35205078125, 14.868896484375, 15.3857421875, 15.902587890625, 16.41943359375, 16.936279296875, 17.453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 8.0, 4.0, 11.0, 7.0, 12.0, 18.0, 40.0, 41.0, 84.0, 116.0, 170.0, 267.0, 324.0, 520.0, 893.0, 1306.0, 2196.0, 3571.0, 6102.0, 10688.0, 18711.0, 33906.0, 62001.0, 113203.0, 185699.0, 221708.0, 167098.0, 97600.0, 53340.0, 29117.0, 16156.0, 9513.0, 5461.0, 3228.0, 2027.0, 1176.0, 721.0, 502.0, 336.0, 201.0, 130.0, 104.0, 73.0, 46.0, 32.0, 22.0, 17.0, 13.0, 9.0, 5.0, 8.0, 8.0, 4.0, 1.0, 5.0, 1.0, 1.0], "bins": [-5.28125, -5.11810302734375, -4.9549560546875, -4.79180908203125, -4.628662109375, -4.46551513671875, -4.3023681640625, -4.13922119140625, -3.97607421875, -3.81292724609375, -3.6497802734375, -3.48663330078125, -3.323486328125, -3.16033935546875, -2.9971923828125, -2.83404541015625, -2.6708984375, -2.50775146484375, -2.3446044921875, -2.18145751953125, -2.018310546875, -1.85516357421875, -1.6920166015625, -1.52886962890625, -1.36572265625, -1.20257568359375, -1.0394287109375, -0.87628173828125, -0.713134765625, -0.54998779296875, -0.3868408203125, -0.22369384765625, -0.060546875, 0.10260009765625, 0.2657470703125, 0.42889404296875, 0.592041015625, 0.75518798828125, 0.9183349609375, 1.08148193359375, 1.24462890625, 1.40777587890625, 1.5709228515625, 1.73406982421875, 1.897216796875, 2.06036376953125, 2.2235107421875, 2.38665771484375, 2.5498046875, 2.71295166015625, 2.8760986328125, 3.03924560546875, 3.202392578125, 3.36553955078125, 3.5286865234375, 3.69183349609375, 3.85498046875, 4.01812744140625, 4.1812744140625, 4.34442138671875, 4.507568359375, 4.67071533203125, 4.8338623046875, 4.99700927734375, 5.16015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 2.0, 6.0, 4.0, 12.0, 11.0, 18.0, 16.0, 28.0, 31.0, 45.0, 56.0, 63.0, 69.0, 67.0, 66.0, 77.0, 66.0, 72.0, 56.0, 47.0, 33.0, 36.0, 35.0, 14.0, 13.0, 11.0, 10.0, 4.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000457763671875, -0.000441916286945343, -0.00042606890201568604, -0.00041022151708602905, -0.00039437413215637207, -0.0003785267472267151, -0.0003626793622970581, -0.0003468319773674011, -0.00033098459243774414, -0.00031513720750808716, -0.0002992898225784302, -0.0002834424376487732, -0.0002675950527191162, -0.00025174766778945923, -0.00023590028285980225, -0.00022005289793014526, -0.00020420551300048828, -0.0001883581280708313, -0.00017251074314117432, -0.00015666335821151733, -0.00014081597328186035, -0.00012496858835220337, -0.00010912120342254639, -9.32738184928894e-05, -7.742643356323242e-05, -6.157904863357544e-05, -4.573166370391846e-05, -2.9884278774261475e-05, -1.4036893844604492e-05, 1.8104910850524902e-06, 1.7657876014709473e-05, 3.3505260944366455e-05, 4.935264587402344e-05, 6.520003080368042e-05, 8.10474157333374e-05, 9.689480066299438e-05, 0.00011274218559265137, 0.00012858957052230835, 0.00014443695545196533, 0.00016028434038162231, 0.0001761317253112793, 0.00019197911024093628, 0.00020782649517059326, 0.00022367388010025024, 0.00023952126502990723, 0.0002553686499595642, 0.0002712160348892212, 0.0002870634198188782, 0.00030291080474853516, 0.00031875818967819214, 0.0003346055746078491, 0.0003504529595375061, 0.0003663003444671631, 0.00038214772939682007, 0.00039799511432647705, 0.00041384249925613403, 0.000429689884185791, 0.000445537269115448, 0.000461384654045105, 0.00047723203897476196, 0.0004930794239044189, 0.0005089268088340759, 0.0005247741937637329, 0.0005406215786933899, 0.0005564689636230469]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 5.0, 8.0, 6.0, 19.0, 14.0, 23.0, 34.0, 59.0, 65.0, 128.0, 159.0, 271.0, 407.0, 554.0, 866.0, 1337.0, 1913.0, 3022.0, 4412.0, 6906.0, 10544.0, 16247.0, 25829.0, 40693.0, 63826.0, 97896.0, 133870.0, 157945.0, 148724.0, 114581.0, 78518.0, 50444.0, 31939.0, 20081.0, 12824.0, 8214.0, 5361.0, 3573.0, 2473.0, 1604.0, 1049.0, 677.0, 479.0, 321.0, 196.0, 155.0, 97.0, 70.0, 39.0, 30.0, 19.0, 6.0, 18.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.49609375, -4.34979248046875, -4.2034912109375, -4.05718994140625, -3.910888671875, -3.76458740234375, -3.6182861328125, -3.47198486328125, -3.32568359375, -3.17938232421875, -3.0330810546875, -2.88677978515625, -2.740478515625, -2.59417724609375, -2.4478759765625, -2.30157470703125, -2.1552734375, -2.00897216796875, -1.8626708984375, -1.71636962890625, -1.570068359375, -1.42376708984375, -1.2774658203125, -1.13116455078125, -0.98486328125, -0.83856201171875, -0.6922607421875, -0.54595947265625, -0.399658203125, -0.25335693359375, -0.1070556640625, 0.03924560546875, 0.185546875, 0.33184814453125, 0.4781494140625, 0.62445068359375, 0.770751953125, 0.91705322265625, 1.0633544921875, 1.20965576171875, 1.35595703125, 1.50225830078125, 1.6485595703125, 1.79486083984375, 1.941162109375, 2.08746337890625, 2.2337646484375, 2.38006591796875, 2.5263671875, 2.67266845703125, 2.8189697265625, 2.96527099609375, 3.111572265625, 3.25787353515625, 3.4041748046875, 3.55047607421875, 3.69677734375, 3.84307861328125, 3.9893798828125, 4.13568115234375, 4.281982421875, 4.42828369140625, 4.5745849609375, 4.72088623046875, 4.8671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 1.0, 5.0, 9.0, 5.0, 7.0, 10.0, 11.0, 10.0, 36.0, 20.0, 25.0, 30.0, 34.0, 41.0, 43.0, 40.0, 58.0, 54.0, 54.0, 49.0, 42.0, 40.0, 49.0, 52.0, 48.0, 38.0, 25.0, 29.0, 25.0, 18.0, 16.0, 12.0, 11.0, 9.0, 11.0, 6.0, 3.0, 1.0, 1.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6630859375, -1.6056060791015625, -1.548126220703125, -1.4906463623046875, -1.43316650390625, -1.3756866455078125, -1.318206787109375, -1.2607269287109375, -1.2032470703125, -1.1457672119140625, -1.088287353515625, -1.0308074951171875, -0.97332763671875, -0.9158477783203125, -0.858367919921875, -0.8008880615234375, -0.743408203125, -0.6859283447265625, -0.628448486328125, -0.5709686279296875, -0.51348876953125, -0.4560089111328125, -0.398529052734375, -0.3410491943359375, -0.2835693359375, -0.2260894775390625, -0.168609619140625, -0.1111297607421875, -0.05364990234375, 0.0038299560546875, 0.061309814453125, 0.1187896728515625, 0.17626953125, 0.2337493896484375, 0.291229248046875, 0.3487091064453125, 0.40618896484375, 0.4636688232421875, 0.521148681640625, 0.5786285400390625, 0.6361083984375, 0.6935882568359375, 0.751068115234375, 0.8085479736328125, 0.86602783203125, 0.9235076904296875, 0.980987548828125, 1.0384674072265625, 1.095947265625, 1.1534271240234375, 1.210906982421875, 1.2683868408203125, 1.32586669921875, 1.3833465576171875, 1.440826416015625, 1.4983062744140625, 1.5557861328125, 1.6132659912109375, 1.670745849609375, 1.7282257080078125, 1.78570556640625, 1.8431854248046875, 1.900665283203125, 1.9581451416015625, 2.015625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 7.0, 10.0, 9.0, 19.0, 19.0, 22.0, 20.0, 30.0, 23.0, 32.0, 32.0, 40.0, 38.0, 40.0, 49.0, 51.0, 57.0, 54.0, 44.0, 44.0, 42.0, 38.0, 31.0, 31.0, 25.0, 32.0, 26.0, 21.0, 20.0, 12.0, 11.0, 9.0, 15.0, 10.0, 6.0, 4.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-30.013689041137695, -29.141399383544922, -28.269107818603516, -27.396818161010742, -26.52452850341797, -25.652236938476562, -24.77994728088379, -23.907657623291016, -23.03536605834961, -22.163076400756836, -21.29078483581543, -20.418495178222656, -19.546205520629883, -18.67391586303711, -17.801624298095703, -16.92933464050293, -16.057044982910156, -15.184754371643066, -14.312464714050293, -13.440174102783203, -12.56788444519043, -11.69559383392334, -10.82330322265625, -9.951013565063477, -9.078722953796387, -8.206432342529297, -7.334142684936523, -6.461852073669434, -5.589561939239502, -4.71727180480957, -3.8449811935424805, -2.972691059112549, -2.1003990173339844, -1.2281087636947632, -0.355818510055542, 0.5164718627929688, 1.3887619972229004, 2.261052131652832, 3.133342742919922, 4.0056328773498535, 4.877923011779785, 5.750213146209717, 6.622503280639648, 7.494793891906738, 8.367084503173828, 9.239374160766602, 10.111664772033691, 10.983955383300781, 11.856245040893555, 12.728535652160645, 13.600825309753418, 14.473115921020508, 15.345405578613281, 16.217697143554688, 17.08998680114746, 17.962276458740234, 18.83456802368164, 19.706857681274414, 20.57914924621582, 21.451438903808594, 22.323728561401367, 23.19601821899414, 24.068309783935547, 24.94059944152832, 25.812889099121094]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 3.0, 6.0, 3.0, 10.0, 11.0, 10.0, 11.0, 13.0, 17.0, 31.0, 21.0, 38.0, 32.0, 47.0, 25.0, 34.0, 28.0, 33.0, 38.0, 49.0, 48.0, 45.0, 35.0, 44.0, 38.0, 43.0, 33.0, 31.0, 30.0, 29.0, 26.0, 19.0, 17.0, 16.0, 17.0, 7.0, 17.0, 6.0, 10.0, 9.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.278066635131836, -22.437660217285156, -21.597253799438477, -20.756847381591797, -19.916440963745117, -19.076034545898438, -18.235626220703125, -17.395219802856445, -16.554813385009766, -15.714406967163086, -14.874000549316406, -14.033594131469727, -13.19318675994873, -12.35278034210205, -11.512373924255371, -10.671966552734375, -9.831561088562012, -8.991154670715332, -8.150748252868652, -7.3103413581848145, -6.469934463500977, -5.629528045654297, -4.789121627807617, -3.9487147331237793, -3.1083083152770996, -2.267901659011841, -1.4274951219558716, -0.5870885848999023, 0.25331807136535645, 1.0937247276306152, 1.934131145477295, 2.774538040161133, 3.6149444580078125, 4.455350875854492, 5.29575777053833, 6.13616418838501, 6.976571083068848, 7.816977500915527, 8.657383918762207, 9.497791290283203, 10.338197708129883, 11.178604125976562, 12.019010543823242, 12.859416961669922, 13.699824333190918, 14.540230751037598, 15.380637168884277, 16.221044540405273, 17.061450958251953, 17.901857376098633, 18.742263793945312, 19.582670211791992, 20.423076629638672, 21.263484954833984, 22.10388946533203, 22.944297790527344, 23.78470230102539, 24.62510871887207, 25.46551513671875, 26.30592155456543, 27.14632797241211, 27.986736297607422, 28.82714080810547, 29.66754913330078, 30.50795555114746]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 11.0, 11.0, 30.0, 31.0, 54.0, 96.0, 131.0, 187.0, 304.0, 373.0, 657.0, 974.0, 1557.0, 2340.0, 3601.0, 5438.0, 8408.0, 12676.0, 19349.0, 28793.0, 42207.0, 59779.0, 79755.0, 101794.0, 117758.0, 121747.0, 112708.0, 94085.0, 72122.0, 52359.0, 36484.0, 24562.0, 16584.0, 11009.0, 7029.0, 4757.0, 3057.0, 1962.0, 1248.0, 888.0, 529.0, 373.0, 248.0, 154.0, 112.0, 77.0, 43.0, 40.0, 19.0, 15.0, 10.0, 7.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0], "bins": [-20.953125, -20.283935546875, -19.61474609375, -18.945556640625, -18.2763671875, -17.607177734375, -16.93798828125, -16.268798828125, -15.599609375, -14.930419921875, -14.26123046875, -13.592041015625, -12.9228515625, -12.253662109375, -11.58447265625, -10.915283203125, -10.24609375, -9.576904296875, -8.90771484375, -8.238525390625, -7.5693359375, -6.900146484375, -6.23095703125, -5.561767578125, -4.892578125, -4.223388671875, -3.55419921875, -2.885009765625, -2.2158203125, -1.546630859375, -0.87744140625, -0.208251953125, 0.4609375, 1.130126953125, 1.79931640625, 2.468505859375, 3.1376953125, 3.806884765625, 4.47607421875, 5.145263671875, 5.814453125, 6.483642578125, 7.15283203125, 7.822021484375, 8.4912109375, 9.160400390625, 9.82958984375, 10.498779296875, 11.16796875, 11.837158203125, 12.50634765625, 13.175537109375, 13.8447265625, 14.513916015625, 15.18310546875, 15.852294921875, 16.521484375, 17.190673828125, 17.85986328125, 18.529052734375, 19.1982421875, 19.867431640625, 20.53662109375, 21.205810546875, 21.875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 5.0, 11.0, 6.0, 10.0, 8.0, 11.0, 16.0, 17.0, 26.0, 21.0, 28.0, 31.0, 26.0, 33.0, 35.0, 42.0, 41.0, 35.0, 39.0, 38.0, 49.0, 41.0, 41.0, 33.0, 37.0, 40.0, 30.0, 29.0, 29.0, 17.0, 32.0, 17.0, 12.0, 9.0, 16.0, 10.0, 12.0, 17.0, 10.0, 5.0, 7.0, 8.0, 1.0, 2.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0], "bins": [-26.1875, -25.374755859375, -24.56201171875, -23.749267578125, -22.9365234375, -22.123779296875, -21.31103515625, -20.498291015625, -19.685546875, -18.872802734375, -18.06005859375, -17.247314453125, -16.4345703125, -15.621826171875, -14.80908203125, -13.996337890625, -13.18359375, -12.370849609375, -11.55810546875, -10.745361328125, -9.9326171875, -9.119873046875, -8.30712890625, -7.494384765625, -6.681640625, -5.868896484375, -5.05615234375, -4.243408203125, -3.4306640625, -2.617919921875, -1.80517578125, -0.992431640625, -0.1796875, 0.633056640625, 1.44580078125, 2.258544921875, 3.0712890625, 3.884033203125, 4.69677734375, 5.509521484375, 6.322265625, 7.135009765625, 7.94775390625, 8.760498046875, 9.5732421875, 10.385986328125, 11.19873046875, 12.011474609375, 12.82421875, 13.636962890625, 14.44970703125, 15.262451171875, 16.0751953125, 16.887939453125, 17.70068359375, 18.513427734375, 19.326171875, 20.138916015625, 20.95166015625, 21.764404296875, 22.5771484375, 23.389892578125, 24.20263671875, 25.015380859375, 25.828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 10.0, 7.0, 20.0, 19.0, 37.0, 60.0, 119.0, 180.0, 215.0, 388.0, 671.0, 969.0, 1573.0, 2496.0, 3890.0, 6256.0, 9886.0, 15187.0, 23635.0, 37028.0, 56061.0, 80285.0, 106592.0, 127898.0, 134330.0, 123014.0, 100213.0, 74044.0, 50768.0, 33265.0, 21724.0, 13704.0, 8779.0, 5474.0, 3575.0, 2191.0, 1454.0, 900.0, 623.0, 364.0, 228.0, 157.0, 104.0, 54.0, 38.0, 26.0, 24.0, 14.0, 9.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.90625, -23.119384765625, -22.33251953125, -21.545654296875, -20.7587890625, -19.971923828125, -19.18505859375, -18.398193359375, -17.611328125, -16.824462890625, -16.03759765625, -15.250732421875, -14.4638671875, -13.677001953125, -12.89013671875, -12.103271484375, -11.31640625, -10.529541015625, -9.74267578125, -8.955810546875, -8.1689453125, -7.382080078125, -6.59521484375, -5.808349609375, -5.021484375, -4.234619140625, -3.44775390625, -2.660888671875, -1.8740234375, -1.087158203125, -0.30029296875, 0.486572265625, 1.2734375, 2.060302734375, 2.84716796875, 3.634033203125, 4.4208984375, 5.207763671875, 5.99462890625, 6.781494140625, 7.568359375, 8.355224609375, 9.14208984375, 9.928955078125, 10.7158203125, 11.502685546875, 12.28955078125, 13.076416015625, 13.86328125, 14.650146484375, 15.43701171875, 16.223876953125, 17.0107421875, 17.797607421875, 18.58447265625, 19.371337890625, 20.158203125, 20.945068359375, 21.73193359375, 22.518798828125, 23.3056640625, 24.092529296875, 24.87939453125, 25.666259765625, 26.453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 8.0, 4.0, 9.0, 9.0, 13.0, 12.0, 13.0, 14.0, 17.0, 18.0, 19.0, 36.0, 26.0, 41.0, 26.0, 41.0, 36.0, 46.0, 38.0, 40.0, 43.0, 49.0, 37.0, 30.0, 43.0, 30.0, 28.0, 23.0, 42.0, 32.0, 34.0, 22.0, 17.0, 16.0, 12.0, 20.0, 4.0, 9.0, 4.0, 13.0, 13.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -15.90771484375, -15.3623046875, -14.81689453125, -14.271484375, -13.72607421875, -13.1806640625, -12.63525390625, -12.08984375, -11.54443359375, -10.9990234375, -10.45361328125, -9.908203125, -9.36279296875, -8.8173828125, -8.27197265625, -7.7265625, -7.18115234375, -6.6357421875, -6.09033203125, -5.544921875, -4.99951171875, -4.4541015625, -3.90869140625, -3.36328125, -2.81787109375, -2.2724609375, -1.72705078125, -1.181640625, -0.63623046875, -0.0908203125, 0.45458984375, 1.0, 1.54541015625, 2.0908203125, 2.63623046875, 3.181640625, 3.72705078125, 4.2724609375, 4.81787109375, 5.36328125, 5.90869140625, 6.4541015625, 6.99951171875, 7.544921875, 8.09033203125, 8.6357421875, 9.18115234375, 9.7265625, 10.27197265625, 10.8173828125, 11.36279296875, 11.908203125, 12.45361328125, 12.9990234375, 13.54443359375, 14.08984375, 14.63525390625, 15.1806640625, 15.72607421875, 16.271484375, 16.81689453125, 17.3623046875, 17.90771484375, 18.453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 15.0, 16.0, 18.0, 38.0, 58.0, 100.0, 137.0, 217.0, 328.0, 507.0, 779.0, 1182.0, 2007.0, 3199.0, 5327.0, 8828.0, 14994.0, 25055.0, 41885.0, 70284.0, 109687.0, 151469.0, 171555.0, 153119.0, 110887.0, 70846.0, 42945.0, 25304.0, 14851.0, 8771.0, 5312.0, 3378.0, 2009.0, 1227.0, 767.0, 538.0, 286.0, 210.0, 124.0, 87.0, 66.0, 45.0, 23.0, 23.0, 13.0, 11.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.1875, -10.8433837890625, -10.499267578125, -10.1551513671875, -9.81103515625, -9.4669189453125, -9.122802734375, -8.7786865234375, -8.4345703125, -8.0904541015625, -7.746337890625, -7.4022216796875, -7.05810546875, -6.7139892578125, -6.369873046875, -6.0257568359375, -5.681640625, -5.3375244140625, -4.993408203125, -4.6492919921875, -4.30517578125, -3.9610595703125, -3.616943359375, -3.2728271484375, -2.9287109375, -2.5845947265625, -2.240478515625, -1.8963623046875, -1.55224609375, -1.2081298828125, -0.864013671875, -0.5198974609375, -0.17578125, 0.1683349609375, 0.512451171875, 0.8565673828125, 1.20068359375, 1.5447998046875, 1.888916015625, 2.2330322265625, 2.5771484375, 2.9212646484375, 3.265380859375, 3.6094970703125, 3.95361328125, 4.2977294921875, 4.641845703125, 4.9859619140625, 5.330078125, 5.6741943359375, 6.018310546875, 6.3624267578125, 6.70654296875, 7.0506591796875, 7.394775390625, 7.7388916015625, 8.0830078125, 8.4271240234375, 8.771240234375, 9.1153564453125, 9.45947265625, 9.8035888671875, 10.147705078125, 10.4918212890625, 10.8359375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 4.0, 8.0, 10.0, 5.0, 5.0, 14.0, 13.0, 23.0, 22.0, 23.0, 30.0, 34.0, 48.0, 60.0, 65.0, 48.0, 73.0, 55.0, 64.0, 64.0, 54.0, 42.0, 36.0, 44.0, 26.0, 26.0, 18.0, 16.0, 21.0, 18.0, 8.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001064300537109375, -0.0010243356227874756, -0.0009843707084655762, -0.0009444057941436768, -0.0009044408798217773, -0.0008644759654998779, -0.0008245110511779785, -0.0007845461368560791, -0.0007445812225341797, -0.0007046163082122803, -0.0006646513938903809, -0.0006246864795684814, -0.000584721565246582, -0.0005447566509246826, -0.0005047917366027832, -0.0004648268222808838, -0.0004248619079589844, -0.00038489699363708496, -0.00034493207931518555, -0.00030496716499328613, -0.0002650022506713867, -0.0002250373363494873, -0.0001850724220275879, -0.00014510750770568848, -0.00010514259338378906, -6.517767906188965e-05, -2.5212764739990234e-05, 1.475214958190918e-05, 5.4717063903808594e-05, 9.468197822570801e-05, 0.00013464689254760742, 0.00017461180686950684, 0.00021457672119140625, 0.00025454163551330566, 0.0002945065498352051, 0.0003344714641571045, 0.0003744363784790039, 0.0004144012928009033, 0.00045436620712280273, 0.0004943311214447021, 0.0005342960357666016, 0.000574260950088501, 0.0006142258644104004, 0.0006541907787322998, 0.0006941556930541992, 0.0007341206073760986, 0.000774085521697998, 0.0008140504360198975, 0.0008540153503417969, 0.0008939802646636963, 0.0009339451789855957, 0.0009739100933074951, 0.0010138750076293945, 0.001053839921951294, 0.0010938048362731934, 0.0011337697505950928, 0.0011737346649169922, 0.0012136995792388916, 0.001253664493560791, 0.0012936294078826904, 0.0013335943222045898, 0.0013735592365264893, 0.0014135241508483887, 0.001453489065170288, 0.0014934539794921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 3.0, 10.0, 10.0, 24.0, 21.0, 36.0, 63.0, 81.0, 121.0, 173.0, 226.0, 400.0, 659.0, 1014.0, 1749.0, 3068.0, 5397.0, 10431.0, 20843.0, 41291.0, 81940.0, 149284.0, 216478.0, 212306.0, 143379.0, 77883.0, 39633.0, 19395.0, 9813.0, 5416.0, 2999.0, 1604.0, 979.0, 631.0, 404.0, 257.0, 184.0, 100.0, 72.0, 59.0, 37.0, 24.0, 24.0, 11.0, 6.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-16.78125, -16.30126953125, -15.8212890625, -15.34130859375, -14.861328125, -14.38134765625, -13.9013671875, -13.42138671875, -12.94140625, -12.46142578125, -11.9814453125, -11.50146484375, -11.021484375, -10.54150390625, -10.0615234375, -9.58154296875, -9.1015625, -8.62158203125, -8.1416015625, -7.66162109375, -7.181640625, -6.70166015625, -6.2216796875, -5.74169921875, -5.26171875, -4.78173828125, -4.3017578125, -3.82177734375, -3.341796875, -2.86181640625, -2.3818359375, -1.90185546875, -1.421875, -0.94189453125, -0.4619140625, 0.01806640625, 0.498046875, 0.97802734375, 1.4580078125, 1.93798828125, 2.41796875, 2.89794921875, 3.3779296875, 3.85791015625, 4.337890625, 4.81787109375, 5.2978515625, 5.77783203125, 6.2578125, 6.73779296875, 7.2177734375, 7.69775390625, 8.177734375, 8.65771484375, 9.1376953125, 9.61767578125, 10.09765625, 10.57763671875, 11.0576171875, 11.53759765625, 12.017578125, 12.49755859375, 12.9775390625, 13.45751953125, 13.9375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 8.0, 3.0, 13.0, 11.0, 13.0, 20.0, 22.0, 26.0, 38.0, 38.0, 58.0, 68.0, 58.0, 55.0, 62.0, 76.0, 73.0, 63.0, 61.0, 53.0, 36.0, 38.0, 20.0, 24.0, 13.0, 13.0, 11.0, 11.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.59765625, -4.4324951171875, -4.267333984375, -4.1021728515625, -3.93701171875, -3.7718505859375, -3.606689453125, -3.4415283203125, -3.2763671875, -3.1112060546875, -2.946044921875, -2.7808837890625, -2.61572265625, -2.4505615234375, -2.285400390625, -2.1202392578125, -1.955078125, -1.7899169921875, -1.624755859375, -1.4595947265625, -1.29443359375, -1.1292724609375, -0.964111328125, -0.7989501953125, -0.6337890625, -0.4686279296875, -0.303466796875, -0.1383056640625, 0.02685546875, 0.1920166015625, 0.357177734375, 0.5223388671875, 0.6875, 0.8526611328125, 1.017822265625, 1.1829833984375, 1.34814453125, 1.5133056640625, 1.678466796875, 1.8436279296875, 2.0087890625, 2.1739501953125, 2.339111328125, 2.5042724609375, 2.66943359375, 2.8345947265625, 2.999755859375, 3.1649169921875, 3.330078125, 3.4952392578125, 3.660400390625, 3.8255615234375, 3.99072265625, 4.1558837890625, 4.321044921875, 4.4862060546875, 4.6513671875, 4.8165283203125, 4.981689453125, 5.1468505859375, 5.31201171875, 5.4771728515625, 5.642333984375, 5.8074951171875, 5.97265625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 7.0, 15.0, 12.0, 10.0, 15.0, 15.0, 14.0, 20.0, 15.0, 31.0, 27.0, 27.0, 29.0, 33.0, 32.0, 56.0, 46.0, 52.0, 52.0, 46.0, 45.0, 54.0, 35.0, 31.0, 21.0, 35.0, 41.0, 30.0, 27.0, 22.0, 26.0, 11.0, 8.0, 14.0, 7.0, 2.0, 10.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-28.05633544921875, -27.192575454711914, -26.328815460205078, -25.465055465698242, -24.601295471191406, -23.73753547668457, -22.873775482177734, -22.0100154876709, -21.146255493164062, -20.282495498657227, -19.41873550415039, -18.554975509643555, -17.69121551513672, -16.827455520629883, -15.963695526123047, -15.099935531616211, -14.236175537109375, -13.372415542602539, -12.508655548095703, -11.644895553588867, -10.781135559082031, -9.917375564575195, -9.05361557006836, -8.189855575561523, -7.3260955810546875, -6.462335586547852, -5.598575592041016, -4.73481559753418, -3.8710556030273438, -3.007295608520508, -2.143535614013672, -1.279775619506836, -0.416015625, 0.44774436950683594, 1.3115043640136719, 2.175264358520508, 3.0390243530273438, 3.9027843475341797, 4.766544342041016, 5.630304336547852, 6.4940643310546875, 7.357824325561523, 8.22158432006836, 9.085344314575195, 9.949104309082031, 10.812864303588867, 11.676624298095703, 12.540384292602539, 13.404144287109375, 14.267904281616211, 15.131664276123047, 15.995424270629883, 16.85918426513672, 17.722944259643555, 18.58670425415039, 19.450464248657227, 20.314224243164062, 21.1779842376709, 22.041744232177734, 22.90550422668457, 23.769264221191406, 24.633024215698242, 25.496784210205078, 26.360544204711914, 27.22430419921875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 8.0, 5.0, 8.0, 10.0, 9.0, 12.0, 19.0, 16.0, 28.0, 32.0, 29.0, 31.0, 24.0, 37.0, 32.0, 38.0, 31.0, 46.0, 39.0, 57.0, 25.0, 28.0, 48.0, 43.0, 22.0, 39.0, 32.0, 30.0, 30.0, 20.0, 18.0, 18.0, 17.0, 24.0, 22.0, 6.0, 10.0, 9.0, 9.0, 9.0, 7.0, 3.0, 2.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.508243560791016, -22.67460060119629, -21.84095573425293, -21.007312774658203, -20.173667907714844, -19.340024948120117, -18.50638198852539, -17.67273712158203, -16.839092254638672, -16.005449295043945, -15.171804428100586, -14.33816146850586, -13.5045166015625, -12.670873641967773, -11.83722972869873, -11.003585815429688, -10.169942855834961, -9.336298942565918, -8.502655029296875, -7.66901159286499, -6.835367679595947, -6.001723766326904, -5.1680803298950195, -4.334436416625977, -3.5007925033569336, -2.6671485900878906, -1.8335049152374268, -0.9998612403869629, -0.16621732711791992, 0.667426586151123, 1.5010700225830078, 2.334713935852051, 3.1683578491210938, 4.002001762390137, 4.83564567565918, 5.6692891120910645, 6.502933025360107, 7.33657693862915, 8.170220375061035, 9.003864288330078, 9.837508201599121, 10.671152114868164, 11.504796028137207, 12.33843994140625, 13.172082901000977, 14.005727767944336, 14.839370727539062, 15.673014640808105, 16.50665855407715, 17.340301513671875, 18.173946380615234, 19.00758934020996, 19.84123420715332, 20.674877166748047, 21.508522033691406, 22.342164993286133, 23.17580795288086, 24.009450912475586, 24.843095779418945, 25.676738739013672, 26.51038360595703, 27.344026565551758, 28.177669525146484, 29.011314392089844, 29.844959259033203]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 7.0, 3.0, 11.0, 6.0, 28.0, 25.0, 30.0, 47.0, 89.0, 124.0, 175.0, 258.0, 439.0, 701.0, 1063.0, 1808.0, 2848.0, 4463.0, 7490.0, 12447.0, 21131.0, 36270.0, 63995.0, 117180.0, 218846.0, 409481.0, 690896.0, 873440.0, 737718.0, 453561.0, 243820.0, 129071.0, 70805.0, 39356.0, 22495.0, 13257.0, 8118.0, 4877.0, 2984.0, 1783.0, 1213.0, 711.0, 461.0, 293.0, 192.0, 95.0, 76.0, 45.0, 27.0, 18.0, 5.0, 8.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.6513671875, -31.583984375, -30.5166015625, -29.44921875, -28.3818359375, -27.314453125, -26.2470703125, -25.1796875, -24.1123046875, -23.044921875, -21.9775390625, -20.91015625, -19.8427734375, -18.775390625, -17.7080078125, -16.640625, -15.5732421875, -14.505859375, -13.4384765625, -12.37109375, -11.3037109375, -10.236328125, -9.1689453125, -8.1015625, -7.0341796875, -5.966796875, -4.8994140625, -3.83203125, -2.7646484375, -1.697265625, -0.6298828125, 0.4375, 1.5048828125, 2.572265625, 3.6396484375, 4.70703125, 5.7744140625, 6.841796875, 7.9091796875, 8.9765625, 10.0439453125, 11.111328125, 12.1787109375, 13.24609375, 14.3134765625, 15.380859375, 16.4482421875, 17.515625, 18.5830078125, 19.650390625, 20.7177734375, 21.78515625, 22.8525390625, 23.919921875, 24.9873046875, 26.0546875, 27.1220703125, 28.189453125, 29.2568359375, 30.32421875, 31.3916015625, 32.458984375, 33.5263671875, 34.59375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 5.0, 11.0, 6.0, 13.0, 12.0, 11.0, 15.0, 26.0, 18.0, 25.0, 28.0, 25.0, 27.0, 25.0, 29.0, 44.0, 26.0, 55.0, 33.0, 36.0, 36.0, 39.0, 35.0, 31.0, 38.0, 39.0, 40.0, 29.0, 24.0, 26.0, 30.0, 24.0, 13.0, 23.0, 15.0, 8.0, 17.0, 8.0, 14.0, 3.0, 4.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-20.765625, -20.0712890625, -19.376953125, -18.6826171875, -17.98828125, -17.2939453125, -16.599609375, -15.9052734375, -15.2109375, -14.5166015625, -13.822265625, -13.1279296875, -12.43359375, -11.7392578125, -11.044921875, -10.3505859375, -9.65625, -8.9619140625, -8.267578125, -7.5732421875, -6.87890625, -6.1845703125, -5.490234375, -4.7958984375, -4.1015625, -3.4072265625, -2.712890625, -2.0185546875, -1.32421875, -0.6298828125, 0.064453125, 0.7587890625, 1.453125, 2.1474609375, 2.841796875, 3.5361328125, 4.23046875, 4.9248046875, 5.619140625, 6.3134765625, 7.0078125, 7.7021484375, 8.396484375, 9.0908203125, 9.78515625, 10.4794921875, 11.173828125, 11.8681640625, 12.5625, 13.2568359375, 13.951171875, 14.6455078125, 15.33984375, 16.0341796875, 16.728515625, 17.4228515625, 18.1171875, 18.8115234375, 19.505859375, 20.2001953125, 20.89453125, 21.5888671875, 22.283203125, 22.9775390625, 23.671875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 14.0, 16.0, 26.0, 45.0, 85.0, 112.0, 155.0, 287.0, 381.0, 587.0, 810.0, 1321.0, 2055.0, 3351.0, 5532.0, 8945.0, 14398.0, 24690.0, 42834.0, 74499.0, 131410.0, 229468.0, 392967.0, 611923.0, 769843.0, 701108.0, 486135.0, 293294.0, 169287.0, 95570.0, 53972.0, 31570.0, 18558.0, 11072.0, 6691.0, 4102.0, 2618.0, 1624.0, 1034.0, 640.0, 443.0, 260.0, 169.0, 126.0, 82.0, 50.0, 36.0, 28.0, 22.0, 12.0, 8.0, 4.0, 5.0, 2.0, 2.0], "bins": [-37.65625, -36.53955078125, -35.4228515625, -34.30615234375, -33.189453125, -32.07275390625, -30.9560546875, -29.83935546875, -28.72265625, -27.60595703125, -26.4892578125, -25.37255859375, -24.255859375, -23.13916015625, -22.0224609375, -20.90576171875, -19.7890625, -18.67236328125, -17.5556640625, -16.43896484375, -15.322265625, -14.20556640625, -13.0888671875, -11.97216796875, -10.85546875, -9.73876953125, -8.6220703125, -7.50537109375, -6.388671875, -5.27197265625, -4.1552734375, -3.03857421875, -1.921875, -0.80517578125, 0.3115234375, 1.42822265625, 2.544921875, 3.66162109375, 4.7783203125, 5.89501953125, 7.01171875, 8.12841796875, 9.2451171875, 10.36181640625, 11.478515625, 12.59521484375, 13.7119140625, 14.82861328125, 15.9453125, 17.06201171875, 18.1787109375, 19.29541015625, 20.412109375, 21.52880859375, 22.6455078125, 23.76220703125, 24.87890625, 25.99560546875, 27.1123046875, 28.22900390625, 29.345703125, 30.46240234375, 31.5791015625, 32.69580078125, 33.8125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 9.0, 8.0, 10.0, 8.0, 19.0, 27.0, 28.0, 35.0, 59.0, 60.0, 83.0, 131.0, 111.0, 167.0, 157.0, 191.0, 223.0, 247.0, 252.0, 268.0, 262.0, 264.0, 220.0, 193.0, 180.0, 190.0, 117.0, 116.0, 103.0, 63.0, 58.0, 46.0, 42.0, 33.0, 15.0, 27.0, 19.0, 10.0, 11.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9375, -12.489013671875, -12.04052734375, -11.592041015625, -11.1435546875, -10.695068359375, -10.24658203125, -9.798095703125, -9.349609375, -8.901123046875, -8.45263671875, -8.004150390625, -7.5556640625, -7.107177734375, -6.65869140625, -6.210205078125, -5.76171875, -5.313232421875, -4.86474609375, -4.416259765625, -3.9677734375, -3.519287109375, -3.07080078125, -2.622314453125, -2.173828125, -1.725341796875, -1.27685546875, -0.828369140625, -0.3798828125, 0.068603515625, 0.51708984375, 0.965576171875, 1.4140625, 1.862548828125, 2.31103515625, 2.759521484375, 3.2080078125, 3.656494140625, 4.10498046875, 4.553466796875, 5.001953125, 5.450439453125, 5.89892578125, 6.347412109375, 6.7958984375, 7.244384765625, 7.69287109375, 8.141357421875, 8.58984375, 9.038330078125, 9.48681640625, 9.935302734375, 10.3837890625, 10.832275390625, 11.28076171875, 11.729248046875, 12.177734375, 12.626220703125, 13.07470703125, 13.523193359375, 13.9716796875, 14.420166015625, 14.86865234375, 15.317138671875, 15.765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 9.0, 4.0, 8.0, 9.0, 11.0, 20.0, 19.0, 17.0, 21.0, 32.0, 38.0, 33.0, 45.0, 52.0, 52.0, 53.0, 53.0, 46.0, 60.0, 63.0, 61.0, 44.0, 35.0, 37.0, 28.0, 28.0, 26.0, 18.0, 21.0, 9.0, 13.0, 7.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.28080177307129, -30.171932220458984, -29.063060760498047, -27.95418930053711, -26.845319747924805, -25.7364501953125, -24.627578735351562, -23.518707275390625, -22.40983772277832, -21.300968170166016, -20.192096710205078, -19.08322525024414, -17.974355697631836, -16.86548614501953, -15.756614685058594, -14.647744178771973, -13.538873672485352, -12.43000316619873, -11.32113265991211, -10.212262153625488, -9.103391647338867, -7.994521141052246, -6.885650634765625, -5.776780128479004, -4.667909622192383, -3.5590391159057617, -2.4501686096191406, -1.3412981033325195, -0.23242759704589844, 0.8764429092407227, 1.9853134155273438, 3.094183921813965, 4.203052520751953, 5.311923027038574, 6.420793533325195, 7.529664039611816, 8.638534545898438, 9.747405052185059, 10.85627555847168, 11.9651460647583, 13.074016571044922, 14.182887077331543, 15.291757583618164, 16.40062713623047, 17.509498596191406, 18.618370056152344, 19.72723960876465, 20.836109161376953, 21.94498062133789, 23.053852081298828, 24.162721633911133, 25.271591186523438, 26.380462646484375, 27.489334106445312, 28.598203659057617, 29.707073211669922, 30.81594467163086, 31.924816131591797, 33.03368377685547, 34.142555236816406, 35.251426696777344, 36.36029815673828, 37.46916961669922, 38.57803726196289, 39.68690872192383]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 6.0, 10.0, 11.0, 9.0, 15.0, 14.0, 17.0, 14.0, 20.0, 22.0, 29.0, 34.0, 41.0, 24.0, 30.0, 37.0, 40.0, 44.0, 40.0, 43.0, 42.0, 40.0, 32.0, 42.0, 34.0, 36.0, 23.0, 27.0, 27.0, 26.0, 19.0, 20.0, 20.0, 15.0, 19.0, 14.0, 12.0, 10.0, 7.0, 5.0, 7.0, 3.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-24.141315460205078, -23.274580001831055, -22.4078426361084, -21.541107177734375, -20.67436981201172, -19.807634353637695, -18.940898895263672, -18.074161529541016, -17.207426071166992, -16.34069061279297, -15.473953247070312, -14.607217788696289, -13.74048137664795, -12.87374496459961, -12.007009506225586, -11.140273094177246, -10.273536682128906, -9.406800270080566, -8.540063858032227, -7.673328399658203, -6.806591987609863, -5.939855575561523, -5.073119640350342, -4.20638370513916, -3.3396472930908203, -2.4729111194610596, -1.6061749458312988, -0.7394387722015381, 0.12729740142822266, 0.9940338134765625, 1.8607697486877441, 2.727505683898926, 3.5942440032958984, 4.460980415344238, 5.32771635055542, 6.194452285766602, 7.061188697814941, 7.927925109863281, 8.794660568237305, 9.661396980285645, 10.528133392333984, 11.394869804382324, 12.261606216430664, 13.128341674804688, 13.995078086853027, 14.861814498901367, 15.72854995727539, 16.595287322998047, 17.46202278137207, 18.328758239746094, 19.19549560546875, 20.062231063842773, 20.928966522216797, 21.795703887939453, 22.662439346313477, 23.5291748046875, 24.395912170410156, 25.26264762878418, 26.129384994506836, 26.99612045288086, 27.862857818603516, 28.72959327697754, 29.596328735351562, 30.46306610107422, 31.329801559448242]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 10.0, 6.0, 14.0, 17.0, 32.0, 61.0, 99.0, 143.0, 251.0, 397.0, 616.0, 1010.0, 1519.0, 2480.0, 4005.0, 6454.0, 10236.0, 16321.0, 26168.0, 40478.0, 62945.0, 93117.0, 127314.0, 149838.0, 146896.0, 118220.0, 84724.0, 56357.0, 36307.0, 23522.0, 14625.0, 9029.0, 5785.0, 3569.0, 2211.0, 1434.0, 875.0, 557.0, 314.0, 210.0, 134.0, 100.0, 54.0, 32.0, 23.0, 15.0, 14.0, 11.0, 4.0, 3.0, 2.0, 1.0, 2.0], "bins": [-13.265625, -12.88525390625, -12.5048828125, -12.12451171875, -11.744140625, -11.36376953125, -10.9833984375, -10.60302734375, -10.22265625, -9.84228515625, -9.4619140625, -9.08154296875, -8.701171875, -8.32080078125, -7.9404296875, -7.56005859375, -7.1796875, -6.79931640625, -6.4189453125, -6.03857421875, -5.658203125, -5.27783203125, -4.8974609375, -4.51708984375, -4.13671875, -3.75634765625, -3.3759765625, -2.99560546875, -2.615234375, -2.23486328125, -1.8544921875, -1.47412109375, -1.09375, -0.71337890625, -0.3330078125, 0.04736328125, 0.427734375, 0.80810546875, 1.1884765625, 1.56884765625, 1.94921875, 2.32958984375, 2.7099609375, 3.09033203125, 3.470703125, 3.85107421875, 4.2314453125, 4.61181640625, 4.9921875, 5.37255859375, 5.7529296875, 6.13330078125, 6.513671875, 6.89404296875, 7.2744140625, 7.65478515625, 8.03515625, 8.41552734375, 8.7958984375, 9.17626953125, 9.556640625, 9.93701171875, 10.3173828125, 10.69775390625, 11.078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 8.0, 6.0, 8.0, 14.0, 15.0, 20.0, 14.0, 17.0, 23.0, 16.0, 19.0, 32.0, 33.0, 38.0, 29.0, 31.0, 36.0, 50.0, 44.0, 53.0, 42.0, 46.0, 42.0, 37.0, 32.0, 26.0, 22.0, 34.0, 25.0, 32.0, 31.0, 11.0, 20.0, 19.0, 14.0, 6.0, 14.0, 10.0, 5.0, 4.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.03125, -28.0986328125, -27.166015625, -26.2333984375, -25.30078125, -24.3681640625, -23.435546875, -22.5029296875, -21.5703125, -20.6376953125, -19.705078125, -18.7724609375, -17.83984375, -16.9072265625, -15.974609375, -15.0419921875, -14.109375, -13.1767578125, -12.244140625, -11.3115234375, -10.37890625, -9.4462890625, -8.513671875, -7.5810546875, -6.6484375, -5.7158203125, -4.783203125, -3.8505859375, -2.91796875, -1.9853515625, -1.052734375, -0.1201171875, 0.8125, 1.7451171875, 2.677734375, 3.6103515625, 4.54296875, 5.4755859375, 6.408203125, 7.3408203125, 8.2734375, 9.2060546875, 10.138671875, 11.0712890625, 12.00390625, 12.9365234375, 13.869140625, 14.8017578125, 15.734375, 16.6669921875, 17.599609375, 18.5322265625, 19.46484375, 20.3974609375, 21.330078125, 22.2626953125, 23.1953125, 24.1279296875, 25.060546875, 25.9931640625, 26.92578125, 27.8583984375, 28.791015625, 29.7236328125, 30.65625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 2.0, 5.0, 16.0, 29.0, 27.0, 59.0, 85.0, 121.0, 193.0, 338.0, 506.0, 821.0, 1347.0, 2411.0, 4081.0, 7361.0, 13245.0, 23959.0, 43790.0, 79309.0, 137206.0, 199946.0, 202919.0, 142915.0, 84028.0, 46146.0, 25478.0, 14027.0, 7680.0, 4234.0, 2529.0, 1480.0, 869.0, 535.0, 315.0, 182.0, 125.0, 77.0, 53.0, 29.0, 26.0, 13.0, 18.0, 10.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.921875, -19.319091796875, -18.71630859375, -18.113525390625, -17.5107421875, -16.907958984375, -16.30517578125, -15.702392578125, -15.099609375, -14.496826171875, -13.89404296875, -13.291259765625, -12.6884765625, -12.085693359375, -11.48291015625, -10.880126953125, -10.27734375, -9.674560546875, -9.07177734375, -8.468994140625, -7.8662109375, -7.263427734375, -6.66064453125, -6.057861328125, -5.455078125, -4.852294921875, -4.24951171875, -3.646728515625, -3.0439453125, -2.441162109375, -1.83837890625, -1.235595703125, -0.6328125, -0.030029296875, 0.57275390625, 1.175537109375, 1.7783203125, 2.381103515625, 2.98388671875, 3.586669921875, 4.189453125, 4.792236328125, 5.39501953125, 5.997802734375, 6.6005859375, 7.203369140625, 7.80615234375, 8.408935546875, 9.01171875, 9.614501953125, 10.21728515625, 10.820068359375, 11.4228515625, 12.025634765625, 12.62841796875, 13.231201171875, 13.833984375, 14.436767578125, 15.03955078125, 15.642333984375, 16.2451171875, 16.847900390625, 17.45068359375, 18.053466796875, 18.65625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 8.0, 8.0, 8.0, 8.0, 11.0, 14.0, 17.0, 24.0, 28.0, 28.0, 36.0, 27.0, 43.0, 37.0, 29.0, 48.0, 48.0, 52.0, 52.0, 42.0, 42.0, 45.0, 38.0, 33.0, 28.0, 31.0, 31.0, 34.0, 22.0, 21.0, 20.0, 8.0, 20.0, 13.0, 6.0, 5.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.671875, -20.039306640625, -19.40673828125, -18.774169921875, -18.1416015625, -17.509033203125, -16.87646484375, -16.243896484375, -15.611328125, -14.978759765625, -14.34619140625, -13.713623046875, -13.0810546875, -12.448486328125, -11.81591796875, -11.183349609375, -10.55078125, -9.918212890625, -9.28564453125, -8.653076171875, -8.0205078125, -7.387939453125, -6.75537109375, -6.122802734375, -5.490234375, -4.857666015625, -4.22509765625, -3.592529296875, -2.9599609375, -2.327392578125, -1.69482421875, -1.062255859375, -0.4296875, 0.202880859375, 0.83544921875, 1.468017578125, 2.1005859375, 2.733154296875, 3.36572265625, 3.998291015625, 4.630859375, 5.263427734375, 5.89599609375, 6.528564453125, 7.1611328125, 7.793701171875, 8.42626953125, 9.058837890625, 9.69140625, 10.323974609375, 10.95654296875, 11.589111328125, 12.2216796875, 12.854248046875, 13.48681640625, 14.119384765625, 14.751953125, 15.384521484375, 16.01708984375, 16.649658203125, 17.2822265625, 17.914794921875, 18.54736328125, 19.179931640625, 19.8125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 3.0, 7.0, 8.0, 12.0, 12.0, 19.0, 30.0, 32.0, 53.0, 88.0, 136.0, 196.0, 301.0, 485.0, 763.0, 1116.0, 1781.0, 3004.0, 5258.0, 9735.0, 18323.0, 36722.0, 74546.0, 146512.0, 237381.0, 230927.0, 138135.0, 69470.0, 34235.0, 17292.0, 9153.0, 4993.0, 2883.0, 1824.0, 1089.0, 706.0, 460.0, 287.0, 199.0, 118.0, 77.0, 58.0, 46.0, 31.0, 21.0, 11.0, 6.0, 8.0, 3.0, 4.0, 6.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.8795166015625, -5.669189453125, -5.4588623046875, -5.24853515625, -5.0382080078125, -4.827880859375, -4.6175537109375, -4.4072265625, -4.1968994140625, -3.986572265625, -3.7762451171875, -3.56591796875, -3.3555908203125, -3.145263671875, -2.9349365234375, -2.724609375, -2.5142822265625, -2.303955078125, -2.0936279296875, -1.88330078125, -1.6729736328125, -1.462646484375, -1.2523193359375, -1.0419921875, -0.8316650390625, -0.621337890625, -0.4110107421875, -0.20068359375, 0.0096435546875, 0.219970703125, 0.4302978515625, 0.640625, 0.8509521484375, 1.061279296875, 1.2716064453125, 1.48193359375, 1.6922607421875, 1.902587890625, 2.1129150390625, 2.3232421875, 2.5335693359375, 2.743896484375, 2.9542236328125, 3.16455078125, 3.3748779296875, 3.585205078125, 3.7955322265625, 4.005859375, 4.2161865234375, 4.426513671875, 4.6368408203125, 4.84716796875, 5.0574951171875, 5.267822265625, 5.4781494140625, 5.6884765625, 5.8988037109375, 6.109130859375, 6.3194580078125, 6.52978515625, 6.7401123046875, 6.950439453125, 7.1607666015625, 7.37109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 2.0, 3.0, 5.0, 3.0, 7.0, 10.0, 12.0, 13.0, 22.0, 25.0, 30.0, 49.0, 42.0, 52.0, 56.0, 68.0, 76.0, 70.0, 71.0, 57.0, 57.0, 73.0, 42.0, 34.0, 34.0, 25.0, 20.0, 14.0, 8.0, 10.0, 10.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003542900085449219, -0.0003371909260749817, -0.0003200918436050415, -0.0003029927611351013, -0.00028589367866516113, -0.00026879459619522095, -0.00025169551372528076, -0.00023459643125534058, -0.0002174973487854004, -0.0002003982663154602, -0.00018329918384552002, -0.00016620010137557983, -0.00014910101890563965, -0.00013200193643569946, -0.00011490285396575928, -9.780377149581909e-05, -8.07046890258789e-05, -6.360560655593872e-05, -4.6506524085998535e-05, -2.940744161605835e-05, -1.2308359146118164e-05, 4.7907233238220215e-06, 2.1889805793762207e-05, 3.898888826370239e-05, 5.608797073364258e-05, 7.318705320358276e-05, 9.028613567352295e-05, 0.00010738521814346313, 0.00012448430061340332, 0.0001415833830833435, 0.0001586824655532837, 0.00017578154802322388, 0.00019288063049316406, 0.00020997971296310425, 0.00022707879543304443, 0.0002441778779029846, 0.0002612769603729248, 0.000278376042842865, 0.0002954751253128052, 0.00031257420778274536, 0.00032967329025268555, 0.00034677237272262573, 0.0003638714551925659, 0.0003809705376625061, 0.0003980696201324463, 0.0004151687026023865, 0.00043226778507232666, 0.00044936686754226685, 0.00046646595001220703, 0.0004835650324821472, 0.0005006641149520874, 0.0005177631974220276, 0.0005348622798919678, 0.000551961362361908, 0.0005690604448318481, 0.0005861595273017883, 0.0006032586097717285, 0.0006203576922416687, 0.0006374567747116089, 0.0006545558571815491, 0.0006716549396514893, 0.0006887540221214294, 0.0007058531045913696, 0.0007229521870613098, 0.00074005126953125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 7.0, 5.0, 7.0, 13.0, 12.0, 23.0, 54.0, 72.0, 90.0, 151.0, 234.0, 349.0, 581.0, 966.0, 1426.0, 2559.0, 4383.0, 7695.0, 13723.0, 25453.0, 48065.0, 91723.0, 159932.0, 219959.0, 198534.0, 125128.0, 67763.0, 35777.0, 19133.0, 10463.0, 5755.0, 3326.0, 1954.0, 1220.0, 763.0, 442.0, 300.0, 159.0, 132.0, 75.0, 44.0, 34.0, 25.0, 17.0, 13.0, 11.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.1953125, -6.96142578125, -6.7275390625, -6.49365234375, -6.259765625, -6.02587890625, -5.7919921875, -5.55810546875, -5.32421875, -5.09033203125, -4.8564453125, -4.62255859375, -4.388671875, -4.15478515625, -3.9208984375, -3.68701171875, -3.453125, -3.21923828125, -2.9853515625, -2.75146484375, -2.517578125, -2.28369140625, -2.0498046875, -1.81591796875, -1.58203125, -1.34814453125, -1.1142578125, -0.88037109375, -0.646484375, -0.41259765625, -0.1787109375, 0.05517578125, 0.2890625, 0.52294921875, 0.7568359375, 0.99072265625, 1.224609375, 1.45849609375, 1.6923828125, 1.92626953125, 2.16015625, 2.39404296875, 2.6279296875, 2.86181640625, 3.095703125, 3.32958984375, 3.5634765625, 3.79736328125, 4.03125, 4.26513671875, 4.4990234375, 4.73291015625, 4.966796875, 5.20068359375, 5.4345703125, 5.66845703125, 5.90234375, 6.13623046875, 6.3701171875, 6.60400390625, 6.837890625, 7.07177734375, 7.3056640625, 7.53955078125, 7.7734375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 7.0, 8.0, 16.0, 18.0, 21.0, 27.0, 20.0, 32.0, 27.0, 45.0, 51.0, 61.0, 57.0, 52.0, 64.0, 71.0, 65.0, 61.0, 51.0, 42.0, 34.0, 28.0, 25.0, 23.0, 27.0, 4.0, 7.0, 8.0, 4.0, 9.0, 4.0, 1.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.01171875, -1.938934326171875, -1.86614990234375, -1.793365478515625, -1.7205810546875, -1.647796630859375, -1.57501220703125, -1.502227783203125, -1.429443359375, -1.356658935546875, -1.28387451171875, -1.211090087890625, -1.1383056640625, -1.065521240234375, -0.99273681640625, -0.919952392578125, -0.84716796875, -0.774383544921875, -0.70159912109375, -0.628814697265625, -0.5560302734375, -0.483245849609375, -0.41046142578125, -0.337677001953125, -0.264892578125, -0.192108154296875, -0.11932373046875, -0.046539306640625, 0.0262451171875, 0.099029541015625, 0.17181396484375, 0.244598388671875, 0.3173828125, 0.390167236328125, 0.46295166015625, 0.535736083984375, 0.6085205078125, 0.681304931640625, 0.75408935546875, 0.826873779296875, 0.899658203125, 0.972442626953125, 1.04522705078125, 1.118011474609375, 1.1907958984375, 1.263580322265625, 1.33636474609375, 1.409149169921875, 1.48193359375, 1.554718017578125, 1.62750244140625, 1.700286865234375, 1.7730712890625, 1.845855712890625, 1.91864013671875, 1.991424560546875, 2.064208984375, 2.136993408203125, 2.20977783203125, 2.282562255859375, 2.3553466796875, 2.428131103515625, 2.50091552734375, 2.573699951171875, 2.646484375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 3.0, 9.0, 9.0, 7.0, 9.0, 16.0, 18.0, 21.0, 25.0, 28.0, 34.0, 32.0, 43.0, 50.0, 50.0, 53.0, 42.0, 51.0, 51.0, 61.0, 56.0, 45.0, 54.0, 39.0, 22.0, 30.0, 23.0, 18.0, 27.0, 14.0, 15.0, 9.0, 4.0, 3.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.657066345214844, -29.584033966064453, -28.51099967956543, -27.43796730041504, -26.364933013916016, -25.291900634765625, -24.218868255615234, -23.145835876464844, -22.07280158996582, -20.99976921081543, -19.926734924316406, -18.853702545166016, -17.780670166015625, -16.7076358795166, -15.634603500366211, -14.561570167541504, -13.488536834716797, -12.41550350189209, -11.342470169067383, -10.269437789916992, -9.196404457092285, -8.123371124267578, -7.050338268280029, -5.9773054122924805, -4.904272079467773, -3.8312389850616455, -2.7582058906555176, -1.6851727962493896, -0.6121397018432617, 0.4608936309814453, 1.5339264869689941, 2.606959342956543, 3.67999267578125, 4.753026008605957, 5.826058864593506, 6.899091720581055, 7.972125053405762, 9.045158386230469, 10.11819076538086, 11.191224098205566, 12.264257431030273, 13.33729076385498, 14.410324096679688, 15.483356475830078, 16.55638885498047, 17.629423141479492, 18.702455520629883, 19.775489807128906, 20.848522186279297, 21.921554565429688, 22.99458885192871, 24.0676212310791, 25.140655517578125, 26.213687896728516, 27.286720275878906, 28.359752655029297, 29.43278694152832, 30.50581932067871, 31.578853607177734, 32.651885986328125, 33.724918365478516, 34.797950744628906, 35.87098693847656, 36.94401931762695, 38.017051696777344]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 2.0, 4.0, 8.0, 15.0, 7.0, 16.0, 19.0, 11.0, 15.0, 22.0, 26.0, 23.0, 41.0, 33.0, 28.0, 22.0, 47.0, 42.0, 42.0, 39.0, 46.0, 32.0, 46.0, 34.0, 37.0, 36.0, 35.0, 18.0, 32.0, 28.0, 26.0, 18.0, 15.0, 27.0, 18.0, 16.0, 14.0, 14.0, 5.0, 7.0, 7.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-24.079010009765625, -23.21695899963379, -22.354907989501953, -21.492855072021484, -20.63080406188965, -19.768753051757812, -18.906700134277344, -18.044649124145508, -17.182598114013672, -16.320547103881836, -15.458495140075684, -14.596443176269531, -13.734392166137695, -12.87234115600586, -12.010289192199707, -11.148237228393555, -10.286186218261719, -9.424135208129883, -8.56208324432373, -7.700031757354736, -6.837980270385742, -5.975928783416748, -5.113877296447754, -4.25182580947876, -3.3897743225097656, -2.5277228355407715, -1.6656713485717773, -0.8036198616027832, 0.05843162536621094, 0.9204831123352051, 1.7825345993041992, 2.6445860862731934, 3.5066356658935547, 4.368687152862549, 5.230738639831543, 6.092790126800537, 6.954841613769531, 7.816893100738525, 8.67894458770752, 9.540996551513672, 10.403047561645508, 11.265098571777344, 12.127150535583496, 12.989202499389648, 13.851253509521484, 14.71330451965332, 15.575356483459473, 16.437408447265625, 17.29945945739746, 18.161510467529297, 19.023563385009766, 19.8856143951416, 20.747665405273438, 21.609716415405273, 22.47176742553711, 23.333820343017578, 24.195871353149414, 25.05792236328125, 25.91997528076172, 26.782026290893555, 27.64407730102539, 28.506128311157227, 29.368179321289062, 30.23023223876953, 31.092283248901367]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 10.0, 13.0, 15.0, 24.0, 45.0, 72.0, 113.0, 169.0, 276.0, 423.0, 762.0, 1170.0, 1865.0, 3025.0, 4969.0, 7816.0, 12895.0, 20396.0, 32089.0, 48856.0, 70667.0, 96276.0, 119186.0, 131807.0, 127548.0, 109689.0, 85341.0, 60900.0, 41384.0, 26314.0, 16795.0, 10452.0, 6560.0, 4015.0, 2520.0, 1552.0, 966.0, 590.0, 398.0, 205.0, 129.0, 90.0, 62.0, 34.0, 20.0, 17.0, 13.0, 9.0, 4.0, 3.0, 3.0, 0.0, 5.0, 1.0], "bins": [-26.59375, -25.806640625, -25.01953125, -24.232421875, -23.4453125, -22.658203125, -21.87109375, -21.083984375, -20.296875, -19.509765625, -18.72265625, -17.935546875, -17.1484375, -16.361328125, -15.57421875, -14.787109375, -14.0, -13.212890625, -12.42578125, -11.638671875, -10.8515625, -10.064453125, -9.27734375, -8.490234375, -7.703125, -6.916015625, -6.12890625, -5.341796875, -4.5546875, -3.767578125, -2.98046875, -2.193359375, -1.40625, -0.619140625, 0.16796875, 0.955078125, 1.7421875, 2.529296875, 3.31640625, 4.103515625, 4.890625, 5.677734375, 6.46484375, 7.251953125, 8.0390625, 8.826171875, 9.61328125, 10.400390625, 11.1875, 11.974609375, 12.76171875, 13.548828125, 14.3359375, 15.123046875, 15.91015625, 16.697265625, 17.484375, 18.271484375, 19.05859375, 19.845703125, 20.6328125, 21.419921875, 22.20703125, 22.994140625, 23.78125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 10.0, 6.0, 7.0, 8.0, 10.0, 11.0, 22.0, 20.0, 20.0, 16.0, 27.0, 29.0, 34.0, 32.0, 34.0, 36.0, 35.0, 50.0, 55.0, 46.0, 45.0, 34.0, 38.0, 39.0, 31.0, 40.0, 36.0, 30.0, 31.0, 25.0, 17.0, 17.0, 14.0, 12.0, 25.0, 8.0, 12.0, 9.0, 9.0, 3.0, 2.0, 9.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.921875, -26.969970703125, -26.01806640625, -25.066162109375, -24.1142578125, -23.162353515625, -22.21044921875, -21.258544921875, -20.306640625, -19.354736328125, -18.40283203125, -17.450927734375, -16.4990234375, -15.547119140625, -14.59521484375, -13.643310546875, -12.69140625, -11.739501953125, -10.78759765625, -9.835693359375, -8.8837890625, -7.931884765625, -6.97998046875, -6.028076171875, -5.076171875, -4.124267578125, -3.17236328125, -2.220458984375, -1.2685546875, -0.316650390625, 0.63525390625, 1.587158203125, 2.5390625, 3.490966796875, 4.44287109375, 5.394775390625, 6.3466796875, 7.298583984375, 8.25048828125, 9.202392578125, 10.154296875, 11.106201171875, 12.05810546875, 13.010009765625, 13.9619140625, 14.913818359375, 15.86572265625, 16.817626953125, 17.76953125, 18.721435546875, 19.67333984375, 20.625244140625, 21.5771484375, 22.529052734375, 23.48095703125, 24.432861328125, 25.384765625, 26.336669921875, 27.28857421875, 28.240478515625, 29.1923828125, 30.144287109375, 31.09619140625, 32.048095703125, 33.0]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 8.0, 8.0, 18.0, 35.0, 30.0, 63.0, 116.0, 139.0, 234.0, 362.0, 601.0, 816.0, 1368.0, 2044.0, 3183.0, 4690.0, 7318.0, 10934.0, 16577.0, 24619.0, 35975.0, 50840.0, 68961.0, 89580.0, 107172.0, 116673.0, 115262.0, 102211.0, 82839.0, 62634.0, 46066.0, 32059.0, 21728.0, 14693.0, 9750.0, 6495.0, 4323.0, 2854.0, 1880.0, 1187.0, 839.0, 515.0, 311.0, 209.0, 128.0, 73.0, 55.0, 37.0, 18.0, 11.0, 9.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-24.453125, -23.708740234375, -22.96435546875, -22.219970703125, -21.4755859375, -20.731201171875, -19.98681640625, -19.242431640625, -18.498046875, -17.753662109375, -17.00927734375, -16.264892578125, -15.5205078125, -14.776123046875, -14.03173828125, -13.287353515625, -12.54296875, -11.798583984375, -11.05419921875, -10.309814453125, -9.5654296875, -8.821044921875, -8.07666015625, -7.332275390625, -6.587890625, -5.843505859375, -5.09912109375, -4.354736328125, -3.6103515625, -2.865966796875, -2.12158203125, -1.377197265625, -0.6328125, 0.111572265625, 0.85595703125, 1.600341796875, 2.3447265625, 3.089111328125, 3.83349609375, 4.577880859375, 5.322265625, 6.066650390625, 6.81103515625, 7.555419921875, 8.2998046875, 9.044189453125, 9.78857421875, 10.532958984375, 11.27734375, 12.021728515625, 12.76611328125, 13.510498046875, 14.2548828125, 14.999267578125, 15.74365234375, 16.488037109375, 17.232421875, 17.976806640625, 18.72119140625, 19.465576171875, 20.2099609375, 20.954345703125, 21.69873046875, 22.443115234375, 23.1875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 10.0, 5.0, 5.0, 17.0, 11.0, 18.0, 19.0, 19.0, 22.0, 29.0, 26.0, 22.0, 32.0, 34.0, 43.0, 35.0, 51.0, 35.0, 35.0, 40.0, 47.0, 40.0, 33.0, 49.0, 31.0, 19.0, 34.0, 38.0, 24.0, 30.0, 22.0, 14.0, 21.0, 7.0, 18.0, 9.0, 10.0, 11.0, 6.0, 5.0, 2.0, 8.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.9375, -18.323974609375, -17.71044921875, -17.096923828125, -16.4833984375, -15.869873046875, -15.25634765625, -14.642822265625, -14.029296875, -13.415771484375, -12.80224609375, -12.188720703125, -11.5751953125, -10.961669921875, -10.34814453125, -9.734619140625, -9.12109375, -8.507568359375, -7.89404296875, -7.280517578125, -6.6669921875, -6.053466796875, -5.43994140625, -4.826416015625, -4.212890625, -3.599365234375, -2.98583984375, -2.372314453125, -1.7587890625, -1.145263671875, -0.53173828125, 0.081787109375, 0.6953125, 1.308837890625, 1.92236328125, 2.535888671875, 3.1494140625, 3.762939453125, 4.37646484375, 4.989990234375, 5.603515625, 6.217041015625, 6.83056640625, 7.444091796875, 8.0576171875, 8.671142578125, 9.28466796875, 9.898193359375, 10.51171875, 11.125244140625, 11.73876953125, 12.352294921875, 12.9658203125, 13.579345703125, 14.19287109375, 14.806396484375, 15.419921875, 16.033447265625, 16.64697265625, 17.260498046875, 17.8740234375, 18.487548828125, 19.10107421875, 19.714599609375, 20.328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 25.0, 22.0, 45.0, 42.0, 83.0, 139.0, 229.0, 339.0, 555.0, 916.0, 1414.0, 2304.0, 3792.0, 6081.0, 10002.0, 16363.0, 26099.0, 41179.0, 63170.0, 92091.0, 123227.0, 144334.0, 143115.0, 119675.0, 88760.0, 60372.0, 39006.0, 24737.0, 15421.0, 9517.0, 5947.0, 3634.0, 2295.0, 1338.0, 857.0, 528.0, 323.0, 207.0, 125.0, 82.0, 52.0, 37.0, 19.0, 14.0, 12.0, 9.0, 8.0, 1.0, 4.0, 1.0, 1.0, 3.0], "bins": [-10.7734375, -10.4560546875, -10.138671875, -9.8212890625, -9.50390625, -9.1865234375, -8.869140625, -8.5517578125, -8.234375, -7.9169921875, -7.599609375, -7.2822265625, -6.96484375, -6.6474609375, -6.330078125, -6.0126953125, -5.6953125, -5.3779296875, -5.060546875, -4.7431640625, -4.42578125, -4.1083984375, -3.791015625, -3.4736328125, -3.15625, -2.8388671875, -2.521484375, -2.2041015625, -1.88671875, -1.5693359375, -1.251953125, -0.9345703125, -0.6171875, -0.2998046875, 0.017578125, 0.3349609375, 0.65234375, 0.9697265625, 1.287109375, 1.6044921875, 1.921875, 2.2392578125, 2.556640625, 2.8740234375, 3.19140625, 3.5087890625, 3.826171875, 4.1435546875, 4.4609375, 4.7783203125, 5.095703125, 5.4130859375, 5.73046875, 6.0478515625, 6.365234375, 6.6826171875, 7.0, 7.3173828125, 7.634765625, 7.9521484375, 8.26953125, 8.5869140625, 8.904296875, 9.2216796875, 9.5390625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 7.0, 9.0, 7.0, 5.0, 7.0, 15.0, 21.0, 21.0, 17.0, 27.0, 27.0, 37.0, 35.0, 36.0, 42.0, 37.0, 51.0, 47.0, 46.0, 64.0, 63.0, 43.0, 43.0, 61.0, 34.0, 29.0, 26.0, 20.0, 22.0, 24.0, 16.0, 12.0, 8.0, 7.0, 9.0, 5.0, 3.0, 9.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0010843276977539062, -0.0010512620210647583, -0.0010181963443756104, -0.0009851306676864624, -0.0009520649909973145, -0.0009189993143081665, -0.0008859336376190186, -0.0008528679609298706, -0.0008198022842407227, -0.0007867366075515747, -0.0007536709308624268, -0.0007206052541732788, -0.0006875395774841309, -0.0006544739007949829, -0.000621408224105835, -0.000588342547416687, -0.0005552768707275391, -0.0005222111940383911, -0.0004891455173492432, -0.0004560798406600952, -0.00042301416397094727, -0.0003899484872817993, -0.00035688281059265137, -0.0003238171339035034, -0.00029075145721435547, -0.0002576857805252075, -0.00022462010383605957, -0.00019155442714691162, -0.00015848875045776367, -0.00012542307376861572, -9.235739707946777e-05, -5.9291720390319824e-05, -2.6226043701171875e-05, 6.839632987976074e-06, 3.9905309677124023e-05, 7.297098636627197e-05, 0.00010603666305541992, 0.00013910233974456787, 0.00017216801643371582, 0.00020523369312286377, 0.00023829936981201172, 0.00027136504650115967, 0.0003044307231903076, 0.00033749639987945557, 0.0003705620765686035, 0.00040362775325775146, 0.0004366934299468994, 0.00046975910663604736, 0.0005028247833251953, 0.0005358904600143433, 0.0005689561367034912, 0.0006020218133926392, 0.0006350874900817871, 0.0006681531667709351, 0.000701218843460083, 0.000734284520149231, 0.0007673501968383789, 0.0008004158735275269, 0.0008334815502166748, 0.0008665472269058228, 0.0008996129035949707, 0.0009326785802841187, 0.0009657442569732666, 0.0009988099336624146, 0.0010318756103515625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 3.0, 8.0, 13.0, 25.0, 34.0, 50.0, 58.0, 124.0, 156.0, 307.0, 449.0, 740.0, 1185.0, 1897.0, 3183.0, 5313.0, 9142.0, 15879.0, 26876.0, 46308.0, 78085.0, 119635.0, 161447.0, 174194.0, 147110.0, 102110.0, 64039.0, 37500.0, 21846.0, 12484.0, 7372.0, 4285.0, 2636.0, 1522.0, 1000.0, 561.0, 362.0, 237.0, 138.0, 103.0, 50.0, 38.0, 18.0, 14.0, 7.0, 4.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.65625, -11.2584228515625, -10.860595703125, -10.4627685546875, -10.06494140625, -9.6671142578125, -9.269287109375, -8.8714599609375, -8.4736328125, -8.0758056640625, -7.677978515625, -7.2801513671875, -6.88232421875, -6.4844970703125, -6.086669921875, -5.6888427734375, -5.291015625, -4.8931884765625, -4.495361328125, -4.0975341796875, -3.69970703125, -3.3018798828125, -2.904052734375, -2.5062255859375, -2.1083984375, -1.7105712890625, -1.312744140625, -0.9149169921875, -0.51708984375, -0.1192626953125, 0.278564453125, 0.6763916015625, 1.07421875, 1.4720458984375, 1.869873046875, 2.2677001953125, 2.66552734375, 3.0633544921875, 3.461181640625, 3.8590087890625, 4.2568359375, 4.6546630859375, 5.052490234375, 5.4503173828125, 5.84814453125, 6.2459716796875, 6.643798828125, 7.0416259765625, 7.439453125, 7.8372802734375, 8.235107421875, 8.6329345703125, 9.03076171875, 9.4285888671875, 9.826416015625, 10.2242431640625, 10.6220703125, 11.0198974609375, 11.417724609375, 11.8155517578125, 12.21337890625, 12.6112060546875, 13.009033203125, 13.4068603515625, 13.8046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 5.0, 8.0, 11.0, 9.0, 10.0, 13.0, 14.0, 22.0, 24.0, 27.0, 40.0, 33.0, 39.0, 34.0, 54.0, 44.0, 58.0, 56.0, 59.0, 46.0, 40.0, 45.0, 53.0, 36.0, 31.0, 28.0, 22.0, 24.0, 24.0, 15.0, 18.0, 16.0, 10.0, 5.0, 6.0, 8.0, 5.0, 1.0, 1.0, 3.0, 5.0, 3.0, 1.0, 1.0], "bins": [-5.0234375, -4.891815185546875, -4.76019287109375, -4.628570556640625, -4.4969482421875, -4.365325927734375, -4.23370361328125, -4.102081298828125, -3.970458984375, -3.838836669921875, -3.70721435546875, -3.575592041015625, -3.4439697265625, -3.312347412109375, -3.18072509765625, -3.049102783203125, -2.91748046875, -2.785858154296875, -2.65423583984375, -2.522613525390625, -2.3909912109375, -2.259368896484375, -2.12774658203125, -1.996124267578125, -1.864501953125, -1.732879638671875, -1.60125732421875, -1.469635009765625, -1.3380126953125, -1.206390380859375, -1.07476806640625, -0.943145751953125, -0.8115234375, -0.679901123046875, -0.54827880859375, -0.416656494140625, -0.2850341796875, -0.153411865234375, -0.02178955078125, 0.109832763671875, 0.241455078125, 0.373077392578125, 0.50469970703125, 0.636322021484375, 0.7679443359375, 0.899566650390625, 1.03118896484375, 1.162811279296875, 1.29443359375, 1.426055908203125, 1.55767822265625, 1.689300537109375, 1.8209228515625, 1.952545166015625, 2.08416748046875, 2.215789794921875, 2.347412109375, 2.479034423828125, 2.61065673828125, 2.742279052734375, 2.8739013671875, 3.005523681640625, 3.13714599609375, 3.268768310546875, 3.400390625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 2.0, 3.0, 4.0, 7.0, 10.0, 4.0, 6.0, 13.0, 19.0, 23.0, 23.0, 26.0, 29.0, 37.0, 45.0, 49.0, 37.0, 50.0, 52.0, 48.0, 54.0, 49.0, 55.0, 45.0, 37.0, 45.0, 31.0, 33.0, 22.0, 29.0, 21.0, 25.0, 8.0, 17.0, 6.0, 8.0, 0.0, 7.0, 4.0, 6.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.262115478515625, -30.227493286132812, -29.192869186401367, -28.158246994018555, -27.12362289428711, -26.089000701904297, -25.054378509521484, -24.01975440979004, -22.985130310058594, -21.95050811767578, -20.915884017944336, -19.881261825561523, -18.846637725830078, -17.812015533447266, -16.777393341064453, -15.742769241333008, -14.708147048950195, -13.673523902893066, -12.638900756835938, -11.604278564453125, -10.56965446472168, -9.535032272338867, -8.500409126281738, -7.465785980224609, -6.4311628341674805, -5.396539688110352, -4.361916542053223, -3.327293872833252, -2.292670726776123, -1.2580475807189941, -0.22342491149902344, 0.8111982345581055, 1.8458213806152344, 2.8804445266723633, 3.915067434310913, 4.949690341949463, 5.984313488006592, 7.018936634063721, 8.053559303283691, 9.08818244934082, 10.12280559539795, 11.157428741455078, 12.192051887512207, 13.226675033569336, 14.261297225952148, 15.295921325683594, 16.330543518066406, 17.36516571044922, 18.399789810180664, 19.434412002563477, 20.469036102294922, 21.503658294677734, 22.53828239440918, 23.572904586791992, 24.607528686523438, 25.64215087890625, 26.676773071289062, 27.711395263671875, 28.74601936340332, 29.780641555786133, 30.815265655517578, 31.84988784790039, 32.8845100402832, 33.91913604736328, 34.953758239746094]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 12.0, 14.0, 8.0, 8.0, 21.0, 25.0, 18.0, 20.0, 34.0, 26.0, 29.0, 29.0, 44.0, 46.0, 34.0, 42.0, 34.0, 43.0, 37.0, 42.0, 44.0, 51.0, 35.0, 35.0, 29.0, 25.0, 27.0, 31.0, 16.0, 23.0, 21.0, 21.0, 9.0, 17.0, 7.0, 10.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.238452911376953, -26.227962493896484, -25.217472076416016, -24.206981658935547, -23.196491241455078, -22.18600082397461, -21.175508499145508, -20.16501808166504, -19.15452766418457, -18.1440372467041, -17.133546829223633, -16.123056411743164, -15.112565040588379, -14.10207462310791, -13.091583251953125, -12.081092834472656, -11.070602416992188, -10.060111999511719, -9.04962158203125, -8.039130210876465, -7.028639793395996, -6.018149375915527, -5.0076584815979, -3.9971675872802734, -2.9866771697998047, -1.9761865139007568, -0.965695858001709, 0.04479479789733887, 1.0552854537963867, 2.0657758712768555, 3.0762667655944824, 4.086757659912109, 5.097251892089844, 6.1077423095703125, 7.1182332038879395, 8.128724098205566, 9.139214515686035, 10.149704933166504, 11.160196304321289, 12.170686721801758, 13.181177139282227, 14.191667556762695, 15.202157974243164, 16.212648391723633, 17.223140716552734, 18.233631134033203, 19.244121551513672, 20.25461196899414, 21.26510238647461, 22.275592803955078, 23.286083221435547, 24.296573638916016, 25.307064056396484, 26.317554473876953, 27.328046798706055, 28.338537216186523, 29.349027633666992, 30.35951805114746, 31.37000846862793, 32.38050079345703, 33.3909912109375, 34.40148162841797, 35.41197204589844, 36.422462463378906, 37.432952880859375]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 23.0, 26.0, 36.0, 43.0, 82.0, 107.0, 149.0, 215.0, 338.0, 476.0, 773.0, 1091.0, 1595.0, 2556.0, 3781.0, 5682.0, 8661.0, 13766.0, 21694.0, 34854.0, 56978.0, 95607.0, 164450.0, 284842.0, 470361.0, 676256.0, 750231.0, 610170.0, 397805.0, 236959.0, 138951.0, 82312.0, 49204.0, 30625.0, 19037.0, 12027.0, 7706.0, 5052.0, 3289.0, 2138.0, 1408.0, 964.0, 657.0, 424.0, 305.0, 180.0, 139.0, 90.0, 49.0, 37.0, 27.0, 15.0, 17.0, 5.0, 11.0, 5.0, 2.0], "bins": [-35.65625, -34.58642578125, -33.5166015625, -32.44677734375, -31.376953125, -30.30712890625, -29.2373046875, -28.16748046875, -27.09765625, -26.02783203125, -24.9580078125, -23.88818359375, -22.818359375, -21.74853515625, -20.6787109375, -19.60888671875, -18.5390625, -17.46923828125, -16.3994140625, -15.32958984375, -14.259765625, -13.18994140625, -12.1201171875, -11.05029296875, -9.98046875, -8.91064453125, -7.8408203125, -6.77099609375, -5.701171875, -4.63134765625, -3.5615234375, -2.49169921875, -1.421875, -0.35205078125, 0.7177734375, 1.78759765625, 2.857421875, 3.92724609375, 4.9970703125, 6.06689453125, 7.13671875, 8.20654296875, 9.2763671875, 10.34619140625, 11.416015625, 12.48583984375, 13.5556640625, 14.62548828125, 15.6953125, 16.76513671875, 17.8349609375, 18.90478515625, 19.974609375, 21.04443359375, 22.1142578125, 23.18408203125, 24.25390625, 25.32373046875, 26.3935546875, 27.46337890625, 28.533203125, 29.60302734375, 30.6728515625, 31.74267578125, 32.8125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 6.0, 12.0, 16.0, 10.0, 17.0, 23.0, 18.0, 20.0, 27.0, 37.0, 25.0, 34.0, 38.0, 36.0, 46.0, 44.0, 45.0, 39.0, 49.0, 36.0, 48.0, 46.0, 40.0, 31.0, 24.0, 40.0, 22.0, 28.0, 23.0, 27.0, 20.0, 14.0, 13.0, 11.0, 9.0, 8.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.671875, -25.706787109375, -24.74169921875, -23.776611328125, -22.8115234375, -21.846435546875, -20.88134765625, -19.916259765625, -18.951171875, -17.986083984375, -17.02099609375, -16.055908203125, -15.0908203125, -14.125732421875, -13.16064453125, -12.195556640625, -11.23046875, -10.265380859375, -9.30029296875, -8.335205078125, -7.3701171875, -6.405029296875, -5.43994140625, -4.474853515625, -3.509765625, -2.544677734375, -1.57958984375, -0.614501953125, 0.3505859375, 1.315673828125, 2.28076171875, 3.245849609375, 4.2109375, 5.176025390625, 6.14111328125, 7.106201171875, 8.0712890625, 9.036376953125, 10.00146484375, 10.966552734375, 11.931640625, 12.896728515625, 13.86181640625, 14.826904296875, 15.7919921875, 16.757080078125, 17.72216796875, 18.687255859375, 19.65234375, 20.617431640625, 21.58251953125, 22.547607421875, 23.5126953125, 24.477783203125, 25.44287109375, 26.407958984375, 27.373046875, 28.338134765625, 29.30322265625, 30.268310546875, 31.2333984375, 32.198486328125, 33.16357421875, 34.128662109375, 35.09375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 9.0, 11.0, 26.0, 35.0, 70.0, 129.0, 223.0, 504.0, 879.0, 1756.0, 3392.0, 7017.0, 14461.0, 31880.0, 73262.0, 174591.0, 415794.0, 871343.0, 1163478.0, 797461.0, 367344.0, 152677.0, 64043.0, 28093.0, 13169.0, 6317.0, 3066.0, 1513.0, 829.0, 426.0, 204.0, 104.0, 69.0, 38.0, 23.0, 13.0, 6.0, 3.0, 3.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.03125, -55.98974609375, -53.9482421875, -51.90673828125, -49.865234375, -47.82373046875, -45.7822265625, -43.74072265625, -41.69921875, -39.65771484375, -37.6162109375, -35.57470703125, -33.533203125, -31.49169921875, -29.4501953125, -27.40869140625, -25.3671875, -23.32568359375, -21.2841796875, -19.24267578125, -17.201171875, -15.15966796875, -13.1181640625, -11.07666015625, -9.03515625, -6.99365234375, -4.9521484375, -2.91064453125, -0.869140625, 1.17236328125, 3.2138671875, 5.25537109375, 7.296875, 9.33837890625, 11.3798828125, 13.42138671875, 15.462890625, 17.50439453125, 19.5458984375, 21.58740234375, 23.62890625, 25.67041015625, 27.7119140625, 29.75341796875, 31.794921875, 33.83642578125, 35.8779296875, 37.91943359375, 39.9609375, 42.00244140625, 44.0439453125, 46.08544921875, 48.126953125, 50.16845703125, 52.2099609375, 54.25146484375, 56.29296875, 58.33447265625, 60.3759765625, 62.41748046875, 64.458984375, 66.50048828125, 68.5419921875, 70.58349609375, 72.625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 10.0, 9.0, 9.0, 20.0, 20.0, 31.0, 25.0, 39.0, 44.0, 75.0, 80.0, 75.0, 105.0, 126.0, 131.0, 189.0, 186.0, 227.0, 224.0, 259.0, 254.0, 259.0, 212.0, 203.0, 180.0, 190.0, 151.0, 155.0, 98.0, 101.0, 72.0, 54.0, 58.0, 54.0, 35.0, 38.0, 18.0, 11.0, 14.0, 12.0, 10.0, 6.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.71875, -14.2255859375, -13.732421875, -13.2392578125, -12.74609375, -12.2529296875, -11.759765625, -11.2666015625, -10.7734375, -10.2802734375, -9.787109375, -9.2939453125, -8.80078125, -8.3076171875, -7.814453125, -7.3212890625, -6.828125, -6.3349609375, -5.841796875, -5.3486328125, -4.85546875, -4.3623046875, -3.869140625, -3.3759765625, -2.8828125, -2.3896484375, -1.896484375, -1.4033203125, -0.91015625, -0.4169921875, 0.076171875, 0.5693359375, 1.0625, 1.5556640625, 2.048828125, 2.5419921875, 3.03515625, 3.5283203125, 4.021484375, 4.5146484375, 5.0078125, 5.5009765625, 5.994140625, 6.4873046875, 6.98046875, 7.4736328125, 7.966796875, 8.4599609375, 8.953125, 9.4462890625, 9.939453125, 10.4326171875, 10.92578125, 11.4189453125, 11.912109375, 12.4052734375, 12.8984375, 13.3916015625, 13.884765625, 14.3779296875, 14.87109375, 15.3642578125, 15.857421875, 16.3505859375, 16.84375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 4.0, 3.0, 4.0, 10.0, 9.0, 11.0, 16.0, 16.0, 18.0, 33.0, 44.0, 49.0, 38.0, 50.0, 48.0, 58.0, 47.0, 64.0, 55.0, 61.0, 58.0, 52.0, 47.0, 42.0, 38.0, 24.0, 16.0, 24.0, 12.0, 13.0, 6.0, 8.0, 7.0, 9.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.733158111572266, -41.240211486816406, -39.74726104736328, -38.25431442260742, -36.7613639831543, -35.26841735839844, -33.77546691894531, -32.28252029418945, -30.789573669433594, -29.2966251373291, -27.80367660522461, -26.31072998046875, -24.817781448364258, -23.324832916259766, -21.831884384155273, -20.33893585205078, -18.84598731994629, -17.353038787841797, -15.860091209411621, -14.367142677307129, -12.874195098876953, -11.381246566772461, -9.888298034667969, -8.395350456237793, -6.902401924133301, -5.409453868865967, -3.9165055751800537, -2.4235572814941406, -0.9306092262268066, 0.5623388290405273, 2.0552873611450195, 3.5482349395751953, 5.0411834716796875, 6.5341315269470215, 8.027079582214355, 9.520028114318848, 11.012975692749023, 12.505924224853516, 13.998872756958008, 15.491820335388184, 16.98476791381836, 18.47771644592285, 19.970664978027344, 21.463611602783203, 22.956560134887695, 24.449508666992188, 25.94245719909668, 27.435405731201172, 28.928354263305664, 30.421302795410156, 31.91425132751465, 33.40719985961914, 34.900146484375, 36.393096923828125, 37.886043548583984, 39.378990173339844, 40.87194061279297, 42.36488723754883, 43.85783767700195, 45.35078430175781, 46.84373474121094, 48.3366813659668, 49.829627990722656, 51.32257843017578, 52.81552505493164]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 6.0, 5.0, 14.0, 8.0, 7.0, 19.0, 19.0, 14.0, 22.0, 27.0, 38.0, 40.0, 32.0, 39.0, 39.0, 43.0, 60.0, 48.0, 46.0, 37.0, 43.0, 47.0, 36.0, 36.0, 41.0, 40.0, 21.0, 40.0, 28.0, 15.0, 19.0, 21.0, 12.0, 10.0, 7.0, 7.0, 5.0, 3.0, 7.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.154190063476562, -28.934864044189453, -27.715539932250977, -26.496213912963867, -25.27688980102539, -24.05756378173828, -22.838237762451172, -21.618911743164062, -20.399587631225586, -19.180261611938477, -17.9609375, -16.74161148071289, -15.522286415100098, -14.302961349487305, -13.083635330200195, -11.864310264587402, -10.64498519897461, -9.425660133361816, -8.206335067749023, -6.987009048461914, -5.767683982849121, -4.548358917236328, -3.329033374786377, -2.109707832336426, -0.8903827667236328, 0.32894253730773926, 1.5482678413391113, 2.7675931453704834, 3.9869184494018555, 5.206243515014648, 6.4255690574646, 7.644894599914551, 8.86422348022461, 10.083548545837402, 11.302873611450195, 12.522199630737305, 13.741524696350098, 14.96084976196289, 16.18017578125, 17.39950180053711, 18.618825912475586, 19.838151931762695, 21.057476043701172, 22.27680206298828, 23.49612808227539, 24.715452194213867, 25.934778213500977, 27.154102325439453, 28.373428344726562, 29.592754364013672, 30.81207847595215, 32.031402587890625, 33.250728607177734, 34.470054626464844, 35.68938064575195, 36.90870666503906, 38.128028869628906, 39.347354888916016, 40.566680908203125, 41.78600311279297, 43.00532913208008, 44.22465515136719, 45.4439811706543, 46.663307189941406, 47.882633209228516]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 5.0, 9.0, 6.0, 16.0, 28.0, 53.0, 71.0, 81.0, 146.0, 271.0, 350.0, 571.0, 906.0, 1372.0, 2118.0, 3424.0, 5461.0, 8747.0, 14234.0, 23135.0, 36757.0, 58280.0, 89490.0, 126508.0, 156072.0, 155709.0, 124866.0, 87631.0, 56808.0, 35975.0, 22326.0, 13826.0, 8765.0, 5314.0, 3379.0, 2092.0, 1358.0, 812.0, 575.0, 361.0, 225.0, 158.0, 90.0, 71.0, 38.0, 23.0, 15.0, 11.0, 10.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.34375, -14.8638916015625, -14.384033203125, -13.9041748046875, -13.42431640625, -12.9444580078125, -12.464599609375, -11.9847412109375, -11.5048828125, -11.0250244140625, -10.545166015625, -10.0653076171875, -9.58544921875, -9.1055908203125, -8.625732421875, -8.1458740234375, -7.666015625, -7.1861572265625, -6.706298828125, -6.2264404296875, -5.74658203125, -5.2667236328125, -4.786865234375, -4.3070068359375, -3.8271484375, -3.3472900390625, -2.867431640625, -2.3875732421875, -1.90771484375, -1.4278564453125, -0.947998046875, -0.4681396484375, 0.01171875, 0.4915771484375, 0.971435546875, 1.4512939453125, 1.93115234375, 2.4110107421875, 2.890869140625, 3.3707275390625, 3.8505859375, 4.3304443359375, 4.810302734375, 5.2901611328125, 5.77001953125, 6.2498779296875, 6.729736328125, 7.2095947265625, 7.689453125, 8.1693115234375, 8.649169921875, 9.1290283203125, 9.60888671875, 10.0887451171875, 10.568603515625, 11.0484619140625, 11.5283203125, 12.0081787109375, 12.488037109375, 12.9678955078125, 13.44775390625, 13.9276123046875, 14.407470703125, 14.8873291015625, 15.3671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 1.0, 3.0, 4.0, 9.0, 9.0, 11.0, 15.0, 21.0, 19.0, 21.0, 19.0, 30.0, 39.0, 34.0, 38.0, 39.0, 39.0, 52.0, 52.0, 51.0, 38.0, 48.0, 57.0, 43.0, 39.0, 45.0, 34.0, 22.0, 30.0, 33.0, 23.0, 21.0, 17.0, 13.0, 7.0, 9.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.28125, -30.93359375, -29.5859375, -28.23828125, -26.890625, -25.54296875, -24.1953125, -22.84765625, -21.5, -20.15234375, -18.8046875, -17.45703125, -16.109375, -14.76171875, -13.4140625, -12.06640625, -10.71875, -9.37109375, -8.0234375, -6.67578125, -5.328125, -3.98046875, -2.6328125, -1.28515625, 0.0625, 1.41015625, 2.7578125, 4.10546875, 5.453125, 6.80078125, 8.1484375, 9.49609375, 10.84375, 12.19140625, 13.5390625, 14.88671875, 16.234375, 17.58203125, 18.9296875, 20.27734375, 21.625, 22.97265625, 24.3203125, 25.66796875, 27.015625, 28.36328125, 29.7109375, 31.05859375, 32.40625, 33.75390625, 35.1015625, 36.44921875, 37.796875, 39.14453125, 40.4921875, 41.83984375, 43.1875, 44.53515625, 45.8828125, 47.23046875, 48.578125, 49.92578125, 51.2734375, 52.62109375, 53.96875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 20.0, 20.0, 23.0, 42.0, 51.0, 89.0, 124.0, 207.0, 323.0, 493.0, 741.0, 1156.0, 1830.0, 2720.0, 4375.0, 7144.0, 11327.0, 18440.0, 30400.0, 48974.0, 78881.0, 121628.0, 164321.0, 172690.0, 138461.0, 92586.0, 58047.0, 35375.0, 22070.0, 13357.0, 8120.0, 5201.0, 3346.0, 2087.0, 1414.0, 889.0, 513.0, 338.0, 228.0, 159.0, 96.0, 77.0, 64.0, 29.0, 34.0, 11.0, 10.0, 9.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-18.8125, -18.227783203125, -17.64306640625, -17.058349609375, -16.4736328125, -15.888916015625, -15.30419921875, -14.719482421875, -14.134765625, -13.550048828125, -12.96533203125, -12.380615234375, -11.7958984375, -11.211181640625, -10.62646484375, -10.041748046875, -9.45703125, -8.872314453125, -8.28759765625, -7.702880859375, -7.1181640625, -6.533447265625, -5.94873046875, -5.364013671875, -4.779296875, -4.194580078125, -3.60986328125, -3.025146484375, -2.4404296875, -1.855712890625, -1.27099609375, -0.686279296875, -0.1015625, 0.483154296875, 1.06787109375, 1.652587890625, 2.2373046875, 2.822021484375, 3.40673828125, 3.991455078125, 4.576171875, 5.160888671875, 5.74560546875, 6.330322265625, 6.9150390625, 7.499755859375, 8.08447265625, 8.669189453125, 9.25390625, 9.838623046875, 10.42333984375, 11.008056640625, 11.5927734375, 12.177490234375, 12.76220703125, 13.346923828125, 13.931640625, 14.516357421875, 15.10107421875, 15.685791015625, 16.2705078125, 16.855224609375, 17.43994140625, 18.024658203125, 18.609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 5.0, 7.0, 9.0, 14.0, 12.0, 16.0, 21.0, 14.0, 23.0, 25.0, 21.0, 36.0, 38.0, 30.0, 36.0, 38.0, 42.0, 35.0, 36.0, 46.0, 48.0, 48.0, 52.0, 36.0, 44.0, 34.0, 21.0, 25.0, 36.0, 20.0, 20.0, 18.0, 12.0, 6.0, 13.0, 11.0, 5.0, 7.0, 4.0, 9.0, 2.0, 2.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.625, -21.921630859375, -21.21826171875, -20.514892578125, -19.8115234375, -19.108154296875, -18.40478515625, -17.701416015625, -16.998046875, -16.294677734375, -15.59130859375, -14.887939453125, -14.1845703125, -13.481201171875, -12.77783203125, -12.074462890625, -11.37109375, -10.667724609375, -9.96435546875, -9.260986328125, -8.5576171875, -7.854248046875, -7.15087890625, -6.447509765625, -5.744140625, -5.040771484375, -4.33740234375, -3.634033203125, -2.9306640625, -2.227294921875, -1.52392578125, -0.820556640625, -0.1171875, 0.586181640625, 1.28955078125, 1.992919921875, 2.6962890625, 3.399658203125, 4.10302734375, 4.806396484375, 5.509765625, 6.213134765625, 6.91650390625, 7.619873046875, 8.3232421875, 9.026611328125, 9.72998046875, 10.433349609375, 11.13671875, 11.840087890625, 12.54345703125, 13.246826171875, 13.9501953125, 14.653564453125, 15.35693359375, 16.060302734375, 16.763671875, 17.467041015625, 18.17041015625, 18.873779296875, 19.5771484375, 20.280517578125, 20.98388671875, 21.687255859375, 22.390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 8.0, 9.0, 15.0, 13.0, 23.0, 43.0, 58.0, 73.0, 110.0, 186.0, 278.0, 392.0, 694.0, 1094.0, 1858.0, 3420.0, 6007.0, 11303.0, 22388.0, 44726.0, 87633.0, 160392.0, 233847.0, 210787.0, 127219.0, 65914.0, 33187.0, 16715.0, 8698.0, 4686.0, 2554.0, 1591.0, 952.0, 641.0, 346.0, 233.0, 169.0, 85.0, 55.0, 49.0, 32.0, 20.0, 19.0, 7.0, 10.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-7.328125, -7.11749267578125, -6.9068603515625, -6.69622802734375, -6.485595703125, -6.27496337890625, -6.0643310546875, -5.85369873046875, -5.64306640625, -5.43243408203125, -5.2218017578125, -5.01116943359375, -4.800537109375, -4.58990478515625, -4.3792724609375, -4.16864013671875, -3.9580078125, -3.74737548828125, -3.5367431640625, -3.32611083984375, -3.115478515625, -2.90484619140625, -2.6942138671875, -2.48358154296875, -2.27294921875, -2.06231689453125, -1.8516845703125, -1.64105224609375, -1.430419921875, -1.21978759765625, -1.0091552734375, -0.79852294921875, -0.587890625, -0.37725830078125, -0.1666259765625, 0.04400634765625, 0.254638671875, 0.46527099609375, 0.6759033203125, 0.88653564453125, 1.09716796875, 1.30780029296875, 1.5184326171875, 1.72906494140625, 1.939697265625, 2.15032958984375, 2.3609619140625, 2.57159423828125, 2.7822265625, 2.99285888671875, 3.2034912109375, 3.41412353515625, 3.624755859375, 3.83538818359375, 4.0460205078125, 4.25665283203125, 4.46728515625, 4.67791748046875, 4.8885498046875, 5.09918212890625, 5.309814453125, 5.52044677734375, 5.7310791015625, 5.94171142578125, 6.15234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 8.0, 6.0, 10.0, 8.0, 15.0, 11.0, 13.0, 23.0, 38.0, 40.0, 47.0, 49.0, 35.0, 49.0, 57.0, 61.0, 54.0, 51.0, 47.0, 46.0, 55.0, 46.0, 39.0, 35.0, 26.0, 22.0, 23.0, 17.0, 12.0, 11.0, 7.0, 7.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0004603862762451172, -0.0004449225962162018, -0.0004294589161872864, -0.00041399523615837097, -0.00039853155612945557, -0.00038306787610054016, -0.00036760419607162476, -0.00035214051604270935, -0.00033667683601379395, -0.00032121315598487854, -0.00030574947595596313, -0.00029028579592704773, -0.0002748221158981323, -0.0002593584358692169, -0.00024389475584030151, -0.0002284310758113861, -0.0002129673957824707, -0.0001975037157535553, -0.0001820400357246399, -0.0001665763556957245, -0.00015111267566680908, -0.00013564899563789368, -0.00012018531560897827, -0.00010472163558006287, -8.925795555114746e-05, -7.379427552223206e-05, -5.833059549331665e-05, -4.2866915464401245e-05, -2.740323543548584e-05, -1.1939555406570435e-05, 3.5241246223449707e-06, 1.8987804651260376e-05, 3.445148468017578e-05, 4.9915164709091187e-05, 6.537884473800659e-05, 8.0842524766922e-05, 9.63062047958374e-05, 0.00011176988482475281, 0.0001272335648536682, 0.00014269724488258362, 0.00015816092491149902, 0.00017362460494041443, 0.00018908828496932983, 0.00020455196499824524, 0.00022001564502716064, 0.00023547932505607605, 0.00025094300508499146, 0.00026640668511390686, 0.00028187036514282227, 0.00029733404517173767, 0.0003127977252006531, 0.0003282614052295685, 0.0003437250852584839, 0.0003591887652873993, 0.0003746524453163147, 0.0003901161253452301, 0.0004055798053741455, 0.0004210434854030609, 0.0004365071654319763, 0.0004519708454608917, 0.00046743452548980713, 0.00048289820551872253, 0.0004983618855476379, 0.0005138255655765533, 0.0005292892456054688]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 8.0, 10.0, 17.0, 24.0, 34.0, 51.0, 89.0, 156.0, 282.0, 529.0, 967.0, 1910.0, 3870.0, 8171.0, 17947.0, 41519.0, 97837.0, 205482.0, 285722.0, 207269.0, 100305.0, 42075.0, 18024.0, 8261.0, 3882.0, 1848.0, 1032.0, 542.0, 274.0, 171.0, 76.0, 59.0, 41.0, 20.0, 14.0, 10.0, 12.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0703125, -9.740234375, -9.41015625, -9.080078125, -8.75, -8.419921875, -8.08984375, -7.759765625, -7.4296875, -7.099609375, -6.76953125, -6.439453125, -6.109375, -5.779296875, -5.44921875, -5.119140625, -4.7890625, -4.458984375, -4.12890625, -3.798828125, -3.46875, -3.138671875, -2.80859375, -2.478515625, -2.1484375, -1.818359375, -1.48828125, -1.158203125, -0.828125, -0.498046875, -0.16796875, 0.162109375, 0.4921875, 0.822265625, 1.15234375, 1.482421875, 1.8125, 2.142578125, 2.47265625, 2.802734375, 3.1328125, 3.462890625, 3.79296875, 4.123046875, 4.453125, 4.783203125, 5.11328125, 5.443359375, 5.7734375, 6.103515625, 6.43359375, 6.763671875, 7.09375, 7.423828125, 7.75390625, 8.083984375, 8.4140625, 8.744140625, 9.07421875, 9.404296875, 9.734375, 10.064453125, 10.39453125, 10.724609375, 11.0546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 4.0, 10.0, 9.0, 18.0, 19.0, 26.0, 25.0, 44.0, 37.0, 35.0, 56.0, 79.0, 63.0, 78.0, 64.0, 69.0, 46.0, 61.0, 51.0, 47.0, 32.0, 35.0, 15.0, 13.0, 16.0, 7.0, 14.0, 2.0, 8.0, 5.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09375, -2.994964599609375, -2.89617919921875, -2.797393798828125, -2.6986083984375, -2.599822998046875, -2.50103759765625, -2.402252197265625, -2.303466796875, -2.204681396484375, -2.10589599609375, -2.007110595703125, -1.9083251953125, -1.809539794921875, -1.71075439453125, -1.611968994140625, -1.51318359375, -1.414398193359375, -1.31561279296875, -1.216827392578125, -1.1180419921875, -1.019256591796875, -0.92047119140625, -0.821685791015625, -0.722900390625, -0.624114990234375, -0.52532958984375, -0.426544189453125, -0.3277587890625, -0.228973388671875, -0.13018798828125, -0.031402587890625, 0.0673828125, 0.166168212890625, 0.26495361328125, 0.363739013671875, 0.4625244140625, 0.561309814453125, 0.66009521484375, 0.758880615234375, 0.857666015625, 0.956451416015625, 1.05523681640625, 1.154022216796875, 1.2528076171875, 1.351593017578125, 1.45037841796875, 1.549163818359375, 1.64794921875, 1.746734619140625, 1.84552001953125, 1.944305419921875, 2.0430908203125, 2.141876220703125, 2.24066162109375, 2.339447021484375, 2.438232421875, 2.537017822265625, 2.63580322265625, 2.734588623046875, 2.8333740234375, 2.932159423828125, 3.03094482421875, 3.129730224609375, 3.228515625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 5.0, 6.0, 5.0, 4.0, 11.0, 13.0, 18.0, 18.0, 33.0, 44.0, 40.0, 45.0, 50.0, 55.0, 63.0, 56.0, 63.0, 64.0, 58.0, 60.0, 58.0, 53.0, 28.0, 38.0, 25.0, 24.0, 14.0, 11.0, 10.0, 13.0, 6.0, 7.0, 5.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.611724853515625, -44.01176071166992, -42.41179275512695, -40.81182861328125, -39.21186065673828, -37.61189651489258, -36.011932373046875, -34.411964416503906, -32.8120002746582, -31.212034225463867, -29.61206817626953, -28.012104034423828, -26.412137985229492, -24.812171936035156, -23.21220588684082, -21.612239837646484, -20.01227378845215, -18.412307739257812, -16.812341690063477, -15.212376594543457, -13.612411499023438, -12.012445449829102, -10.412479400634766, -8.812514305114746, -7.21254825592041, -5.612582683563232, -4.012617111206055, -2.4126510620117188, -0.812685489654541, 0.7872800827026367, 2.3872461318969727, 3.987211227416992, 5.587177276611328, 7.187142848968506, 8.787108421325684, 10.38707447052002, 11.987039566040039, 13.587005615234375, 15.186971664428711, 16.786937713623047, 18.38690185546875, 19.986867904663086, 21.586833953857422, 23.186798095703125, 24.78676414489746, 26.386730194091797, 27.986696243286133, 29.58666229248047, 31.186628341674805, 32.78659439086914, 34.386558532714844, 35.98652648925781, 37.586490631103516, 39.18645477294922, 40.78642272949219, 42.38638687133789, 43.98635482788086, 45.58631896972656, 47.18628692626953, 48.786251068115234, 50.3862190246582, 51.986183166503906, 53.586151123046875, 55.18611526489258, 56.78607940673828]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 8.0, 9.0, 10.0, 13.0, 17.0, 21.0, 13.0, 20.0, 29.0, 40.0, 32.0, 36.0, 46.0, 31.0, 52.0, 52.0, 53.0, 37.0, 46.0, 49.0, 36.0, 41.0, 40.0, 37.0, 34.0, 26.0, 37.0, 25.0, 13.0, 23.0, 21.0, 10.0, 9.0, 7.0, 5.0, 6.0, 9.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.726268768310547, -28.51274871826172, -27.29922866821289, -26.085708618164062, -24.872188568115234, -23.658668518066406, -22.445148468017578, -21.23162841796875, -20.018108367919922, -18.804588317871094, -17.591068267822266, -16.377548217773438, -15.16402816772461, -13.950508117675781, -12.736988067626953, -11.523468017578125, -10.309947967529297, -9.096427917480469, -7.882907867431641, -6.6693878173828125, -5.455867767333984, -4.242347717285156, -3.028827667236328, -1.8153076171875, -0.6017875671386719, 0.6117324829101562, 1.8252525329589844, 3.0387725830078125, 4.252292633056641, 5.465812683105469, 6.679332733154297, 7.892852783203125, 9.106372833251953, 10.319892883300781, 11.53341293334961, 12.746932983398438, 13.960453033447266, 15.173973083496094, 16.387493133544922, 17.60101318359375, 18.814533233642578, 20.028053283691406, 21.241573333740234, 22.455093383789062, 23.66861343383789, 24.88213348388672, 26.095653533935547, 27.309173583984375, 28.522693634033203, 29.73621368408203, 30.94973373413086, 32.16325378417969, 33.376773834228516, 34.590293884277344, 35.80381393432617, 37.017333984375, 38.23085403442383, 39.444374084472656, 40.657894134521484, 41.87141418457031, 43.08493423461914, 44.29845428466797, 45.5119743347168, 46.725494384765625, 47.93901443481445]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 11.0, 16.0, 28.0, 39.0, 53.0, 64.0, 111.0, 175.0, 220.0, 356.0, 547.0, 841.0, 1271.0, 1850.0, 2868.0, 4395.0, 6670.0, 10028.0, 15175.0, 22286.0, 32666.0, 46639.0, 62924.0, 82274.0, 100262.0, 111837.0, 114269.0, 105514.0, 89426.0, 70010.0, 51820.0, 36792.0, 25574.0, 17281.0, 11591.0, 7809.0, 5094.0, 3375.0, 2165.0, 1414.0, 941.0, 624.0, 410.0, 271.0, 181.0, 130.0, 89.0, 46.0, 43.0, 30.0, 22.0, 14.0, 5.0, 3.0, 1.0, 3.0, 5.0], "bins": [-27.125, -26.307373046875, -25.48974609375, -24.672119140625, -23.8544921875, -23.036865234375, -22.21923828125, -21.401611328125, -20.583984375, -19.766357421875, -18.94873046875, -18.131103515625, -17.3134765625, -16.495849609375, -15.67822265625, -14.860595703125, -14.04296875, -13.225341796875, -12.40771484375, -11.590087890625, -10.7724609375, -9.954833984375, -9.13720703125, -8.319580078125, -7.501953125, -6.684326171875, -5.86669921875, -5.049072265625, -4.2314453125, -3.413818359375, -2.59619140625, -1.778564453125, -0.9609375, -0.143310546875, 0.67431640625, 1.491943359375, 2.3095703125, 3.127197265625, 3.94482421875, 4.762451171875, 5.580078125, 6.397705078125, 7.21533203125, 8.032958984375, 8.8505859375, 9.668212890625, 10.48583984375, 11.303466796875, 12.12109375, 12.938720703125, 13.75634765625, 14.573974609375, 15.3916015625, 16.209228515625, 17.02685546875, 17.844482421875, 18.662109375, 19.479736328125, 20.29736328125, 21.114990234375, 21.9326171875, 22.750244140625, 23.56787109375, 24.385498046875, 25.203125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 6.0, 1.0, 10.0, 4.0, 4.0, 17.0, 15.0, 19.0, 19.0, 25.0, 32.0, 43.0, 30.0, 35.0, 41.0, 41.0, 49.0, 63.0, 36.0, 41.0, 48.0, 43.0, 39.0, 46.0, 37.0, 51.0, 40.0, 29.0, 29.0, 24.0, 21.0, 14.0, 15.0, 10.0, 4.0, 11.0, 8.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.234375, -29.909423828125, -28.58447265625, -27.259521484375, -25.9345703125, -24.609619140625, -23.28466796875, -21.959716796875, -20.634765625, -19.309814453125, -17.98486328125, -16.659912109375, -15.3349609375, -14.010009765625, -12.68505859375, -11.360107421875, -10.03515625, -8.710205078125, -7.38525390625, -6.060302734375, -4.7353515625, -3.410400390625, -2.08544921875, -0.760498046875, 0.564453125, 1.889404296875, 3.21435546875, 4.539306640625, 5.8642578125, 7.189208984375, 8.51416015625, 9.839111328125, 11.1640625, 12.489013671875, 13.81396484375, 15.138916015625, 16.4638671875, 17.788818359375, 19.11376953125, 20.438720703125, 21.763671875, 23.088623046875, 24.41357421875, 25.738525390625, 27.0634765625, 28.388427734375, 29.71337890625, 31.038330078125, 32.36328125, 33.688232421875, 35.01318359375, 36.338134765625, 37.6630859375, 38.988037109375, 40.31298828125, 41.637939453125, 42.962890625, 44.287841796875, 45.61279296875, 46.937744140625, 48.2626953125, 49.587646484375, 50.91259765625, 52.237548828125, 53.5625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 9.0, 13.0, 24.0, 39.0, 52.0, 70.0, 119.0, 198.0, 317.0, 447.0, 702.0, 1040.0, 1613.0, 2563.0, 4092.0, 6248.0, 9350.0, 14500.0, 21899.0, 32878.0, 46898.0, 65816.0, 86611.0, 105228.0, 117219.0, 117992.0, 106768.0, 88636.0, 67468.0, 49321.0, 34036.0, 23194.0, 15209.0, 9909.0, 6283.0, 4194.0, 2595.0, 1802.0, 1128.0, 719.0, 482.0, 295.0, 212.0, 128.0, 78.0, 60.0, 36.0, 25.0, 16.0, 11.0, 7.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.609375, -27.716796875, -26.82421875, -25.931640625, -25.0390625, -24.146484375, -23.25390625, -22.361328125, -21.46875, -20.576171875, -19.68359375, -18.791015625, -17.8984375, -17.005859375, -16.11328125, -15.220703125, -14.328125, -13.435546875, -12.54296875, -11.650390625, -10.7578125, -9.865234375, -8.97265625, -8.080078125, -7.1875, -6.294921875, -5.40234375, -4.509765625, -3.6171875, -2.724609375, -1.83203125, -0.939453125, -0.046875, 0.845703125, 1.73828125, 2.630859375, 3.5234375, 4.416015625, 5.30859375, 6.201171875, 7.09375, 7.986328125, 8.87890625, 9.771484375, 10.6640625, 11.556640625, 12.44921875, 13.341796875, 14.234375, 15.126953125, 16.01953125, 16.912109375, 17.8046875, 18.697265625, 19.58984375, 20.482421875, 21.375, 22.267578125, 23.16015625, 24.052734375, 24.9453125, 25.837890625, 26.73046875, 27.623046875, 28.515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 10.0, 4.0, 6.0, 4.0, 5.0, 8.0, 15.0, 18.0, 9.0, 20.0, 20.0, 30.0, 19.0, 31.0, 35.0, 35.0, 33.0, 33.0, 35.0, 50.0, 41.0, 43.0, 44.0, 45.0, 30.0, 42.0, 49.0, 27.0, 42.0, 30.0, 35.0, 30.0, 22.0, 15.0, 21.0, 14.0, 15.0, 11.0, 8.0, 4.0, 9.0, 3.0, 2.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.40625, -22.660400390625, -21.91455078125, -21.168701171875, -20.4228515625, -19.677001953125, -18.93115234375, -18.185302734375, -17.439453125, -16.693603515625, -15.94775390625, -15.201904296875, -14.4560546875, -13.710205078125, -12.96435546875, -12.218505859375, -11.47265625, -10.726806640625, -9.98095703125, -9.235107421875, -8.4892578125, -7.743408203125, -6.99755859375, -6.251708984375, -5.505859375, -4.760009765625, -4.01416015625, -3.268310546875, -2.5224609375, -1.776611328125, -1.03076171875, -0.284912109375, 0.4609375, 1.206787109375, 1.95263671875, 2.698486328125, 3.4443359375, 4.190185546875, 4.93603515625, 5.681884765625, 6.427734375, 7.173583984375, 7.91943359375, 8.665283203125, 9.4111328125, 10.156982421875, 10.90283203125, 11.648681640625, 12.39453125, 13.140380859375, 13.88623046875, 14.632080078125, 15.3779296875, 16.123779296875, 16.86962890625, 17.615478515625, 18.361328125, 19.107177734375, 19.85302734375, 20.598876953125, 21.3447265625, 22.090576171875, 22.83642578125, 23.582275390625, 24.328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 7.0, 11.0, 15.0, 20.0, 28.0, 31.0, 60.0, 60.0, 104.0, 131.0, 197.0, 307.0, 462.0, 740.0, 1250.0, 2163.0, 4125.0, 8078.0, 16903.0, 37039.0, 81309.0, 163529.0, 247860.0, 229338.0, 134230.0, 63351.0, 28850.0, 13549.0, 6567.0, 3379.0, 1866.0, 1064.0, 645.0, 391.0, 259.0, 179.0, 124.0, 96.0, 70.0, 48.0, 36.0, 29.0, 18.0, 11.0, 6.0, 6.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.171875, -22.420654296875, -21.66943359375, -20.918212890625, -20.1669921875, -19.415771484375, -18.66455078125, -17.913330078125, -17.162109375, -16.410888671875, -15.65966796875, -14.908447265625, -14.1572265625, -13.406005859375, -12.65478515625, -11.903564453125, -11.15234375, -10.401123046875, -9.64990234375, -8.898681640625, -8.1474609375, -7.396240234375, -6.64501953125, -5.893798828125, -5.142578125, -4.391357421875, -3.64013671875, -2.888916015625, -2.1376953125, -1.386474609375, -0.63525390625, 0.115966796875, 0.8671875, 1.618408203125, 2.36962890625, 3.120849609375, 3.8720703125, 4.623291015625, 5.37451171875, 6.125732421875, 6.876953125, 7.628173828125, 8.37939453125, 9.130615234375, 9.8818359375, 10.633056640625, 11.38427734375, 12.135498046875, 12.88671875, 13.637939453125, 14.38916015625, 15.140380859375, 15.8916015625, 16.642822265625, 17.39404296875, 18.145263671875, 18.896484375, 19.647705078125, 20.39892578125, 21.150146484375, 21.9013671875, 22.652587890625, 23.40380859375, 24.155029296875, 24.90625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 3.0, 7.0, 8.0, 13.0, 12.0, 31.0, 28.0, 51.0, 74.0, 83.0, 95.0, 103.0, 99.0, 95.0, 68.0, 64.0, 41.0, 38.0, 28.0, 16.0, 15.0, 8.0, 6.0, 4.0, 4.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0021762847900390625, -0.0020858049392700195, -0.0019953250885009766, -0.0019048452377319336, -0.0018143653869628906, -0.0017238855361938477, -0.0016334056854248047, -0.0015429258346557617, -0.0014524459838867188, -0.0013619661331176758, -0.0012714862823486328, -0.0011810064315795898, -0.0010905265808105469, -0.001000046730041504, -0.0009095668792724609, -0.000819087028503418, -0.000728607177734375, -0.000638127326965332, -0.0005476474761962891, -0.0004571676254272461, -0.0003666877746582031, -0.00027620792388916016, -0.0001857280731201172, -9.524822235107422e-05, -4.76837158203125e-06, 8.571147918701172e-05, 0.0001761913299560547, 0.00026667118072509766, 0.0003571510314941406, 0.0004476308822631836, 0.0005381107330322266, 0.0006285905838012695, 0.0007190704345703125, 0.0008095502853393555, 0.0009000301361083984, 0.0009905099868774414, 0.0010809898376464844, 0.0011714696884155273, 0.0012619495391845703, 0.0013524293899536133, 0.0014429092407226562, 0.0015333890914916992, 0.0016238689422607422, 0.0017143487930297852, 0.0018048286437988281, 0.001895308494567871, 0.001985788345336914, 0.002076268196105957, 0.002166748046875, 0.002257227897644043, 0.002347707748413086, 0.002438187599182129, 0.002528667449951172, 0.002619147300720215, 0.002709627151489258, 0.0028001070022583008, 0.0028905868530273438, 0.0029810667037963867, 0.0030715465545654297, 0.0031620264053344727, 0.0032525062561035156, 0.0033429861068725586, 0.0034334659576416016, 0.0035239458084106445, 0.0036144256591796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 11.0, 6.0, 11.0, 16.0, 16.0, 25.0, 31.0, 46.0, 58.0, 85.0, 132.0, 182.0, 283.0, 376.0, 547.0, 825.0, 1264.0, 2140.0, 3704.0, 6627.0, 12501.0, 24432.0, 50253.0, 102209.0, 184205.0, 239875.0, 194689.0, 111331.0, 55137.0, 26482.0, 13400.0, 7098.0, 4047.0, 2319.0, 1474.0, 858.0, 574.0, 408.0, 265.0, 184.0, 131.0, 93.0, 55.0, 39.0, 39.0, 21.0, 17.0, 13.0, 10.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0], "bins": [-25.71875, -24.974609375, -24.23046875, -23.486328125, -22.7421875, -21.998046875, -21.25390625, -20.509765625, -19.765625, -19.021484375, -18.27734375, -17.533203125, -16.7890625, -16.044921875, -15.30078125, -14.556640625, -13.8125, -13.068359375, -12.32421875, -11.580078125, -10.8359375, -10.091796875, -9.34765625, -8.603515625, -7.859375, -7.115234375, -6.37109375, -5.626953125, -4.8828125, -4.138671875, -3.39453125, -2.650390625, -1.90625, -1.162109375, -0.41796875, 0.326171875, 1.0703125, 1.814453125, 2.55859375, 3.302734375, 4.046875, 4.791015625, 5.53515625, 6.279296875, 7.0234375, 7.767578125, 8.51171875, 9.255859375, 10.0, 10.744140625, 11.48828125, 12.232421875, 12.9765625, 13.720703125, 14.46484375, 15.208984375, 15.953125, 16.697265625, 17.44140625, 18.185546875, 18.9296875, 19.673828125, 20.41796875, 21.162109375, 21.90625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 4.0, 1.0, 11.0, 12.0, 8.0, 26.0, 14.0, 27.0, 34.0, 38.0, 47.0, 49.0, 50.0, 74.0, 64.0, 63.0, 61.0, 56.0, 51.0, 51.0, 55.0, 33.0, 26.0, 44.0, 19.0, 14.0, 8.0, 10.0, 13.0, 6.0, 5.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.86883544921875, -5.6478271484375, -5.42681884765625, -5.205810546875, -4.98480224609375, -4.7637939453125, -4.54278564453125, -4.32177734375, -4.10076904296875, -3.8797607421875, -3.65875244140625, -3.437744140625, -3.21673583984375, -2.9957275390625, -2.77471923828125, -2.5537109375, -2.33270263671875, -2.1116943359375, -1.89068603515625, -1.669677734375, -1.44866943359375, -1.2276611328125, -1.00665283203125, -0.78564453125, -0.56463623046875, -0.3436279296875, -0.12261962890625, 0.098388671875, 0.31939697265625, 0.5404052734375, 0.76141357421875, 0.982421875, 1.20343017578125, 1.4244384765625, 1.64544677734375, 1.866455078125, 2.08746337890625, 2.3084716796875, 2.52947998046875, 2.75048828125, 2.97149658203125, 3.1925048828125, 3.41351318359375, 3.634521484375, 3.85552978515625, 4.0765380859375, 4.29754638671875, 4.5185546875, 4.73956298828125, 4.9605712890625, 5.18157958984375, 5.402587890625, 5.62359619140625, 5.8446044921875, 6.06561279296875, 6.28662109375, 6.50762939453125, 6.7286376953125, 6.94964599609375, 7.170654296875, 7.39166259765625, 7.6126708984375, 7.83367919921875, 8.0546875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 2.0, 4.0, 8.0, 9.0, 19.0, 15.0, 14.0, 20.0, 40.0, 42.0, 50.0, 54.0, 58.0, 38.0, 52.0, 55.0, 59.0, 56.0, 64.0, 69.0, 38.0, 38.0, 32.0, 35.0, 26.0, 21.0, 21.0, 12.0, 14.0, 10.0, 7.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-52.97416687011719, -51.42745590209961, -49.88074493408203, -48.33403396606445, -46.787322998046875, -45.24061584472656, -43.69390106201172, -42.147193908691406, -40.60048294067383, -39.05377197265625, -37.50706100463867, -35.960350036621094, -34.413639068603516, -32.86692810058594, -31.320219039916992, -29.773509979248047, -28.226797103881836, -26.680086135864258, -25.13337516784668, -23.586666107177734, -22.039955139160156, -20.493244171142578, -18.946533203125, -17.399822235107422, -15.85311222076416, -14.306401252746582, -12.75969123840332, -11.212980270385742, -9.666269302368164, -8.119559288024902, -6.572848320007324, -5.0261383056640625, -3.4794273376464844, -1.932716727256775, -0.38600611686706543, 1.1607046127319336, 2.7074151039123535, 4.254125595092773, 5.800836563110352, 7.347546577453613, 8.894257545471191, 10.44096851348877, 11.987678527832031, 13.53438949584961, 15.081100463867188, 16.627811431884766, 18.174522399902344, 19.72123146057129, 21.267942428588867, 22.814653396606445, 24.361364364624023, 25.90807342529297, 27.454784393310547, 29.001495361328125, 30.548206329345703, 32.09491729736328, 33.64162826538086, 35.18833923339844, 36.735050201416016, 38.281761169433594, 39.82847213745117, 41.37518310546875, 42.92189025878906, 44.46860122680664, 46.01531219482422]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 8.0, 8.0, 8.0, 9.0, 14.0, 18.0, 19.0, 19.0, 36.0, 20.0, 24.0, 34.0, 40.0, 38.0, 43.0, 32.0, 41.0, 46.0, 43.0, 48.0, 35.0, 33.0, 58.0, 29.0, 29.0, 30.0, 45.0, 30.0, 21.0, 32.0, 22.0, 14.0, 10.0, 11.0, 7.0, 8.0, 9.0, 6.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.671630859375, -38.380489349365234, -37.0893440246582, -35.79820251464844, -34.507057189941406, -33.21591567993164, -31.924774169921875, -30.633630752563477, -29.342487335205078, -28.05134391784668, -26.76020050048828, -25.469058990478516, -24.177915573120117, -22.88677215576172, -21.595630645751953, -20.304487228393555, -19.013343811035156, -17.722200393676758, -16.43105697631836, -15.139915466308594, -13.848772048950195, -12.557628631591797, -11.266486167907715, -9.975343704223633, -8.684200286865234, -7.393057346343994, -6.101914405822754, -4.810771465301514, -3.5196285247802734, -2.228485584259033, -0.937342643737793, 0.35379981994628906, 1.6449432373046875, 2.9360861778259277, 4.227229118347168, 5.518372058868408, 6.809514999389648, 8.100658416748047, 9.391800880432129, 10.682943344116211, 11.97408676147461, 13.265230178833008, 14.55637264251709, 15.847515106201172, 17.13865852355957, 18.42980194091797, 19.720943450927734, 21.012086868286133, 22.30323028564453, 23.59437370300293, 24.885517120361328, 26.176658630371094, 27.467802047729492, 28.75894546508789, 30.050086975097656, 31.341230392456055, 32.63237380981445, 33.92351531982422, 35.21466064453125, 36.505802154541016, 37.79694366455078, 39.08808898925781, 40.37923049926758, 41.670372009277344, 42.961517333984375]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 7.0, 0.0, 8.0, 6.0, 14.0, 20.0, 34.0, 48.0, 74.0, 107.0, 149.0, 230.0, 319.0, 531.0, 753.0, 1080.0, 1700.0, 2606.0, 3996.0, 6274.0, 9928.0, 16452.0, 27497.0, 46182.0, 81533.0, 146895.0, 268107.0, 469185.0, 720660.0, 822909.0, 652902.0, 401128.0, 223087.0, 121946.0, 68014.0, 38915.0, 22700.0, 13830.0, 8545.0, 5571.0, 3493.0, 2350.0, 1469.0, 1006.0, 650.0, 461.0, 333.0, 184.0, 154.0, 102.0, 53.0, 36.0, 19.0, 13.0, 10.0, 8.0, 8.0, 5.0, 1.0, 2.0, 2.0], "bins": [-49.96875, -48.423828125, -46.87890625, -45.333984375, -43.7890625, -42.244140625, -40.69921875, -39.154296875, -37.609375, -36.064453125, -34.51953125, -32.974609375, -31.4296875, -29.884765625, -28.33984375, -26.794921875, -25.25, -23.705078125, -22.16015625, -20.615234375, -19.0703125, -17.525390625, -15.98046875, -14.435546875, -12.890625, -11.345703125, -9.80078125, -8.255859375, -6.7109375, -5.166015625, -3.62109375, -2.076171875, -0.53125, 1.013671875, 2.55859375, 4.103515625, 5.6484375, 7.193359375, 8.73828125, 10.283203125, 11.828125, 13.373046875, 14.91796875, 16.462890625, 18.0078125, 19.552734375, 21.09765625, 22.642578125, 24.1875, 25.732421875, 27.27734375, 28.822265625, 30.3671875, 31.912109375, 33.45703125, 35.001953125, 36.546875, 38.091796875, 39.63671875, 41.181640625, 42.7265625, 44.271484375, 45.81640625, 47.361328125, 48.90625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 8.0, 6.0, 11.0, 12.0, 12.0, 20.0, 20.0, 15.0, 18.0, 22.0, 28.0, 42.0, 30.0, 40.0, 32.0, 36.0, 37.0, 39.0, 38.0, 46.0, 34.0, 42.0, 42.0, 42.0, 30.0, 32.0, 26.0, 38.0, 28.0, 36.0, 16.0, 25.0, 14.0, 11.0, 17.0, 9.0, 5.0, 7.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.828125, -30.668212890625, -29.50830078125, -28.348388671875, -27.1884765625, -26.028564453125, -24.86865234375, -23.708740234375, -22.548828125, -21.388916015625, -20.22900390625, -19.069091796875, -17.9091796875, -16.749267578125, -15.58935546875, -14.429443359375, -13.26953125, -12.109619140625, -10.94970703125, -9.789794921875, -8.6298828125, -7.469970703125, -6.31005859375, -5.150146484375, -3.990234375, -2.830322265625, -1.67041015625, -0.510498046875, 0.6494140625, 1.809326171875, 2.96923828125, 4.129150390625, 5.2890625, 6.448974609375, 7.60888671875, 8.768798828125, 9.9287109375, 11.088623046875, 12.24853515625, 13.408447265625, 14.568359375, 15.728271484375, 16.88818359375, 18.048095703125, 19.2080078125, 20.367919921875, 21.52783203125, 22.687744140625, 23.84765625, 25.007568359375, 26.16748046875, 27.327392578125, 28.4873046875, 29.647216796875, 30.80712890625, 31.967041015625, 33.126953125, 34.286865234375, 35.44677734375, 36.606689453125, 37.7666015625, 38.926513671875, 40.08642578125, 41.246337890625, 42.40625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 9.0, 12.0, 16.0, 44.0, 35.0, 63.0, 96.0, 145.0, 194.0, 303.0, 450.0, 683.0, 1046.0, 1460.0, 2396.0, 3542.0, 5780.0, 9231.0, 15165.0, 25463.0, 43901.0, 78367.0, 143495.0, 264683.0, 471872.0, 739594.0, 845637.0, 654338.0, 394083.0, 217299.0, 117321.0, 64934.0, 36254.0, 21615.0, 12874.0, 8021.0, 4873.0, 3071.0, 2060.0, 1264.0, 884.0, 605.0, 387.0, 248.0, 179.0, 104.0, 56.0, 39.0, 38.0, 29.0, 15.0, 9.0, 5.0, 1.0, 6.0, 0.0, 0.0, 1.0], "bins": [-63.15625, -61.203125, -59.25, -57.296875, -55.34375, -53.390625, -51.4375, -49.484375, -47.53125, -45.578125, -43.625, -41.671875, -39.71875, -37.765625, -35.8125, -33.859375, -31.90625, -29.953125, -28.0, -26.046875, -24.09375, -22.140625, -20.1875, -18.234375, -16.28125, -14.328125, -12.375, -10.421875, -8.46875, -6.515625, -4.5625, -2.609375, -0.65625, 1.296875, 3.25, 5.203125, 7.15625, 9.109375, 11.0625, 13.015625, 14.96875, 16.921875, 18.875, 20.828125, 22.78125, 24.734375, 26.6875, 28.640625, 30.59375, 32.546875, 34.5, 36.453125, 38.40625, 40.359375, 42.3125, 44.265625, 46.21875, 48.171875, 50.125, 52.078125, 54.03125, 55.984375, 57.9375, 59.890625, 61.84375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 7.0, 11.0, 13.0, 14.0, 22.0, 20.0, 38.0, 45.0, 47.0, 45.0, 53.0, 94.0, 110.0, 129.0, 148.0, 150.0, 176.0, 195.0, 185.0, 226.0, 200.0, 208.0, 208.0, 218.0, 197.0, 178.0, 169.0, 144.0, 124.0, 119.0, 111.0, 111.0, 60.0, 47.0, 42.0, 35.0, 30.0, 32.0, 32.0, 17.0, 19.0, 9.0, 10.0, 8.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-19.46875, -18.857666015625, -18.24658203125, -17.635498046875, -17.0244140625, -16.413330078125, -15.80224609375, -15.191162109375, -14.580078125, -13.968994140625, -13.35791015625, -12.746826171875, -12.1357421875, -11.524658203125, -10.91357421875, -10.302490234375, -9.69140625, -9.080322265625, -8.46923828125, -7.858154296875, -7.2470703125, -6.635986328125, -6.02490234375, -5.413818359375, -4.802734375, -4.191650390625, -3.58056640625, -2.969482421875, -2.3583984375, -1.747314453125, -1.13623046875, -0.525146484375, 0.0859375, 0.697021484375, 1.30810546875, 1.919189453125, 2.5302734375, 3.141357421875, 3.75244140625, 4.363525390625, 4.974609375, 5.585693359375, 6.19677734375, 6.807861328125, 7.4189453125, 8.030029296875, 8.64111328125, 9.252197265625, 9.86328125, 10.474365234375, 11.08544921875, 11.696533203125, 12.3076171875, 12.918701171875, 13.52978515625, 14.140869140625, 14.751953125, 15.363037109375, 15.97412109375, 16.585205078125, 17.1962890625, 17.807373046875, 18.41845703125, 19.029541015625, 19.640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 8.0, 4.0, 8.0, 17.0, 13.0, 18.0, 17.0, 33.0, 43.0, 56.0, 53.0, 69.0, 85.0, 83.0, 85.0, 88.0, 65.0, 58.0, 44.0, 33.0, 25.0, 31.0, 22.0, 7.0, 13.0, 11.0, 3.0, 7.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.51981353759766, -94.56147003173828, -91.6031265258789, -88.644775390625, -85.68643188476562, -82.72808837890625, -79.76974487304688, -76.8114013671875, -73.85305786132812, -70.89471435546875, -67.93637084960938, -64.97802734375, -62.019676208496094, -59.06133270263672, -56.102989196777344, -53.14464569091797, -50.18629455566406, -47.22795104980469, -44.26960372924805, -41.31126022338867, -38.35291290283203, -35.394569396972656, -32.43622589111328, -29.477880477905273, -26.519535064697266, -23.561189651489258, -20.60284423828125, -17.644500732421875, -14.686155319213867, -11.72780990600586, -8.769466400146484, -5.811120986938477, -2.8527679443359375, 0.10557699203491211, 3.0639219284057617, 6.022266387939453, 8.980611801147461, 11.938957214355469, 14.897300720214844, 17.85564613342285, 20.81399154663086, 23.772336959838867, 26.730682373046875, 29.68902587890625, 32.647369384765625, 35.605716705322266, 38.56406021118164, 41.52240753173828, 44.480751037597656, 47.43909454345703, 50.39744186401367, 53.35578536987305, 56.31413269042969, 59.27247619628906, 62.23081970214844, 65.18916320800781, 68.14750671386719, 71.10585021972656, 74.06419372558594, 77.02253723144531, 79.98088836669922, 82.9392318725586, 85.89757537841797, 88.85591888427734, 91.81427001953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 10.0, 4.0, 11.0, 6.0, 11.0, 11.0, 10.0, 14.0, 17.0, 13.0, 18.0, 23.0, 29.0, 21.0, 23.0, 23.0, 42.0, 27.0, 29.0, 31.0, 44.0, 32.0, 42.0, 38.0, 38.0, 30.0, 31.0, 26.0, 40.0, 31.0, 27.0, 30.0, 24.0, 21.0, 31.0, 16.0, 20.0, 16.0, 12.0, 12.0, 17.0, 9.0, 7.0, 5.0, 5.0, 6.0, 2.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0], "bins": [-40.53941345214844, -39.245582580566406, -37.951751708984375, -36.657920837402344, -35.36408996582031, -34.07026290893555, -32.776432037353516, -31.482601165771484, -30.188770294189453, -28.894939422607422, -27.60110855102539, -26.307279586791992, -25.01344871520996, -23.71961784362793, -22.42578887939453, -21.1319580078125, -19.83812713623047, -18.544296264648438, -17.250465393066406, -15.956636428833008, -14.662805557250977, -13.368974685668945, -12.07514476776123, -10.781314849853516, -9.487483978271484, -8.193653106689453, -6.899823188781738, -5.605992794036865, -4.312162399291992, -3.018332004547119, -1.724501609802246, -0.43067169189453125, 0.8631553649902344, 2.1569857597351074, 3.4508161544799805, 4.7446465492248535, 6.038476943969727, 7.3323073387146, 8.626137733459473, 9.919967651367188, 11.213798522949219, 12.50762939453125, 13.801459312438965, 15.09528923034668, 16.38912010192871, 17.682950973510742, 18.97677993774414, 20.270610809326172, 21.564441680908203, 22.858272552490234, 24.152103424072266, 25.445932388305664, 26.739763259887695, 28.033594131469727, 29.327423095703125, 30.621253967285156, 31.915084838867188, 33.20891571044922, 34.50274658203125, 35.79657745361328, 37.09040832519531, 38.38423538208008, 39.67806625366211, 40.97189712524414, 42.26572799682617]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 11.0, 8.0, 15.0, 13.0, 20.0, 36.0, 57.0, 102.0, 125.0, 181.0, 297.0, 506.0, 662.0, 1099.0, 1706.0, 2487.0, 4000.0, 6228.0, 9919.0, 15032.0, 23844.0, 38063.0, 60035.0, 90514.0, 128363.0, 158068.0, 154238.0, 121040.0, 83026.0, 54070.0, 34386.0, 21792.0, 13651.0, 8933.0, 5620.0, 3670.0, 2349.0, 1485.0, 988.0, 618.0, 445.0, 242.0, 189.0, 153.0, 97.0, 59.0, 38.0, 37.0, 18.0, 11.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0], "bins": [-23.15625, -22.43017578125, -21.7041015625, -20.97802734375, -20.251953125, -19.52587890625, -18.7998046875, -18.07373046875, -17.34765625, -16.62158203125, -15.8955078125, -15.16943359375, -14.443359375, -13.71728515625, -12.9912109375, -12.26513671875, -11.5390625, -10.81298828125, -10.0869140625, -9.36083984375, -8.634765625, -7.90869140625, -7.1826171875, -6.45654296875, -5.73046875, -5.00439453125, -4.2783203125, -3.55224609375, -2.826171875, -2.10009765625, -1.3740234375, -0.64794921875, 0.078125, 0.80419921875, 1.5302734375, 2.25634765625, 2.982421875, 3.70849609375, 4.4345703125, 5.16064453125, 5.88671875, 6.61279296875, 7.3388671875, 8.06494140625, 8.791015625, 9.51708984375, 10.2431640625, 10.96923828125, 11.6953125, 12.42138671875, 13.1474609375, 13.87353515625, 14.599609375, 15.32568359375, 16.0517578125, 16.77783203125, 17.50390625, 18.22998046875, 18.9560546875, 19.68212890625, 20.408203125, 21.13427734375, 21.8603515625, 22.58642578125, 23.3125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 1.0, 3.0, 4.0, 7.0, 8.0, 10.0, 11.0, 13.0, 21.0, 19.0, 19.0, 25.0, 31.0, 26.0, 28.0, 32.0, 29.0, 49.0, 33.0, 37.0, 39.0, 50.0, 44.0, 41.0, 53.0, 43.0, 32.0, 34.0, 38.0, 28.0, 33.0, 18.0, 30.0, 22.0, 20.0, 14.0, 13.0, 4.0, 13.0, 12.0, 5.0, 2.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.15625, -42.45556640625, -40.7548828125, -39.05419921875, -37.353515625, -35.65283203125, -33.9521484375, -32.25146484375, -30.55078125, -28.85009765625, -27.1494140625, -25.44873046875, -23.748046875, -22.04736328125, -20.3466796875, -18.64599609375, -16.9453125, -15.24462890625, -13.5439453125, -11.84326171875, -10.142578125, -8.44189453125, -6.7412109375, -5.04052734375, -3.33984375, -1.63916015625, 0.0615234375, 1.76220703125, 3.462890625, 5.16357421875, 6.8642578125, 8.56494140625, 10.265625, 11.96630859375, 13.6669921875, 15.36767578125, 17.068359375, 18.76904296875, 20.4697265625, 22.17041015625, 23.87109375, 25.57177734375, 27.2724609375, 28.97314453125, 30.673828125, 32.37451171875, 34.0751953125, 35.77587890625, 37.4765625, 39.17724609375, 40.8779296875, 42.57861328125, 44.279296875, 45.97998046875, 47.6806640625, 49.38134765625, 51.08203125, 52.78271484375, 54.4833984375, 56.18408203125, 57.884765625, 59.58544921875, 61.2861328125, 62.98681640625, 64.6875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 7.0, 7.0, 9.0, 13.0, 25.0, 39.0, 44.0, 62.0, 95.0, 140.0, 213.0, 316.0, 525.0, 791.0, 1137.0, 1833.0, 3110.0, 5152.0, 8703.0, 14567.0, 25149.0, 43391.0, 75283.0, 128126.0, 190683.0, 199891.0, 143617.0, 86605.0, 49394.0, 28484.0, 16455.0, 9662.0, 5662.0, 3376.0, 2170.0, 1313.0, 887.0, 533.0, 344.0, 241.0, 167.0, 98.0, 74.0, 48.0, 31.0, 24.0, 18.0, 12.0, 5.0, 9.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-30.703125, -29.716552734375, -28.72998046875, -27.743408203125, -26.7568359375, -25.770263671875, -24.78369140625, -23.797119140625, -22.810546875, -21.823974609375, -20.83740234375, -19.850830078125, -18.8642578125, -17.877685546875, -16.89111328125, -15.904541015625, -14.91796875, -13.931396484375, -12.94482421875, -11.958251953125, -10.9716796875, -9.985107421875, -8.99853515625, -8.011962890625, -7.025390625, -6.038818359375, -5.05224609375, -4.065673828125, -3.0791015625, -2.092529296875, -1.10595703125, -0.119384765625, 0.8671875, 1.853759765625, 2.84033203125, 3.826904296875, 4.8134765625, 5.800048828125, 6.78662109375, 7.773193359375, 8.759765625, 9.746337890625, 10.73291015625, 11.719482421875, 12.7060546875, 13.692626953125, 14.67919921875, 15.665771484375, 16.65234375, 17.638916015625, 18.62548828125, 19.612060546875, 20.5986328125, 21.585205078125, 22.57177734375, 23.558349609375, 24.544921875, 25.531494140625, 26.51806640625, 27.504638671875, 28.4912109375, 29.477783203125, 30.46435546875, 31.450927734375, 32.4375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 3.0, 6.0, 13.0, 12.0, 17.0, 12.0, 15.0, 15.0, 26.0, 21.0, 33.0, 31.0, 41.0, 28.0, 43.0, 41.0, 48.0, 48.0, 44.0, 44.0, 47.0, 36.0, 42.0, 44.0, 29.0, 24.0, 32.0, 29.0, 36.0, 27.0, 26.0, 10.0, 18.0, 15.0, 10.0, 8.0, 6.0, 6.0, 5.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.875, -32.78955078125, -31.7041015625, -30.61865234375, -29.533203125, -28.44775390625, -27.3623046875, -26.27685546875, -25.19140625, -24.10595703125, -23.0205078125, -21.93505859375, -20.849609375, -19.76416015625, -18.6787109375, -17.59326171875, -16.5078125, -15.42236328125, -14.3369140625, -13.25146484375, -12.166015625, -11.08056640625, -9.9951171875, -8.90966796875, -7.82421875, -6.73876953125, -5.6533203125, -4.56787109375, -3.482421875, -2.39697265625, -1.3115234375, -0.22607421875, 0.859375, 1.94482421875, 3.0302734375, 4.11572265625, 5.201171875, 6.28662109375, 7.3720703125, 8.45751953125, 9.54296875, 10.62841796875, 11.7138671875, 12.79931640625, 13.884765625, 14.97021484375, 16.0556640625, 17.14111328125, 18.2265625, 19.31201171875, 20.3974609375, 21.48291015625, 22.568359375, 23.65380859375, 24.7392578125, 25.82470703125, 26.91015625, 27.99560546875, 29.0810546875, 30.16650390625, 31.251953125, 32.33740234375, 33.4228515625, 34.50830078125, 35.59375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 7.0, 13.0, 19.0, 27.0, 37.0, 54.0, 93.0, 125.0, 198.0, 301.0, 446.0, 636.0, 934.0, 1472.0, 2182.0, 3644.0, 5605.0, 8975.0, 14483.0, 23600.0, 39109.0, 63970.0, 104936.0, 158950.0, 191547.0, 158177.0, 104125.0, 63822.0, 38399.0, 23383.0, 14341.0, 8945.0, 5696.0, 3557.0, 2291.0, 1477.0, 1014.0, 645.0, 437.0, 282.0, 186.0, 136.0, 83.0, 60.0, 48.0, 32.0, 14.0, 12.0, 11.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0], "bins": [-8.78125, -8.50244140625, -8.2236328125, -7.94482421875, -7.666015625, -7.38720703125, -7.1083984375, -6.82958984375, -6.55078125, -6.27197265625, -5.9931640625, -5.71435546875, -5.435546875, -5.15673828125, -4.8779296875, -4.59912109375, -4.3203125, -4.04150390625, -3.7626953125, -3.48388671875, -3.205078125, -2.92626953125, -2.6474609375, -2.36865234375, -2.08984375, -1.81103515625, -1.5322265625, -1.25341796875, -0.974609375, -0.69580078125, -0.4169921875, -0.13818359375, 0.140625, 0.41943359375, 0.6982421875, 0.97705078125, 1.255859375, 1.53466796875, 1.8134765625, 2.09228515625, 2.37109375, 2.64990234375, 2.9287109375, 3.20751953125, 3.486328125, 3.76513671875, 4.0439453125, 4.32275390625, 4.6015625, 4.88037109375, 5.1591796875, 5.43798828125, 5.716796875, 5.99560546875, 6.2744140625, 6.55322265625, 6.83203125, 7.11083984375, 7.3896484375, 7.66845703125, 7.947265625, 8.22607421875, 8.5048828125, 8.78369140625, 9.0625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 10.0, 8.0, 6.0, 7.0, 10.0, 19.0, 32.0, 44.0, 30.0, 57.0, 42.0, 63.0, 81.0, 98.0, 69.0, 82.0, 76.0, 57.0, 40.0, 43.0, 26.0, 26.0, 16.0, 16.0, 9.0, 11.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012483596801757812, -0.0012136027216911316, -0.001178845763206482, -0.0011440888047218323, -0.0011093318462371826, -0.001074574887752533, -0.0010398179292678833, -0.0010050609707832336, -0.000970304012298584, -0.0009355470538139343, -0.0009007900953292847, -0.000866033136844635, -0.0008312761783599854, -0.0007965192198753357, -0.000761762261390686, -0.0007270053029060364, -0.0006922483444213867, -0.0006574913859367371, -0.0006227344274520874, -0.0005879774689674377, -0.0005532205104827881, -0.0005184635519981384, -0.00048370659351348877, -0.0004489496350288391, -0.00041419267654418945, -0.0003794357180595398, -0.00034467875957489014, -0.0003099218010902405, -0.0002751648426055908, -0.00024040788412094116, -0.0002056509256362915, -0.00017089396715164185, -0.0001361370086669922, -0.00010138005018234253, -6.662309169769287e-05, -3.186613321304321e-05, 2.8908252716064453e-06, 3.7647783756256104e-05, 7.240474224090576e-05, 0.00010716170072555542, 0.00014191865921020508, 0.00017667561769485474, 0.0002114325761795044, 0.00024618953466415405, 0.0002809464931488037, 0.00031570345163345337, 0.00035046041011810303, 0.0003852173686027527, 0.00041997432708740234, 0.000454731285572052, 0.0004894882440567017, 0.0005242452025413513, 0.000559002161026001, 0.0005937591195106506, 0.0006285160779953003, 0.00066327303647995, 0.0006980299949645996, 0.0007327869534492493, 0.0007675439119338989, 0.0008023008704185486, 0.0008370578289031982, 0.0008718147873878479, 0.0009065717458724976, 0.0009413287043571472, 0.0009760856628417969]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 7.0, 9.0, 13.0, 17.0, 20.0, 35.0, 71.0, 107.0, 166.0, 227.0, 333.0, 545.0, 813.0, 1375.0, 2061.0, 3314.0, 5441.0, 9064.0, 15507.0, 26782.0, 46910.0, 82158.0, 142163.0, 208682.0, 199166.0, 129089.0, 73300.0, 41726.0, 24062.0, 13899.0, 8214.0, 5050.0, 3006.0, 1896.0, 1217.0, 749.0, 443.0, 318.0, 204.0, 126.0, 102.0, 54.0, 35.0, 30.0, 22.0, 15.0, 5.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.381591796875, -10.95849609375, -10.535400390625, -10.1123046875, -9.689208984375, -9.26611328125, -8.843017578125, -8.419921875, -7.996826171875, -7.57373046875, -7.150634765625, -6.7275390625, -6.304443359375, -5.88134765625, -5.458251953125, -5.03515625, -4.612060546875, -4.18896484375, -3.765869140625, -3.3427734375, -2.919677734375, -2.49658203125, -2.073486328125, -1.650390625, -1.227294921875, -0.80419921875, -0.381103515625, 0.0419921875, 0.465087890625, 0.88818359375, 1.311279296875, 1.734375, 2.157470703125, 2.58056640625, 3.003662109375, 3.4267578125, 3.849853515625, 4.27294921875, 4.696044921875, 5.119140625, 5.542236328125, 5.96533203125, 6.388427734375, 6.8115234375, 7.234619140625, 7.65771484375, 8.080810546875, 8.50390625, 8.927001953125, 9.35009765625, 9.773193359375, 10.1962890625, 10.619384765625, 11.04248046875, 11.465576171875, 11.888671875, 12.311767578125, 12.73486328125, 13.157958984375, 13.5810546875, 14.004150390625, 14.42724609375, 14.850341796875, 15.2734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 11.0, 17.0, 22.0, 18.0, 24.0, 26.0, 38.0, 44.0, 40.0, 48.0, 57.0, 63.0, 61.0, 60.0, 60.0, 56.0, 60.0, 43.0, 31.0, 29.0, 26.0, 14.0, 24.0, 25.0, 25.0, 10.0, 11.0, 7.0, 2.0, 2.0, 7.0, 6.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.078125, -3.92657470703125, -3.7750244140625, -3.62347412109375, -3.471923828125, -3.32037353515625, -3.1688232421875, -3.01727294921875, -2.86572265625, -2.71417236328125, -2.5626220703125, -2.41107177734375, -2.259521484375, -2.10797119140625, -1.9564208984375, -1.80487060546875, -1.6533203125, -1.50177001953125, -1.3502197265625, -1.19866943359375, -1.047119140625, -0.89556884765625, -0.7440185546875, -0.59246826171875, -0.44091796875, -0.28936767578125, -0.1378173828125, 0.01373291015625, 0.165283203125, 0.31683349609375, 0.4683837890625, 0.61993408203125, 0.771484375, 0.92303466796875, 1.0745849609375, 1.22613525390625, 1.377685546875, 1.52923583984375, 1.6807861328125, 1.83233642578125, 1.98388671875, 2.13543701171875, 2.2869873046875, 2.43853759765625, 2.590087890625, 2.74163818359375, 2.8931884765625, 3.04473876953125, 3.1962890625, 3.34783935546875, 3.4993896484375, 3.65093994140625, 3.802490234375, 3.95404052734375, 4.1055908203125, 4.25714111328125, 4.40869140625, 4.56024169921875, 4.7117919921875, 4.86334228515625, 5.014892578125, 5.16644287109375, 5.3179931640625, 5.46954345703125, 5.62109375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 12.0, 5.0, 16.0, 17.0, 18.0, 20.0, 36.0, 50.0, 54.0, 66.0, 76.0, 76.0, 92.0, 92.0, 78.0, 53.0, 58.0, 34.0, 28.0, 33.0, 27.0, 10.0, 14.0, 10.0, 7.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.11541748046875, -97.12666320800781, -94.13790893554688, -91.1491470336914, -88.16039276123047, -85.17163848876953, -82.18287658691406, -79.19412231445312, -76.20536804199219, -73.21661376953125, -70.22785949707031, -67.23909759521484, -64.2503433227539, -61.26158905029297, -58.272830963134766, -55.28407287597656, -52.295318603515625, -49.30656433105469, -46.317806243896484, -43.32904815673828, -40.340293884277344, -37.351539611816406, -34.3627815246582, -31.374025344848633, -28.385269165039062, -25.396512985229492, -22.407756805419922, -19.41900062561035, -16.43024444580078, -13.441488265991211, -10.45273208618164, -7.46397590637207, -4.475227355957031, -1.486471176147461, 1.5022850036621094, 4.49104118347168, 7.47979736328125, 10.46855354309082, 13.45730972290039, 16.44606590270996, 19.43482208251953, 22.4235782623291, 25.412334442138672, 28.401090621948242, 31.389846801757812, 34.37860107421875, 37.36735916137695, 40.356117248535156, 43.344871520996094, 46.33362579345703, 49.322383880615234, 52.31114196777344, 55.299896240234375, 58.28865051269531, 61.277408599853516, 64.26616668701172, 67.25492095947266, 70.2436752319336, 73.23243713378906, 76.22119140625, 79.20994567871094, 82.19869995117188, 85.18745422363281, 88.17621612548828, 91.16497039794922]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 4.0, 6.0, 12.0, 10.0, 8.0, 10.0, 11.0, 10.0, 14.0, 13.0, 20.0, 18.0, 21.0, 27.0, 31.0, 22.0, 22.0, 31.0, 33.0, 30.0, 31.0, 29.0, 48.0, 41.0, 37.0, 35.0, 34.0, 38.0, 34.0, 29.0, 33.0, 26.0, 20.0, 23.0, 28.0, 18.0, 24.0, 20.0, 14.0, 16.0, 15.0, 10.0, 9.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-38.84930419921875, -37.54950714111328, -36.24971389770508, -34.94991683959961, -33.650123596191406, -32.35032653808594, -31.050533294677734, -29.750736236572266, -28.450942993164062, -27.151147842407227, -25.85135269165039, -24.551557540893555, -23.25176239013672, -21.951967239379883, -20.652172088623047, -19.352375030517578, -18.052579879760742, -16.752784729003906, -15.45298957824707, -14.153194427490234, -12.853399276733398, -11.553604125976562, -10.25380802154541, -8.954012870788574, -7.654217720031738, -6.354422569274902, -5.054627418518066, -3.7548317909240723, -2.4550366401672363, -1.1552414894104004, 0.14455413818359375, 1.4443492889404297, 2.7441444396972656, 4.043939590454102, 5.3437347412109375, 6.643530368804932, 7.943325519561768, 9.243120193481445, 10.542916297912598, 11.842711448669434, 13.14250659942627, 14.442301750183105, 15.742096900939941, 17.041893005371094, 18.34168815612793, 19.641483306884766, 20.9412784576416, 22.241073608398438, 23.540868759155273, 24.84066390991211, 26.140459060668945, 27.44025421142578, 28.740049362182617, 30.039844512939453, 31.339641571044922, 32.639434814453125, 33.939231872558594, 35.23902893066406, 36.538822174072266, 37.838619232177734, 39.13841247558594, 40.438209533691406, 41.73800277709961, 43.03779983520508, 44.33759307861328]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 1.0, 3.0, 1.0, 9.0, 13.0, 16.0, 11.0, 27.0, 28.0, 51.0, 70.0, 87.0, 144.0, 254.0, 386.0, 550.0, 875.0, 1523.0, 2426.0, 4042.0, 7000.0, 11859.0, 20724.0, 36180.0, 62275.0, 101615.0, 146099.0, 174355.0, 163199.0, 122250.0, 79526.0, 47484.0, 27548.0, 15570.0, 9018.0, 5272.0, 3043.0, 1844.0, 1137.0, 704.0, 448.0, 311.0, 219.0, 145.0, 74.0, 48.0, 34.0, 21.0, 15.0, 9.0, 8.0, 8.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-61.46875, -59.64697265625, -57.8251953125, -56.00341796875, -54.181640625, -52.35986328125, -50.5380859375, -48.71630859375, -46.89453125, -45.07275390625, -43.2509765625, -41.42919921875, -39.607421875, -37.78564453125, -35.9638671875, -34.14208984375, -32.3203125, -30.49853515625, -28.6767578125, -26.85498046875, -25.033203125, -23.21142578125, -21.3896484375, -19.56787109375, -17.74609375, -15.92431640625, -14.1025390625, -12.28076171875, -10.458984375, -8.63720703125, -6.8154296875, -4.99365234375, -3.171875, -1.35009765625, 0.4716796875, 2.29345703125, 4.115234375, 5.93701171875, 7.7587890625, 9.58056640625, 11.40234375, 13.22412109375, 15.0458984375, 16.86767578125, 18.689453125, 20.51123046875, 22.3330078125, 24.15478515625, 25.9765625, 27.79833984375, 29.6201171875, 31.44189453125, 33.263671875, 35.08544921875, 36.9072265625, 38.72900390625, 40.55078125, 42.37255859375, 44.1943359375, 46.01611328125, 47.837890625, 49.65966796875, 51.4814453125, 53.30322265625, 55.125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 2.0, 7.0, 8.0, 12.0, 13.0, 11.0, 15.0, 10.0, 14.0, 20.0, 23.0, 22.0, 32.0, 21.0, 38.0, 25.0, 25.0, 34.0, 36.0, 37.0, 29.0, 40.0, 39.0, 52.0, 36.0, 40.0, 43.0, 27.0, 30.0, 34.0, 24.0, 19.0, 28.0, 25.0, 25.0, 14.0, 18.0, 15.0, 12.0, 9.0, 9.0, 1.0, 3.0, 7.0, 4.0, 6.0, 1.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-42.5625, -41.16552734375, -39.7685546875, -38.37158203125, -36.974609375, -35.57763671875, -34.1806640625, -32.78369140625, -31.38671875, -29.98974609375, -28.5927734375, -27.19580078125, -25.798828125, -24.40185546875, -23.0048828125, -21.60791015625, -20.2109375, -18.81396484375, -17.4169921875, -16.02001953125, -14.623046875, -13.22607421875, -11.8291015625, -10.43212890625, -9.03515625, -7.63818359375, -6.2412109375, -4.84423828125, -3.447265625, -2.05029296875, -0.6533203125, 0.74365234375, 2.140625, 3.53759765625, 4.9345703125, 6.33154296875, 7.728515625, 9.12548828125, 10.5224609375, 11.91943359375, 13.31640625, 14.71337890625, 16.1103515625, 17.50732421875, 18.904296875, 20.30126953125, 21.6982421875, 23.09521484375, 24.4921875, 25.88916015625, 27.2861328125, 28.68310546875, 30.080078125, 31.47705078125, 32.8740234375, 34.27099609375, 35.66796875, 37.06494140625, 38.4619140625, 39.85888671875, 41.255859375, 42.65283203125, 44.0498046875, 45.44677734375, 46.84375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 9.0, 11.0, 14.0, 19.0, 20.0, 26.0, 36.0, 35.0, 58.0, 85.0, 135.0, 151.0, 212.0, 358.0, 553.0, 1035.0, 1752.0, 3632.0, 7836.0, 19177.0, 49595.0, 128129.0, 265434.0, 295772.0, 163987.0, 65408.0, 25157.0, 10024.0, 4603.0, 2195.0, 1169.0, 655.0, 403.0, 246.0, 181.0, 109.0, 80.0, 63.0, 50.0, 39.0, 21.0, 21.0, 9.0, 11.0, 7.0, 10.0, 4.0, 8.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-124.875, -120.865234375, -116.85546875, -112.845703125, -108.8359375, -104.826171875, -100.81640625, -96.806640625, -92.796875, -88.787109375, -84.77734375, -80.767578125, -76.7578125, -72.748046875, -68.73828125, -64.728515625, -60.71875, -56.708984375, -52.69921875, -48.689453125, -44.6796875, -40.669921875, -36.66015625, -32.650390625, -28.640625, -24.630859375, -20.62109375, -16.611328125, -12.6015625, -8.591796875, -4.58203125, -0.572265625, 3.4375, 7.447265625, 11.45703125, 15.466796875, 19.4765625, 23.486328125, 27.49609375, 31.505859375, 35.515625, 39.525390625, 43.53515625, 47.544921875, 51.5546875, 55.564453125, 59.57421875, 63.583984375, 67.59375, 71.603515625, 75.61328125, 79.623046875, 83.6328125, 87.642578125, 91.65234375, 95.662109375, 99.671875, 103.681640625, 107.69140625, 111.701171875, 115.7109375, 119.720703125, 123.73046875, 127.740234375, 131.75]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 12.0, 12.0, 13.0, 9.0, 10.0, 11.0, 16.0, 20.0, 17.0, 22.0, 30.0, 35.0, 29.0, 34.0, 44.0, 32.0, 41.0, 38.0, 37.0, 48.0, 30.0, 45.0, 39.0, 38.0, 38.0, 47.0, 39.0, 36.0, 25.0, 23.0, 14.0, 29.0, 12.0, 7.0, 14.0, 12.0, 10.0, 2.0, 6.0, 4.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-31.859375, -30.812744140625, -29.76611328125, -28.719482421875, -27.6728515625, -26.626220703125, -25.57958984375, -24.532958984375, -23.486328125, -22.439697265625, -21.39306640625, -20.346435546875, -19.2998046875, -18.253173828125, -17.20654296875, -16.159912109375, -15.11328125, -14.066650390625, -13.02001953125, -11.973388671875, -10.9267578125, -9.880126953125, -8.83349609375, -7.786865234375, -6.740234375, -5.693603515625, -4.64697265625, -3.600341796875, -2.5537109375, -1.507080078125, -0.46044921875, 0.586181640625, 1.6328125, 2.679443359375, 3.72607421875, 4.772705078125, 5.8193359375, 6.865966796875, 7.91259765625, 8.959228515625, 10.005859375, 11.052490234375, 12.09912109375, 13.145751953125, 14.1923828125, 15.239013671875, 16.28564453125, 17.332275390625, 18.37890625, 19.425537109375, 20.47216796875, 21.518798828125, 22.5654296875, 23.612060546875, 24.65869140625, 25.705322265625, 26.751953125, 27.798583984375, 28.84521484375, 29.891845703125, 30.9384765625, 31.985107421875, 33.03173828125, 34.078369140625, 35.125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 15.0, 12.0, 31.0, 27.0, 49.0, 55.0, 92.0, 123.0, 197.0, 251.0, 424.0, 649.0, 1056.0, 1655.0, 2674.0, 4333.0, 7024.0, 11948.0, 20372.0, 35896.0, 64035.0, 108222.0, 165380.0, 195544.0, 165541.0, 109967.0, 64609.0, 36510.0, 20760.0, 12074.0, 7236.0, 4381.0, 2578.0, 1718.0, 1084.0, 695.0, 478.0, 267.0, 189.0, 122.0, 85.0, 58.0, 37.0, 22.0, 24.0, 12.0, 8.0, 11.0, 8.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.576171875, -31.43359375, -30.291015625, -29.1484375, -28.005859375, -26.86328125, -25.720703125, -24.578125, -23.435546875, -22.29296875, -21.150390625, -20.0078125, -18.865234375, -17.72265625, -16.580078125, -15.4375, -14.294921875, -13.15234375, -12.009765625, -10.8671875, -9.724609375, -8.58203125, -7.439453125, -6.296875, -5.154296875, -4.01171875, -2.869140625, -1.7265625, -0.583984375, 0.55859375, 1.701171875, 2.84375, 3.986328125, 5.12890625, 6.271484375, 7.4140625, 8.556640625, 9.69921875, 10.841796875, 11.984375, 13.126953125, 14.26953125, 15.412109375, 16.5546875, 17.697265625, 18.83984375, 19.982421875, 21.125, 22.267578125, 23.41015625, 24.552734375, 25.6953125, 26.837890625, 27.98046875, 29.123046875, 30.265625, 31.408203125, 32.55078125, 33.693359375, 34.8359375, 35.978515625, 37.12109375, 38.263671875, 39.40625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 7.0, 6.0, 8.0, 10.0, 19.0, 24.0, 32.0, 42.0, 58.0, 90.0, 105.0, 113.0, 122.0, 93.0, 62.0, 68.0, 41.0, 33.0, 19.0, 13.0, 10.0, 8.0, 10.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004047393798828125, -0.003861725330352783, -0.0036760568618774414, -0.0034903883934020996, -0.003304719924926758, -0.003119051456451416, -0.0029333829879760742, -0.0027477145195007324, -0.0025620460510253906, -0.002376377582550049, -0.002190709114074707, -0.0020050406455993652, -0.0018193721771240234, -0.0016337037086486816, -0.0014480352401733398, -0.001262366771697998, -0.0010766983032226562, -0.0008910298347473145, -0.0007053613662719727, -0.0005196928977966309, -0.00033402442932128906, -0.00014835596084594727, 3.731250762939453e-05, 0.00022298097610473633, 0.0004086494445800781, 0.0005943179130554199, 0.0007799863815307617, 0.0009656548500061035, 0.0011513233184814453, 0.0013369917869567871, 0.001522660255432129, 0.0017083287239074707, 0.0018939971923828125, 0.0020796656608581543, 0.002265334129333496, 0.002451002597808838, 0.0026366710662841797, 0.0028223395347595215, 0.0030080080032348633, 0.003193676471710205, 0.003379344940185547, 0.0035650134086608887, 0.0037506818771362305, 0.003936350345611572, 0.004122018814086914, 0.004307687282562256, 0.004493355751037598, 0.0046790242195129395, 0.004864692687988281, 0.005050361156463623, 0.005236029624938965, 0.005421698093414307, 0.0056073665618896484, 0.00579303503036499, 0.005978703498840332, 0.006164371967315674, 0.006350040435791016, 0.006535708904266357, 0.006721377372741699, 0.006907045841217041, 0.007092714309692383, 0.007278382778167725, 0.007464051246643066, 0.007649719715118408, 0.00783538818359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 8.0, 16.0, 16.0, 20.0, 39.0, 58.0, 60.0, 115.0, 148.0, 246.0, 379.0, 578.0, 925.0, 1427.0, 2145.0, 3564.0, 5609.0, 8796.0, 14250.0, 23277.0, 39551.0, 65415.0, 107063.0, 159320.0, 186933.0, 158346.0, 105937.0, 63938.0, 38792.0, 23280.0, 14159.0, 8843.0, 5523.0, 3604.0, 2212.0, 1401.0, 873.0, 608.0, 371.0, 242.0, 165.0, 100.0, 65.0, 47.0, 27.0, 18.0, 22.0, 9.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.5625, -33.46484375, -32.3671875, -31.26953125, -30.171875, -29.07421875, -27.9765625, -26.87890625, -25.78125, -24.68359375, -23.5859375, -22.48828125, -21.390625, -20.29296875, -19.1953125, -18.09765625, -17.0, -15.90234375, -14.8046875, -13.70703125, -12.609375, -11.51171875, -10.4140625, -9.31640625, -8.21875, -7.12109375, -6.0234375, -4.92578125, -3.828125, -2.73046875, -1.6328125, -0.53515625, 0.5625, 1.66015625, 2.7578125, 3.85546875, 4.953125, 6.05078125, 7.1484375, 8.24609375, 9.34375, 10.44140625, 11.5390625, 12.63671875, 13.734375, 14.83203125, 15.9296875, 17.02734375, 18.125, 19.22265625, 20.3203125, 21.41796875, 22.515625, 23.61328125, 24.7109375, 25.80859375, 26.90625, 28.00390625, 29.1015625, 30.19921875, 31.296875, 32.39453125, 33.4921875, 34.58984375, 35.6875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 1.0, 3.0, 5.0, 9.0, 14.0, 12.0, 17.0, 15.0, 10.0, 22.0, 28.0, 30.0, 35.0, 36.0, 36.0, 37.0, 38.0, 51.0, 58.0, 44.0, 43.0, 47.0, 55.0, 43.0, 43.0, 28.0, 31.0, 26.0, 27.0, 31.0, 18.0, 18.0, 11.0, 16.0, 10.0, 14.0, 10.0, 7.0, 5.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.8046875, -9.4984130859375, -9.192138671875, -8.8858642578125, -8.57958984375, -8.2733154296875, -7.967041015625, -7.6607666015625, -7.3544921875, -7.0482177734375, -6.741943359375, -6.4356689453125, -6.12939453125, -5.8231201171875, -5.516845703125, -5.2105712890625, -4.904296875, -4.5980224609375, -4.291748046875, -3.9854736328125, -3.67919921875, -3.3729248046875, -3.066650390625, -2.7603759765625, -2.4541015625, -2.1478271484375, -1.841552734375, -1.5352783203125, -1.22900390625, -0.9227294921875, -0.616455078125, -0.3101806640625, -0.00390625, 0.3023681640625, 0.608642578125, 0.9149169921875, 1.22119140625, 1.5274658203125, 1.833740234375, 2.1400146484375, 2.4462890625, 2.7525634765625, 3.058837890625, 3.3651123046875, 3.67138671875, 3.9776611328125, 4.283935546875, 4.5902099609375, 4.896484375, 5.2027587890625, 5.509033203125, 5.8153076171875, 6.12158203125, 6.4278564453125, 6.734130859375, 7.0404052734375, 7.3466796875, 7.6529541015625, 7.959228515625, 8.2655029296875, 8.57177734375, 8.8780517578125, 9.184326171875, 9.4906005859375, 9.796875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 5.0, 16.0, 15.0, 17.0, 24.0, 34.0, 55.0, 39.0, 46.0, 69.0, 62.0, 86.0, 73.0, 70.0, 76.0, 58.0, 53.0, 33.0, 37.0, 26.0, 21.0, 21.0, 13.0, 12.0, 12.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.44152069091797, -102.274658203125, -99.10779571533203, -95.94093322753906, -92.77406311035156, -89.6072006225586, -86.44033813476562, -83.27347564697266, -80.10661315917969, -76.93975067138672, -73.77288818359375, -70.60601806640625, -67.43915557861328, -64.27229309082031, -61.105430603027344, -57.938568115234375, -54.771697998046875, -51.604835510253906, -48.43796920776367, -45.2711067199707, -42.10424041748047, -38.9373779296875, -35.77051544189453, -32.60365295410156, -29.436786651611328, -26.269922256469727, -23.103057861328125, -19.936195373535156, -16.769330978393555, -13.602466583251953, -10.435604095458984, -7.268739700317383, -4.1018829345703125, -0.9350190162658691, 2.231844902038574, 5.398708343505859, 8.565572738647461, 11.732437133789062, 14.899299621582031, 18.066164016723633, 21.233028411865234, 24.399892807006836, 27.566757202148438, 30.733619689941406, 33.900482177734375, 37.06734848022461, 40.23421096801758, 43.40107727050781, 46.56793975830078, 49.73480224609375, 52.901668548583984, 56.06853103637695, 59.23539733886719, 62.402259826660156, 65.56912231445312, 68.7359848022461, 71.90284729003906, 75.06970977783203, 78.236572265625, 81.4034423828125, 84.57030487060547, 87.73716735839844, 90.9040298461914, 94.07089233398438, 97.23776245117188]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 7.0, 12.0, 9.0, 10.0, 20.0, 20.0, 12.0, 19.0, 23.0, 21.0, 32.0, 25.0, 21.0, 31.0, 30.0, 29.0, 32.0, 44.0, 45.0, 45.0, 34.0, 41.0, 29.0, 43.0, 36.0, 36.0, 30.0, 26.0, 22.0, 27.0, 26.0, 17.0, 20.0, 17.0, 14.0, 8.0, 11.0, 9.0, 10.0, 12.0, 8.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-51.89430236816406, -50.25565719604492, -48.61701583862305, -46.978370666503906, -45.339725494384766, -43.701080322265625, -42.06243896484375, -40.42379379272461, -38.78514862060547, -37.14650344848633, -35.50786209106445, -33.86921691894531, -32.23057174682617, -30.591928482055664, -28.953285217285156, -27.314640045166016, -25.675996780395508, -24.037353515625, -22.39870834350586, -20.76006507873535, -19.12141990661621, -17.482776641845703, -15.844132423400879, -14.205488204956055, -12.56684398651123, -10.928199768066406, -9.289555549621582, -7.650911808013916, -6.012267589569092, -4.373623847961426, -2.7349796295166016, -1.0963354110717773, 0.5423088073730469, 2.180953025817871, 3.819597005844116, 5.458240985870361, 7.0968852043151855, 8.735528945922852, 10.374173164367676, 12.0128173828125, 13.651461601257324, 15.290105819702148, 16.928749084472656, 18.567394256591797, 20.206037521362305, 21.844680786132812, 23.483325958251953, 25.121971130371094, 26.7606143951416, 28.39925765991211, 30.03790283203125, 31.676546096801758, 33.315189361572266, 34.953834533691406, 36.59247970581055, 38.23112487792969, 39.86976623535156, 41.5084114074707, 43.14705276489258, 44.78569793701172, 46.42434310913086, 48.06298828125, 49.701629638671875, 51.340274810791016, 52.978919982910156]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 0.0, 6.0, 6.0, 7.0, 4.0, 12.0, 10.0, 12.0, 17.0, 18.0, 26.0, 27.0, 30.0, 52.0, 43.0, 74.0, 73.0, 104.0, 130.0, 204.0, 280.0, 387.0, 661.0, 1000.0, 1715.0, 1039945.0, 1977.0, 1232.0, 757.0, 510.0, 330.0, 210.0, 146.0, 136.0, 82.0, 68.0, 70.0, 54.0, 39.0, 27.0, 21.0, 20.0, 13.0, 17.0, 17.0, 11.0, 8.0, 9.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1530.567626953125, -1483.7633056640625, -1436.958984375, -1390.1546630859375, -1343.350341796875, -1296.546142578125, -1249.7418212890625, -1202.9375, -1156.1331787109375, -1109.328857421875, -1062.5245361328125, -1015.7202758789062, -968.9159545898438, -922.1116333007812, -875.307373046875, -828.5030517578125, -781.69873046875, -734.8944091796875, -688.090087890625, -641.2858276367188, -594.4815063476562, -547.6771850585938, -500.8728942871094, -454.068603515625, -407.2642822265625, -360.4599609375, -313.6556701660156, -266.85137939453125, -220.04705810546875, -173.2427520751953, -126.43844604492188, -79.6341552734375, -32.8299560546875, 13.974349975585938, 60.778656005859375, 107.58296203613281, 154.38726806640625, 201.1915740966797, 247.99588012695312, 294.8001708984375, 341.6044921875, 388.4088134765625, 435.2131042480469, 482.01739501953125, 528.8217163085938, 575.6260375976562, 622.4302978515625, 669.234619140625, 716.0389404296875, 762.84326171875, 809.6475830078125, 856.4518432617188, 903.2561645507812, 950.0604858398438, 996.86474609375, 1043.6690673828125, 1090.473388671875, 1137.2777099609375, 1184.08203125, 1230.8863525390625, 1277.690673828125, 1324.494873046875, 1371.2991943359375, 1418.103515625, 1464.9078369140625]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 9.0, 5.0, 15.0, 8.0, 12.0, 10.0, 18.0, 23.0, 28.0, 28.0, 40.0, 54.0, 73.0, 118.0, 126.0, 184.0, 297.0, 437.0, 916.0, 1993.0, 4100.0, 8268.0, 51412228.0, 28069.0, 7004.0, 3467.0, 1603.0, 772.0, 422.0, 279.0, 172.0, 134.0, 98.0, 70.0, 53.0, 27.0, 33.0, 26.0, 15.0, 22.0, 11.0, 16.0, 9.0, 14.0, 9.0, 6.0, 5.0, 1.0, 2.0, 3.0, 3.0, 3.0], "bins": [-1515.934814453125, -1472.479736328125, -1429.024658203125, -1385.569580078125, -1342.114501953125, -1298.659423828125, -1255.204345703125, -1211.7491455078125, -1168.2940673828125, -1124.8389892578125, -1081.3839111328125, -1037.9288330078125, -994.4736938476562, -951.0186157226562, -907.5635375976562, -864.1083984375, -820.6533813476562, -777.1983032226562, -733.7432250976562, -690.2880859375, -646.8330078125, -603.3779296875, -559.9228515625, -516.4677734375, -473.0126647949219, -429.5575866699219, -386.10247802734375, -342.64739990234375, -299.19232177734375, -255.73721313476562, -212.28213500976562, -168.8270263671875, -125.3719482421875, -81.91685485839844, -38.461769104003906, 4.993316650390625, 48.44841003417969, 91.90350341796875, 135.35858154296875, 178.81369018554688, 222.26876831054688, 265.7238464355469, 309.178955078125, 352.634033203125, 396.089111328125, 439.5442199707031, 482.9992980957031, 526.4544067382812, 569.9094848632812, 613.3645629882812, 656.8196411132812, 700.2747802734375, 743.7298583984375, 787.1849365234375, 830.6400146484375, 874.0950927734375, 917.5501708984375, 961.0052490234375, 1004.4603271484375, 1047.9154052734375, 1091.3704833984375, 1134.82568359375, 1178.28076171875, 1221.73583984375, 1265.19091796875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 7.0, 2.0, 10.0, 12.0, 15.0, 22.0, 42.0, 53.0, 84.0, 126.0, 194.0, 272.0, 412.0, 635.0, 1024.0, 1691.0, 2587.0, 4134.0, 6605.0, 11239.0, 19040.0, 32331.0, 54701.0, 92916.0, 160370.0, 275128.0, 504898.0, 1070135.0, 1816356.0, 1065625.0, 503003.0, 275678.0, 160882.0, 94058.0, 55076.0, 32460.0, 19455.0, 11479.0, 6920.0, 4250.0, 2854.0, 1663.0, 1045.0, 637.0, 468.0, 301.0, 185.0, 132.0, 76.0, 58.0, 40.0, 24.0, 19.0, 10.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0], "bins": [-38.5, -37.3154296875, -36.130859375, -34.9462890625, -33.76171875, -32.5771484375, -31.392578125, -30.2080078125, -29.0234375, -27.8388671875, -26.654296875, -25.4697265625, -24.28515625, -23.1005859375, -21.916015625, -20.7314453125, -19.546875, -18.3623046875, -17.177734375, -15.9931640625, -14.80859375, -13.6240234375, -12.439453125, -11.2548828125, -10.0703125, -8.8857421875, -7.701171875, -6.5166015625, -5.33203125, -4.1474609375, -2.962890625, -1.7783203125, -0.59375, 0.5908203125, 1.775390625, 2.9599609375, 4.14453125, 5.3291015625, 6.513671875, 7.6982421875, 8.8828125, 10.0673828125, 11.251953125, 12.4365234375, 13.62109375, 14.8056640625, 15.990234375, 17.1748046875, 18.359375, 19.5439453125, 20.728515625, 21.9130859375, 23.09765625, 24.2822265625, 25.466796875, 26.6513671875, 27.8359375, 29.0205078125, 30.205078125, 31.3896484375, 32.57421875, 33.7587890625, 34.943359375, 36.1279296875, 37.3125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 11.0, 6.0, 6.0, 9.0, 7.0, 11.0, 23.0, 22.0, 21.0, 25.0, 26.0, 26.0, 31.0, 51.0, 46.0, 64.0, 75.0, 139.0, 151.0, 197.0, 232.0, 184.0, 145.0, 111.0, 74.0, 51.0, 51.0, 40.0, 24.0, 26.0, 29.0, 19.0, 22.0, 23.0, 9.0, 9.0, 10.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.046875, -28.935302734375, -27.82373046875, -26.712158203125, -25.6005859375, -24.489013671875, -23.37744140625, -22.265869140625, -21.154296875, -20.042724609375, -18.93115234375, -17.819580078125, -16.7080078125, -15.596435546875, -14.48486328125, -13.373291015625, -12.26171875, -11.150146484375, -10.03857421875, -8.927001953125, -7.8154296875, -6.703857421875, -5.59228515625, -4.480712890625, -3.369140625, -2.257568359375, -1.14599609375, -0.034423828125, 1.0771484375, 2.188720703125, 3.30029296875, 4.411865234375, 5.5234375, 6.635009765625, 7.74658203125, 8.858154296875, 9.9697265625, 11.081298828125, 12.19287109375, 13.304443359375, 14.416015625, 15.527587890625, 16.63916015625, 17.750732421875, 18.8623046875, 19.973876953125, 21.08544921875, 22.197021484375, 23.30859375, 24.420166015625, 25.53173828125, 26.643310546875, 27.7548828125, 28.866455078125, 29.97802734375, 31.089599609375, 32.201171875, 33.312744140625, 34.42431640625, 35.535888671875, 36.6474609375, 37.759033203125, 38.87060546875, 39.982177734375, 41.09375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 6.0, 4.0, 7.0, 8.0, 20.0, 27.0, 26.0, 28.0, 54.0, 71.0, 123.0, 195.0, 283.0, 456.0, 758.0, 1173.0, 1792.0, 2958.0, 4594.0, 7335.0, 11349.0, 17795.0, 28212.0, 43169.0, 66884.0, 100937.0, 150691.0, 221127.0, 333687.0, 617002.0, 1534858.0, 1532828.0, 617541.0, 332572.0, 221285.0, 151711.0, 101630.0, 66651.0, 43880.0, 28260.0, 18393.0, 11548.0, 7169.0, 4473.0, 2847.0, 1866.0, 1165.0, 711.0, 455.0, 304.0, 183.0, 126.0, 84.0, 49.0, 36.0, 27.0, 14.0, 8.0, 5.0, 2.0], "bins": [-22.5, -21.857177734375, -21.21435546875, -20.571533203125, -19.9287109375, -19.285888671875, -18.64306640625, -18.000244140625, -17.357421875, -16.714599609375, -16.07177734375, -15.428955078125, -14.7861328125, -14.143310546875, -13.50048828125, -12.857666015625, -12.21484375, -11.572021484375, -10.92919921875, -10.286376953125, -9.6435546875, -9.000732421875, -8.35791015625, -7.715087890625, -7.072265625, -6.429443359375, -5.78662109375, -5.143798828125, -4.5009765625, -3.858154296875, -3.21533203125, -2.572509765625, -1.9296875, -1.286865234375, -0.64404296875, -0.001220703125, 0.6416015625, 1.284423828125, 1.92724609375, 2.570068359375, 3.212890625, 3.855712890625, 4.49853515625, 5.141357421875, 5.7841796875, 6.427001953125, 7.06982421875, 7.712646484375, 8.35546875, 8.998291015625, 9.64111328125, 10.283935546875, 10.9267578125, 11.569580078125, 12.21240234375, 12.855224609375, 13.498046875, 14.140869140625, 14.78369140625, 15.426513671875, 16.0693359375, 16.712158203125, 17.35498046875, 17.997802734375, 18.640625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 1.0, 7.0, 3.0, 8.0, 11.0, 7.0, 13.0, 22.0, 24.0, 20.0, 21.0, 21.0, 23.0, 42.0, 29.0, 47.0, 61.0, 120.0, 201.0, 268.0, 249.0, 203.0, 141.0, 94.0, 74.0, 48.0, 50.0, 45.0, 40.0, 21.0, 18.0, 19.0, 15.0, 10.0, 7.0, 8.0, 8.0, 4.0, 8.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.0625, -45.671875, -44.28125, -42.890625, -41.5, -40.109375, -38.71875, -37.328125, -35.9375, -34.546875, -33.15625, -31.765625, -30.375, -28.984375, -27.59375, -26.203125, -24.8125, -23.421875, -22.03125, -20.640625, -19.25, -17.859375, -16.46875, -15.078125, -13.6875, -12.296875, -10.90625, -9.515625, -8.125, -6.734375, -5.34375, -3.953125, -2.5625, -1.171875, 0.21875, 1.609375, 3.0, 4.390625, 5.78125, 7.171875, 8.5625, 9.953125, 11.34375, 12.734375, 14.125, 15.515625, 16.90625, 18.296875, 19.6875, 21.078125, 22.46875, 23.859375, 25.25, 26.640625, 28.03125, 29.421875, 30.8125, 32.203125, 33.59375, 34.984375, 36.375, 37.765625, 39.15625, 40.546875, 41.9375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [4.0, 3.0, 6.0, 8.0, 13.0, 18.0, 24.0, 21.0, 24.0, 35.0, 48.0, 80.0, 116.0, 170.0, 222.0, 350.0, 483.0, 734.0, 1093.0, 1702.0, 2868.0, 4655.0, 7860.0, 13593.0, 24329.0, 44171.0, 84179.0, 237345.0, 5545320.0, 162984.0, 70204.0, 37916.0, 21103.0, 11831.0, 6826.0, 4006.0, 2447.0, 1531.0, 954.0, 678.0, 443.0, 340.0, 217.0, 141.0, 107.0, 80.0, 50.0, 33.0, 26.0, 21.0, 17.0, 3.0, 7.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-62.5625, -60.357421875, -58.15234375, -55.947265625, -53.7421875, -51.537109375, -49.33203125, -47.126953125, -44.921875, -42.716796875, -40.51171875, -38.306640625, -36.1015625, -33.896484375, -31.69140625, -29.486328125, -27.28125, -25.076171875, -22.87109375, -20.666015625, -18.4609375, -16.255859375, -14.05078125, -11.845703125, -9.640625, -7.435546875, -5.23046875, -3.025390625, -0.8203125, 1.384765625, 3.58984375, 5.794921875, 8.0, 10.205078125, 12.41015625, 14.615234375, 16.8203125, 19.025390625, 21.23046875, 23.435546875, 25.640625, 27.845703125, 30.05078125, 32.255859375, 34.4609375, 36.666015625, 38.87109375, 41.076171875, 43.28125, 45.486328125, 47.69140625, 49.896484375, 52.1015625, 54.306640625, 56.51171875, 58.716796875, 60.921875, 63.126953125, 65.33203125, 67.537109375, 69.7421875, 71.947265625, 74.15234375, 76.357421875, 78.5625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 6.0, 6.0, 7.0, 5.0, 9.0, 6.0, 12.0, 15.0, 10.0, 20.0, 29.0, 29.0, 33.0, 32.0, 21.0, 34.0, 38.0, 37.0, 43.0, 70.0, 154.0, 326.0, 348.0, 209.0, 106.0, 74.0, 47.0, 42.0, 42.0, 32.0, 26.0, 25.0, 29.0, 19.0, 18.0, 11.0, 10.0, 7.0, 10.0, 11.0, 5.0, 2.0, 8.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-65.0, -63.0791015625, -61.158203125, -59.2373046875, -57.31640625, -55.3955078125, -53.474609375, -51.5537109375, -49.6328125, -47.7119140625, -45.791015625, -43.8701171875, -41.94921875, -40.0283203125, -38.107421875, -36.1865234375, -34.265625, -32.3447265625, -30.423828125, -28.5029296875, -26.58203125, -24.6611328125, -22.740234375, -20.8193359375, -18.8984375, -16.9775390625, -15.056640625, -13.1357421875, -11.21484375, -9.2939453125, -7.373046875, -5.4521484375, -3.53125, -1.6103515625, 0.310546875, 2.2314453125, 4.15234375, 6.0732421875, 7.994140625, 9.9150390625, 11.8359375, 13.7568359375, 15.677734375, 17.5986328125, 19.51953125, 21.4404296875, 23.361328125, 25.2822265625, 27.203125, 29.1240234375, 31.044921875, 32.9658203125, 34.88671875, 36.8076171875, 38.728515625, 40.6494140625, 42.5703125, 44.4912109375, 46.412109375, 48.3330078125, 50.25390625, 52.1748046875, 54.095703125, 56.0166015625, 57.9375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 9.0, 9.0, 18.0, 21.0, 38.0, 50.0, 92.0, 211.0, 239.0, 108.0, 73.0, 50.0, 34.0, 21.0, 17.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3444.7783203125, -3358.5693359375, -3272.3603515625, -3186.1513671875, -3099.9423828125, -3013.7333984375, -2927.5244140625, -2841.315185546875, -2755.106201171875, -2668.897216796875, -2582.688232421875, -2496.479248046875, -2410.270263671875, -2324.06103515625, -2237.85205078125, -2151.64306640625, -2065.43408203125, -1979.22509765625, -1893.01611328125, -1806.80712890625, -1720.5980224609375, -1634.3890380859375, -1548.1800537109375, -1461.970947265625, -1375.76220703125, -1289.55322265625, -1203.34423828125, -1117.13525390625, -1030.9261474609375, -944.7171630859375, -858.5081787109375, -772.2991333007812, -686.090087890625, -599.881103515625, -513.6720581054688, -427.46307373046875, -341.2540588378906, -255.0450439453125, -168.8360595703125, -82.62701416015625, 3.58197021484375, 89.79097747802734, 175.99998474121094, 262.208984375, 348.4179992675781, 434.62701416015625, 520.8359985351562, 607.0450439453125, 693.2540283203125, 779.4630126953125, 865.6720581054688, 951.8810424804688, 1038.090087890625, 1124.299072265625, 1210.508056640625, 1296.717041015625, 1382.926025390625, 1469.135009765625, 1555.343994140625, 1641.552978515625, 1727.7620849609375, 1813.9710693359375, 1900.1800537109375, 1986.38916015625, 2072.59814453125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 9.0, 0.0, 11.0, 10.0, 10.0, 20.0, 24.0, 13.0, 22.0, 19.0, 28.0, 38.0, 30.0, 34.0, 38.0, 59.0, 64.0, 94.0, 77.0, 69.0, 57.0, 45.0, 31.0, 24.0, 33.0, 19.0, 15.0, 16.0, 24.0, 14.0, 11.0, 7.0, 2.0, 7.0, 5.0, 6.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1230.11181640625, -1193.7510986328125, -1157.3905029296875, -1121.02978515625, -1084.6690673828125, -1048.308349609375, -1011.94775390625, -975.5870361328125, -939.2263793945312, -902.86572265625, -866.5050048828125, -830.1443481445312, -793.78369140625, -757.4229736328125, -721.0623168945312, -684.70166015625, -648.3409423828125, -611.9802856445312, -575.6195678710938, -539.2589111328125, -502.8982238769531, -466.53753662109375, -430.1768798828125, -393.8161926269531, -357.45550537109375, -321.0948181152344, -284.734130859375, -248.37347412109375, -212.01278686523438, -175.652099609375, -139.2914276123047, -102.93075561523438, -66.5699462890625, -30.209266662597656, 6.1514129638671875, 42.51209259033203, 78.87277221679688, 115.23345947265625, 151.59413146972656, 187.95480346679688, 224.31549072265625, 260.6761779785156, 297.036865234375, 333.39752197265625, 369.7582092285156, 406.118896484375, 442.47955322265625, 478.8402404785156, 515.200927734375, 551.5615844726562, 587.9223022460938, 624.282958984375, 660.6436767578125, 697.0043334960938, 733.364990234375, 769.7257080078125, 806.0863647460938, 842.447021484375, 878.8077392578125, 915.1683959960938, 951.529052734375, 987.8897705078125, 1024.25048828125, 1060.611083984375, 1096.9718017578125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 3.0, 7.0, 4.0, 7.0, 12.0, 11.0, 21.0, 25.0, 43.0, 53.0, 86.0, 117.0, 150.0, 280.0, 403.0, 590.0, 882.0, 1382.0, 2260.0, 3812.0, 6884.0, 13081.0, 28109.0, 83543.0, 673410.0, 3135990.0, 161814.0, 43203.0, 17774.0, 8875.0, 4716.0, 2756.0, 1552.0, 919.0, 550.0, 354.0, 236.0, 136.0, 102.0, 42.0, 29.0, 21.0, 8.0, 8.0, 11.0, 3.0, 5.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-13.2734375, -12.8963623046875, -12.519287109375, -12.1422119140625, -11.76513671875, -11.3880615234375, -11.010986328125, -10.6339111328125, -10.2568359375, -9.8797607421875, -9.502685546875, -9.1256103515625, -8.74853515625, -8.3714599609375, -7.994384765625, -7.6173095703125, -7.240234375, -6.8631591796875, -6.486083984375, -6.1090087890625, -5.73193359375, -5.3548583984375, -4.977783203125, -4.6007080078125, -4.2236328125, -3.8465576171875, -3.469482421875, -3.0924072265625, -2.71533203125, -2.3382568359375, -1.961181640625, -1.5841064453125, -1.20703125, -0.8299560546875, -0.452880859375, -0.0758056640625, 0.30126953125, 0.6783447265625, 1.055419921875, 1.4324951171875, 1.8095703125, 2.1866455078125, 2.563720703125, 2.9407958984375, 3.31787109375, 3.6949462890625, 4.072021484375, 4.4490966796875, 4.826171875, 5.2032470703125, 5.580322265625, 5.9573974609375, 6.33447265625, 6.7115478515625, 7.088623046875, 7.4656982421875, 7.8427734375, 8.2198486328125, 8.596923828125, 8.9739990234375, 9.35107421875, 9.7281494140625, 10.105224609375, 10.4822998046875, 10.859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 7.0, 4.0, 9.0, 4.0, 15.0, 13.0, 22.0, 39.0, 71.0, 113.0, 166.0, 169.0, 111.0, 69.0, 63.0, 27.0, 16.0, 13.0, 10.0, 6.0, 6.0, 9.0, 3.0, 3.0, 4.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.623046875, -1.5742034912109375, -1.525360107421875, -1.4765167236328125, -1.42767333984375, -1.3788299560546875, -1.329986572265625, -1.2811431884765625, -1.2322998046875, -1.1834564208984375, -1.134613037109375, -1.0857696533203125, -1.03692626953125, -0.9880828857421875, -0.939239501953125, -0.8903961181640625, -0.841552734375, -0.7927093505859375, -0.743865966796875, -0.6950225830078125, -0.64617919921875, -0.5973358154296875, -0.548492431640625, -0.4996490478515625, -0.4508056640625, -0.4019622802734375, -0.353118896484375, -0.3042755126953125, -0.25543212890625, -0.2065887451171875, -0.157745361328125, -0.1089019775390625, -0.06005859375, -0.0112152099609375, 0.037628173828125, 0.0864715576171875, 0.13531494140625, 0.1841583251953125, 0.233001708984375, 0.2818450927734375, 0.3306884765625, 0.3795318603515625, 0.428375244140625, 0.4772186279296875, 0.52606201171875, 0.5749053955078125, 0.623748779296875, 0.6725921630859375, 0.721435546875, 0.7702789306640625, 0.819122314453125, 0.8679656982421875, 0.91680908203125, 0.9656524658203125, 1.014495849609375, 1.0633392333984375, 1.1121826171875, 1.1610260009765625, 1.209869384765625, 1.2587127685546875, 1.30755615234375, 1.3563995361328125, 1.405242919921875, 1.4540863037109375, 1.5029296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 20.0, 14.0, 17.0, 29.0, 57.0, 84.0, 128.0, 188.0, 308.0, 591.0, 966.0, 1770.0, 3525.0, 7153.0, 15691.0, 36742.0, 97680.0, 289428.0, 1101566.0, 1952229.0, 454527.0, 141475.0, 51096.0, 20443.0, 9134.0, 4302.0, 2146.0, 1168.0, 682.0, 397.0, 255.0, 149.0, 103.0, 76.0, 34.0, 31.0, 21.0, 17.0, 12.0, 5.0, 4.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0625, -7.803955078125, -7.54541015625, -7.286865234375, -7.0283203125, -6.769775390625, -6.51123046875, -6.252685546875, -5.994140625, -5.735595703125, -5.47705078125, -5.218505859375, -4.9599609375, -4.701416015625, -4.44287109375, -4.184326171875, -3.92578125, -3.667236328125, -3.40869140625, -3.150146484375, -2.8916015625, -2.633056640625, -2.37451171875, -2.115966796875, -1.857421875, -1.598876953125, -1.34033203125, -1.081787109375, -0.8232421875, -0.564697265625, -0.30615234375, -0.047607421875, 0.2109375, 0.469482421875, 0.72802734375, 0.986572265625, 1.2451171875, 1.503662109375, 1.76220703125, 2.020751953125, 2.279296875, 2.537841796875, 2.79638671875, 3.054931640625, 3.3134765625, 3.572021484375, 3.83056640625, 4.089111328125, 4.34765625, 4.606201171875, 4.86474609375, 5.123291015625, 5.3818359375, 5.640380859375, 5.89892578125, 6.157470703125, 6.416015625, 6.674560546875, 6.93310546875, 7.191650390625, 7.4501953125, 7.708740234375, 7.96728515625, 8.225830078125, 8.484375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 9.0, 14.0, 13.0, 16.0, 33.0, 32.0, 43.0, 59.0, 94.0, 110.0, 125.0, 160.0, 209.0, 326.0, 473.0, 699.0, 462.0, 300.0, 243.0, 159.0, 123.0, 103.0, 64.0, 57.0, 42.0, 24.0, 19.0, 16.0, 11.0, 11.0, 6.0, 5.0, 1.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.22265625, -3.120208740234375, -3.01776123046875, -2.915313720703125, -2.8128662109375, -2.710418701171875, -2.60797119140625, -2.505523681640625, -2.403076171875, -2.300628662109375, -2.19818115234375, -2.095733642578125, -1.9932861328125, -1.890838623046875, -1.78839111328125, -1.685943603515625, -1.58349609375, -1.481048583984375, -1.37860107421875, -1.276153564453125, -1.1737060546875, -1.071258544921875, -0.96881103515625, -0.866363525390625, -0.763916015625, -0.661468505859375, -0.55902099609375, -0.456573486328125, -0.3541259765625, -0.251678466796875, -0.14923095703125, -0.046783447265625, 0.0556640625, 0.158111572265625, 0.26055908203125, 0.363006591796875, 0.4654541015625, 0.567901611328125, 0.67034912109375, 0.772796630859375, 0.875244140625, 0.977691650390625, 1.08013916015625, 1.182586669921875, 1.2850341796875, 1.387481689453125, 1.48992919921875, 1.592376708984375, 1.69482421875, 1.797271728515625, 1.89971923828125, 2.002166748046875, 2.1046142578125, 2.207061767578125, 2.30950927734375, 2.411956787109375, 2.514404296875, 2.616851806640625, 2.71929931640625, 2.821746826171875, 2.9241943359375, 3.026641845703125, 3.12908935546875, 3.231536865234375, 3.333984375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 12.0, 19.0, 44.0, 104.0, 155.0, 282.0, 192.0, 111.0, 48.0, 9.0, 18.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.88779067993164, -51.938392639160156, -49.988990783691406, -48.039588928222656, -46.09019088745117, -44.14079284667969, -42.19139099121094, -40.24198913574219, -38.2925910949707, -36.34319305419922, -34.39379119873047, -32.44438934326172, -30.494991302490234, -28.545591354370117, -26.59619140625, -24.646791458129883, -22.697391510009766, -20.74799156188965, -18.79859161376953, -16.849191665649414, -14.899791717529297, -12.95039176940918, -11.000991821289062, -9.051591873168945, -7.102191925048828, -5.152791976928711, -3.2033920288085938, -1.2539920806884766, 0.6954078674316406, 2.644807815551758, 4.594207763671875, 6.543607711791992, 8.493011474609375, 10.442411422729492, 12.39181137084961, 14.341211318969727, 16.290611267089844, 18.24001121520996, 20.189411163330078, 22.138811111450195, 24.088211059570312, 26.03761100769043, 27.987010955810547, 29.936410903930664, 31.88581085205078, 33.83521270751953, 35.784610748291016, 37.7340087890625, 39.68341064453125, 41.6328125, 43.582210540771484, 45.53160858154297, 47.48101043701172, 49.43041229248047, 51.37981033325195, 53.32920837402344, 55.27861022949219, 57.22801208496094, 59.17741012573242, 61.126808166503906, 63.076210021972656, 65.0256118774414, 66.97500610351562, 68.92440795898438, 70.87380981445312]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 12.0, 15.0, 14.0, 11.0, 20.0, 20.0, 26.0, 26.0, 44.0, 36.0, 45.0, 47.0, 55.0, 52.0, 56.0, 64.0, 56.0, 52.0, 52.0, 46.0, 41.0, 29.0, 32.0, 44.0, 22.0, 12.0, 16.0, 14.0, 12.0, 8.0, 3.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.651752471923828, -22.992904663085938, -22.334056854248047, -21.675209045410156, -21.016361236572266, -20.357513427734375, -19.698665618896484, -19.039817810058594, -18.380970001220703, -17.722122192382812, -17.063274383544922, -16.40442657470703, -15.74557876586914, -15.08673095703125, -14.427884101867676, -13.769036293029785, -13.110189437866211, -12.45134162902832, -11.79249382019043, -11.133646011352539, -10.474798202514648, -9.815950393676758, -9.157103538513184, -8.498255729675293, -7.839407920837402, -7.180560111999512, -6.521712303161621, -5.862864971160889, -5.204017162322998, -4.545169353485107, -3.886321783065796, -3.2274742126464844, -2.5686264038085938, -1.9097787141799927, -1.2509310245513916, -0.5920833349227905, 0.06676435470581055, 0.7256121635437012, 1.3844597339630127, 2.043307304382324, 2.702155113220215, 3.3610029220581055, 4.019850730895996, 4.6786980628967285, 5.337545871734619, 5.99639368057251, 6.655241012573242, 7.314088821411133, 7.972936630249023, 8.631784439086914, 9.290632247924805, 9.949480056762695, 10.608327865600586, 11.267175674438477, 11.92602252960205, 12.584870338439941, 13.243718147277832, 13.902565956115723, 14.561413764953613, 15.220261573791504, 15.879108428955078, 16.53795623779297, 17.19680404663086, 17.85565185546875, 18.51449966430664]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 10.0, 9.0, 20.0, 27.0, 44.0, 60.0, 68.0, 111.0, 174.0, 189.0, 337.0, 482.0, 706.0, 1092.0, 1661.0, 2791.0, 4574.0, 8528.0, 17941.0, 49323.0, 216750.0, 542234.0, 133400.0, 35682.0, 14409.0, 7172.0, 4018.0, 2299.0, 1492.0, 940.0, 605.0, 431.0, 281.0, 181.0, 171.0, 109.0, 66.0, 57.0, 30.0, 26.0, 14.0, 16.0, 9.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.68524169921875, -5.4915771484375, -5.29791259765625, -5.104248046875, -4.91058349609375, -4.7169189453125, -4.52325439453125, -4.32958984375, -4.13592529296875, -3.9422607421875, -3.74859619140625, -3.554931640625, -3.36126708984375, -3.1676025390625, -2.97393798828125, -2.7802734375, -2.58660888671875, -2.3929443359375, -2.19927978515625, -2.005615234375, -1.81195068359375, -1.6182861328125, -1.42462158203125, -1.23095703125, -1.03729248046875, -0.8436279296875, -0.64996337890625, -0.456298828125, -0.26263427734375, -0.0689697265625, 0.12469482421875, 0.318359375, 0.51202392578125, 0.7056884765625, 0.89935302734375, 1.093017578125, 1.28668212890625, 1.4803466796875, 1.67401123046875, 1.86767578125, 2.06134033203125, 2.2550048828125, 2.44866943359375, 2.642333984375, 2.83599853515625, 3.0296630859375, 3.22332763671875, 3.4169921875, 3.61065673828125, 3.8043212890625, 3.99798583984375, 4.191650390625, 4.38531494140625, 4.5789794921875, 4.77264404296875, 4.96630859375, 5.15997314453125, 5.3536376953125, 5.54730224609375, 5.740966796875, 5.93463134765625, 6.1282958984375, 6.32196044921875, 6.515625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 8.0, 8.0, 6.0, 19.0, 16.0, 27.0, 37.0, 65.0, 96.0, 130.0, 111.0, 133.0, 95.0, 72.0, 46.0, 35.0, 16.0, 8.0, 12.0, 12.0, 5.0, 11.0, 7.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7783203125, -1.7221832275390625, -1.666046142578125, -1.6099090576171875, -1.55377197265625, -1.4976348876953125, -1.441497802734375, -1.3853607177734375, -1.3292236328125, -1.2730865478515625, -1.216949462890625, -1.1608123779296875, -1.10467529296875, -1.0485382080078125, -0.992401123046875, -0.9362640380859375, -0.880126953125, -0.8239898681640625, -0.767852783203125, -0.7117156982421875, -0.65557861328125, -0.5994415283203125, -0.543304443359375, -0.4871673583984375, -0.4310302734375, -0.3748931884765625, -0.318756103515625, -0.2626190185546875, -0.20648193359375, -0.1503448486328125, -0.094207763671875, -0.0380706787109375, 0.01806640625, 0.0742034912109375, 0.130340576171875, 0.1864776611328125, 0.24261474609375, 0.2987518310546875, 0.354888916015625, 0.4110260009765625, 0.4671630859375, 0.5233001708984375, 0.579437255859375, 0.6355743408203125, 0.69171142578125, 0.7478485107421875, 0.803985595703125, 0.8601226806640625, 0.916259765625, 0.9723968505859375, 1.028533935546875, 1.0846710205078125, 1.14080810546875, 1.1969451904296875, 1.253082275390625, 1.3092193603515625, 1.3653564453125, 1.4214935302734375, 1.477630615234375, 1.5337677001953125, 1.58990478515625, 1.6460418701171875, 1.702178955078125, 1.7583160400390625, 1.814453125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 13.0, 8.0, 14.0, 22.0, 35.0, 52.0, 55.0, 104.0, 173.0, 290.0, 434.0, 699.0, 1196.0, 2123.0, 3775.0, 6974.0, 14037.0, 30301.0, 70669.0, 182590.0, 377685.0, 209412.0, 80527.0, 34206.0, 15716.0, 7763.0, 4029.0, 2263.0, 1294.0, 794.0, 471.0, 306.0, 199.0, 102.0, 85.0, 48.0, 26.0, 15.0, 23.0, 11.0, 1.0, 5.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.26171875, -6.0751953125, -5.888671875, -5.7021484375, -5.515625, -5.3291015625, -5.142578125, -4.9560546875, -4.76953125, -4.5830078125, -4.396484375, -4.2099609375, -4.0234375, -3.8369140625, -3.650390625, -3.4638671875, -3.27734375, -3.0908203125, -2.904296875, -2.7177734375, -2.53125, -2.3447265625, -2.158203125, -1.9716796875, -1.78515625, -1.5986328125, -1.412109375, -1.2255859375, -1.0390625, -0.8525390625, -0.666015625, -0.4794921875, -0.29296875, -0.1064453125, 0.080078125, 0.2666015625, 0.453125, 0.6396484375, 0.826171875, 1.0126953125, 1.19921875, 1.3857421875, 1.572265625, 1.7587890625, 1.9453125, 2.1318359375, 2.318359375, 2.5048828125, 2.69140625, 2.8779296875, 3.064453125, 3.2509765625, 3.4375, 3.6240234375, 3.810546875, 3.9970703125, 4.18359375, 4.3701171875, 4.556640625, 4.7431640625, 4.9296875, 5.1162109375, 5.302734375, 5.4892578125, 5.67578125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 5.0, 7.0, 9.0, 11.0, 8.0, 9.0, 21.0, 27.0, 15.0, 18.0, 31.0, 33.0, 38.0, 27.0, 38.0, 37.0, 46.0, 47.0, 47.0, 42.0, 43.0, 48.0, 41.0, 42.0, 43.0, 37.0, 23.0, 28.0, 21.0, 34.0, 27.0, 19.0, 12.0, 22.0, 8.0, 10.0, 7.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.94140625, -6.73748779296875, -6.5335693359375, -6.32965087890625, -6.125732421875, -5.92181396484375, -5.7178955078125, -5.51397705078125, -5.31005859375, -5.10614013671875, -4.9022216796875, -4.69830322265625, -4.494384765625, -4.29046630859375, -4.0865478515625, -3.88262939453125, -3.6787109375, -3.47479248046875, -3.2708740234375, -3.06695556640625, -2.863037109375, -2.65911865234375, -2.4552001953125, -2.25128173828125, -2.04736328125, -1.84344482421875, -1.6395263671875, -1.43560791015625, -1.231689453125, -1.02777099609375, -0.8238525390625, -0.61993408203125, -0.416015625, -0.21209716796875, -0.0081787109375, 0.19573974609375, 0.399658203125, 0.60357666015625, 0.8074951171875, 1.01141357421875, 1.21533203125, 1.41925048828125, 1.6231689453125, 1.82708740234375, 2.031005859375, 2.23492431640625, 2.4388427734375, 2.64276123046875, 2.8466796875, 3.05059814453125, 3.2545166015625, 3.45843505859375, 3.662353515625, 3.86627197265625, 4.0701904296875, 4.27410888671875, 4.47802734375, 4.68194580078125, 4.8858642578125, 5.08978271484375, 5.293701171875, 5.49761962890625, 5.7015380859375, 5.90545654296875, 6.109375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 10.0, 4.0, 12.0, 12.0, 23.0, 40.0, 88.0, 104.0, 190.0, 362.0, 879.0, 2517.0, 8543.0, 46495.0, 590464.0, 359009.0, 30068.0, 6287.0, 1973.0, 700.0, 334.0, 167.0, 90.0, 53.0, 39.0, 22.0, 19.0, 12.0, 8.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.203125, -7.8980712890625, -7.593017578125, -7.2879638671875, -6.98291015625, -6.6778564453125, -6.372802734375, -6.0677490234375, -5.7626953125, -5.4576416015625, -5.152587890625, -4.8475341796875, -4.54248046875, -4.2374267578125, -3.932373046875, -3.6273193359375, -3.322265625, -3.0172119140625, -2.712158203125, -2.4071044921875, -2.10205078125, -1.7969970703125, -1.491943359375, -1.1868896484375, -0.8818359375, -0.5767822265625, -0.271728515625, 0.0333251953125, 0.33837890625, 0.6434326171875, 0.948486328125, 1.2535400390625, 1.55859375, 1.8636474609375, 2.168701171875, 2.4737548828125, 2.77880859375, 3.0838623046875, 3.388916015625, 3.6939697265625, 3.9990234375, 4.3040771484375, 4.609130859375, 4.9141845703125, 5.21923828125, 5.5242919921875, 5.829345703125, 6.1343994140625, 6.439453125, 6.7445068359375, 7.049560546875, 7.3546142578125, 7.65966796875, 7.9647216796875, 8.269775390625, 8.5748291015625, 8.8798828125, 9.1849365234375, 9.489990234375, 9.7950439453125, 10.10009765625, 10.4051513671875, 10.710205078125, 11.0152587890625, 11.3203125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 2.0, 8.0, 12.0, 10.0, 21.0, 21.0, 29.0, 30.0, 47.0, 63.0, 80.0, 63.0, 81.0, 94.0, 87.0, 66.0, 56.0, 50.0, 40.0, 32.0, 22.0, 16.0, 11.0, 6.0, 9.0, 10.0, 12.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00039005279541015625, -0.0003782510757446289, -0.00036644935607910156, -0.0003546476364135742, -0.0003428459167480469, -0.00033104419708251953, -0.0003192424774169922, -0.00030744075775146484, -0.0002956390380859375, -0.00028383731842041016, -0.0002720355987548828, -0.00026023387908935547, -0.0002484321594238281, -0.00023663043975830078, -0.00022482872009277344, -0.0002130270004272461, -0.00020122528076171875, -0.0001894235610961914, -0.00017762184143066406, -0.00016582012176513672, -0.00015401840209960938, -0.00014221668243408203, -0.0001304149627685547, -0.00011861324310302734, -0.0001068115234375, -9.500980377197266e-05, -8.320808410644531e-05, -7.140636444091797e-05, -5.9604644775390625e-05, -4.780292510986328e-05, -3.600120544433594e-05, -2.4199485778808594e-05, -1.239776611328125e-05, -5.960464477539062e-07, 1.1205673217773438e-05, 2.300739288330078e-05, 3.4809112548828125e-05, 4.661083221435547e-05, 5.841255187988281e-05, 7.021427154541016e-05, 8.20159912109375e-05, 9.381771087646484e-05, 0.00010561943054199219, 0.00011742115020751953, 0.00012922286987304688, 0.00014102458953857422, 0.00015282630920410156, 0.0001646280288696289, 0.00017642974853515625, 0.0001882314682006836, 0.00020003318786621094, 0.00021183490753173828, 0.00022363662719726562, 0.00023543834686279297, 0.0002472400665283203, 0.00025904178619384766, 0.000270843505859375, 0.00028264522552490234, 0.0002944469451904297, 0.00030624866485595703, 0.0003180503845214844, 0.0003298521041870117, 0.00034165382385253906, 0.0003534555435180664, 0.00036525726318359375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 9.0, 9.0, 7.0, 10.0, 23.0, 32.0, 64.0, 84.0, 196.0, 345.0, 808.0, 1731.0, 4599.0, 15024.0, 70573.0, 507174.0, 377188.0, 52037.0, 11952.0, 3777.0, 1521.0, 618.0, 353.0, 166.0, 88.0, 59.0, 42.0, 20.0, 18.0, 9.0, 9.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.15625, -8.908203125, -8.66015625, -8.412109375, -8.1640625, -7.916015625, -7.66796875, -7.419921875, -7.171875, -6.923828125, -6.67578125, -6.427734375, -6.1796875, -5.931640625, -5.68359375, -5.435546875, -5.1875, -4.939453125, -4.69140625, -4.443359375, -4.1953125, -3.947265625, -3.69921875, -3.451171875, -3.203125, -2.955078125, -2.70703125, -2.458984375, -2.2109375, -1.962890625, -1.71484375, -1.466796875, -1.21875, -0.970703125, -0.72265625, -0.474609375, -0.2265625, 0.021484375, 0.26953125, 0.517578125, 0.765625, 1.013671875, 1.26171875, 1.509765625, 1.7578125, 2.005859375, 2.25390625, 2.501953125, 2.75, 2.998046875, 3.24609375, 3.494140625, 3.7421875, 3.990234375, 4.23828125, 4.486328125, 4.734375, 4.982421875, 5.23046875, 5.478515625, 5.7265625, 5.974609375, 6.22265625, 6.470703125, 6.71875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 6.0, 8.0, 10.0, 17.0, 21.0, 46.0, 40.0, 34.0, 56.0, 48.0, 65.0, 78.0, 87.0, 78.0, 84.0, 67.0, 57.0, 54.0, 35.0, 28.0, 12.0, 11.0, 18.0, 11.0, 9.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2734375, -3.14617919921875, -3.0189208984375, -2.89166259765625, -2.764404296875, -2.63714599609375, -2.5098876953125, -2.38262939453125, -2.25537109375, -2.12811279296875, -2.0008544921875, -1.87359619140625, -1.746337890625, -1.61907958984375, -1.4918212890625, -1.36456298828125, -1.2373046875, -1.11004638671875, -0.9827880859375, -0.85552978515625, -0.728271484375, -0.60101318359375, -0.4737548828125, -0.34649658203125, -0.21923828125, -0.09197998046875, 0.0352783203125, 0.16253662109375, 0.289794921875, 0.41705322265625, 0.5443115234375, 0.67156982421875, 0.798828125, 0.92608642578125, 1.0533447265625, 1.18060302734375, 1.307861328125, 1.43511962890625, 1.5623779296875, 1.68963623046875, 1.81689453125, 1.94415283203125, 2.0714111328125, 2.19866943359375, 2.325927734375, 2.45318603515625, 2.5804443359375, 2.70770263671875, 2.8349609375, 2.96221923828125, 3.0894775390625, 3.21673583984375, 3.343994140625, 3.47125244140625, 3.5985107421875, 3.72576904296875, 3.85302734375, 3.98028564453125, 4.1075439453125, 4.23480224609375, 4.362060546875, 4.48931884765625, 4.6165771484375, 4.74383544921875, 4.87109375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 16.0, 13.0, 30.0, 95.0, 260.0, 346.0, 149.0, 47.0, 15.0, 13.0, 5.0, 4.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.5968017578125, -158.52476501464844, -153.45272827148438, -148.3806915283203, -143.30865478515625, -138.2366180419922, -133.16458129882812, -128.09255981445312, -123.02051544189453, -117.94847869873047, -112.8764419555664, -107.80440521240234, -102.73237609863281, -97.66033935546875, -92.58830261230469, -87.51626586914062, -82.44422912597656, -77.3721923828125, -72.30015563964844, -67.22811889648438, -62.15608596801758, -57.084049224853516, -52.01201629638672, -46.939979553222656, -41.867942810058594, -36.79590606689453, -31.7238712310791, -26.651836395263672, -21.57979965209961, -16.507762908935547, -11.435728073120117, -6.3636932373046875, -1.2916717529296875, 3.7803640365600586, 8.852399826049805, 13.92443561553955, 18.996471405029297, 24.06850814819336, 29.14054298400879, 34.21257781982422, 39.28461456298828, 44.356651306152344, 49.428688049316406, 54.5007209777832, 59.572757720947266, 64.64479064941406, 69.71682739257812, 74.78886413574219, 79.86090087890625, 84.93293762207031, 90.00497436523438, 95.07701110839844, 100.1490478515625, 105.22108459472656, 110.2931137084961, 115.36515045166016, 120.43718719482422, 125.50922393798828, 130.5812530517578, 135.65328979492188, 140.72532653808594, 145.79736328125, 150.86940002441406, 155.94143676757812, 161.0134735107422]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 3.0, 2.0, 5.0, 7.0, 11.0, 17.0, 20.0, 31.0, 57.0, 87.0, 111.0, 144.0, 156.0, 105.0, 85.0, 51.0, 24.0, 14.0, 13.0, 14.0, 10.0, 4.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.89652252197266, -101.9616928100586, -98.02685546875, -94.09202575683594, -90.15719604492188, -86.22235870361328, -82.28752899169922, -78.35269165039062, -74.41786193847656, -70.4830322265625, -66.5481948852539, -62.613365173339844, -58.678531646728516, -54.74369812011719, -50.808868408203125, -46.8740348815918, -42.93920135498047, -39.00436782836914, -35.06953430175781, -31.13470458984375, -27.199871063232422, -23.265037536621094, -19.3302059173584, -15.395374298095703, -11.460540771484375, -7.525708198547363, -3.5908756256103516, 0.34395694732666016, 4.278789520263672, 8.213623046875, 12.148454666137695, 16.08328628540039, 20.018112182617188, 23.952945709228516, 27.88777732849121, 31.822608947753906, 35.757442474365234, 39.69227600097656, 43.627105712890625, 47.56193923950195, 51.49677276611328, 55.43160629272461, 59.36643981933594, 63.30126953125, 67.23609924316406, 71.17093658447266, 75.10576629638672, 79.04060363769531, 82.97543334960938, 86.91026306152344, 90.84510040283203, 94.7799301147461, 98.71476745605469, 102.64959716796875, 106.58442687988281, 110.51925659179688, 114.45409393310547, 118.38892364501953, 122.32376098632812, 126.25859069824219, 130.19342041015625, 134.12826538085938, 138.06309509277344, 141.9979248046875, 145.93275451660156]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 9.0, 3.0, 10.0, 17.0, 31.0, 35.0, 50.0, 80.0, 172.0, 275.0, 567.0, 1195.0, 3207.0, 10609.0, 65838.0, 3889739.0, 197487.0, 17932.0, 4307.0, 1503.0, 585.0, 276.0, 137.0, 88.0, 48.0, 24.0, 10.0, 15.0, 7.0, 5.0, 7.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.09375, -34.9892578125, -33.884765625, -32.7802734375, -31.67578125, -30.5712890625, -29.466796875, -28.3623046875, -27.2578125, -26.1533203125, -25.048828125, -23.9443359375, -22.83984375, -21.7353515625, -20.630859375, -19.5263671875, -18.421875, -17.3173828125, -16.212890625, -15.1083984375, -14.00390625, -12.8994140625, -11.794921875, -10.6904296875, -9.5859375, -8.4814453125, -7.376953125, -6.2724609375, -5.16796875, -4.0634765625, -2.958984375, -1.8544921875, -0.75, 0.3544921875, 1.458984375, 2.5634765625, 3.66796875, 4.7724609375, 5.876953125, 6.9814453125, 8.0859375, 9.1904296875, 10.294921875, 11.3994140625, 12.50390625, 13.6083984375, 14.712890625, 15.8173828125, 16.921875, 18.0263671875, 19.130859375, 20.2353515625, 21.33984375, 22.4443359375, 23.548828125, 24.6533203125, 25.7578125, 26.8623046875, 27.966796875, 29.0712890625, 30.17578125, 31.2802734375, 32.384765625, 33.4892578125, 34.59375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 3.0, 8.0, 14.0, 23.0, 22.0, 32.0, 37.0, 59.0, 79.0, 98.0, 105.0, 105.0, 81.0, 69.0, 62.0, 52.0, 42.0, 20.0, 20.0, 7.0, 12.0, 3.0, 4.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7509765625, -1.700836181640625, -1.65069580078125, -1.600555419921875, -1.5504150390625, -1.500274658203125, -1.45013427734375, -1.399993896484375, -1.349853515625, -1.299713134765625, -1.24957275390625, -1.199432373046875, -1.1492919921875, -1.099151611328125, -1.04901123046875, -0.998870849609375, -0.94873046875, -0.898590087890625, -0.84844970703125, -0.798309326171875, -0.7481689453125, -0.698028564453125, -0.64788818359375, -0.597747802734375, -0.547607421875, -0.497467041015625, -0.44732666015625, -0.397186279296875, -0.3470458984375, -0.296905517578125, -0.24676513671875, -0.196624755859375, -0.146484375, -0.096343994140625, -0.04620361328125, 0.003936767578125, 0.0540771484375, 0.104217529296875, 0.15435791015625, 0.204498291015625, 0.254638671875, 0.304779052734375, 0.35491943359375, 0.405059814453125, 0.4552001953125, 0.505340576171875, 0.55548095703125, 0.605621337890625, 0.65576171875, 0.705902099609375, 0.75604248046875, 0.806182861328125, 0.8563232421875, 0.906463623046875, 0.95660400390625, 1.006744384765625, 1.056884765625, 1.107025146484375, 1.15716552734375, 1.207305908203125, 1.2574462890625, 1.307586669921875, 1.35772705078125, 1.407867431640625, 1.4580078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 0.0, 8.0, 5.0, 6.0, 12.0, 7.0, 29.0, 42.0, 55.0, 105.0, 163.0, 264.0, 468.0, 802.0, 1577.0, 3340.0, 7869.0, 22192.0, 75325.0, 400789.0, 3233540.0, 346264.0, 68274.0, 19942.0, 7085.0, 3052.0, 1396.0, 737.0, 390.0, 220.0, 114.0, 80.0, 51.0, 29.0, 18.0, 10.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.083251953125, -16.57275390625, -16.062255859375, -15.5517578125, -15.041259765625, -14.53076171875, -14.020263671875, -13.509765625, -12.999267578125, -12.48876953125, -11.978271484375, -11.4677734375, -10.957275390625, -10.44677734375, -9.936279296875, -9.42578125, -8.915283203125, -8.40478515625, -7.894287109375, -7.3837890625, -6.873291015625, -6.36279296875, -5.852294921875, -5.341796875, -4.831298828125, -4.32080078125, -3.810302734375, -3.2998046875, -2.789306640625, -2.27880859375, -1.768310546875, -1.2578125, -0.747314453125, -0.23681640625, 0.273681640625, 0.7841796875, 1.294677734375, 1.80517578125, 2.315673828125, 2.826171875, 3.336669921875, 3.84716796875, 4.357666015625, 4.8681640625, 5.378662109375, 5.88916015625, 6.399658203125, 6.91015625, 7.420654296875, 7.93115234375, 8.441650390625, 8.9521484375, 9.462646484375, 9.97314453125, 10.483642578125, 10.994140625, 11.504638671875, 12.01513671875, 12.525634765625, 13.0361328125, 13.546630859375, 14.05712890625, 14.567626953125, 15.078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 0.0, 10.0, 4.0, 14.0, 11.0, 16.0, 18.0, 40.0, 54.0, 57.0, 101.0, 146.0, 224.0, 499.0, 1623.0, 525.0, 258.0, 152.0, 94.0, 69.0, 42.0, 34.0, 34.0, 9.0, 8.0, 8.0, 8.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.552734375, -2.469146728515625, -2.38555908203125, -2.301971435546875, -2.2183837890625, -2.134796142578125, -2.05120849609375, -1.967620849609375, -1.884033203125, -1.800445556640625, -1.71685791015625, -1.633270263671875, -1.5496826171875, -1.466094970703125, -1.38250732421875, -1.298919677734375, -1.21533203125, -1.131744384765625, -1.04815673828125, -0.964569091796875, -0.8809814453125, -0.797393798828125, -0.71380615234375, -0.630218505859375, -0.546630859375, -0.463043212890625, -0.37945556640625, -0.295867919921875, -0.2122802734375, -0.128692626953125, -0.04510498046875, 0.038482666015625, 0.1220703125, 0.205657958984375, 0.28924560546875, 0.372833251953125, 0.4564208984375, 0.540008544921875, 0.62359619140625, 0.707183837890625, 0.790771484375, 0.874359130859375, 0.95794677734375, 1.041534423828125, 1.1251220703125, 1.208709716796875, 1.29229736328125, 1.375885009765625, 1.45947265625, 1.543060302734375, 1.62664794921875, 1.710235595703125, 1.7938232421875, 1.877410888671875, 1.96099853515625, 2.044586181640625, 2.128173828125, 2.211761474609375, 2.29534912109375, 2.378936767578125, 2.4625244140625, 2.546112060546875, 2.62969970703125, 2.713287353515625, 2.796875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 12.0, 18.0, 42.0, 125.0, 210.0, 210.0, 182.0, 96.0, 46.0, 26.0, 13.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.104042053222656, -33.084327697753906, -32.064613342285156, -31.044897079467773, -30.02518081665039, -29.00546646118164, -27.98575210571289, -26.96603775024414, -25.946321487426758, -24.926607131958008, -23.906890869140625, -22.887176513671875, -21.867462158203125, -20.847745895385742, -19.828031539916992, -18.80831527709961, -17.78860092163086, -16.76888656616211, -15.749170303344727, -14.729455947875977, -13.70974063873291, -12.690025329589844, -11.670310974121094, -10.650595664978027, -9.630880355834961, -8.611165046691895, -7.591450214385986, -6.571735382080078, -5.552020072937012, -4.532304763793945, -3.512589931488037, -2.492875099182129, -1.4731578826904297, -0.4534428119659424, 0.5662722587585449, 1.5859873294830322, 2.6057024002075195, 3.625417709350586, 4.645132541656494, 5.664847373962402, 6.684562683105469, 7.704277992248535, 8.723993301391602, 9.743707656860352, 10.763422966003418, 11.783138275146484, 12.802852630615234, 13.8225679397583, 14.842283248901367, 15.861998558044434, 16.8817138671875, 17.90142822265625, 18.921142578125, 19.940858840942383, 20.960573196411133, 21.980289459228516, 23.000003814697266, 24.019718170166016, 25.0394344329834, 26.05914878845215, 27.07886505126953, 28.09857940673828, 29.11829376220703, 30.13800811767578, 31.157724380493164]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 13.0, 19.0, 19.0, 11.0, 20.0, 24.0, 30.0, 30.0, 38.0, 52.0, 57.0, 70.0, 65.0, 62.0, 78.0, 59.0, 55.0, 52.0, 45.0, 37.0, 28.0, 34.0, 29.0, 17.0, 17.0, 13.0, 13.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.659423828125, -12.290857315063477, -11.922290802001953, -11.55372428894043, -11.185157775878906, -10.816591262817383, -10.44802474975586, -10.079458236694336, -9.710891723632812, -9.342325210571289, -8.973758697509766, -8.605192184448242, -8.236625671386719, -7.868059158325195, -7.499492645263672, -7.130926132202148, -6.762359619140625, -6.393793106079102, -6.025226593017578, -5.656660079956055, -5.288093566894531, -4.919527053833008, -4.550960540771484, -4.182394027709961, -3.8138275146484375, -3.445261001586914, -3.0766944885253906, -2.708127975463867, -2.3395614624023438, -1.9709949493408203, -1.6024284362792969, -1.2338619232177734, -0.8652944564819336, -0.49672794342041016, -0.12816143035888672, 0.24040508270263672, 0.6089715957641602, 0.9775381088256836, 1.346104621887207, 1.7146711349487305, 2.083237648010254, 2.4518041610717773, 2.820370674133301, 3.188937187194824, 3.5575037002563477, 3.926070213317871, 4.2946367263793945, 4.663203239440918, 5.031769752502441, 5.400336265563965, 5.768902778625488, 6.137469291687012, 6.506035804748535, 6.874602317810059, 7.243168830871582, 7.6117353439331055, 7.980301856994629, 8.348868370056152, 8.717434883117676, 9.0860013961792, 9.454567909240723, 9.823134422302246, 10.19170093536377, 10.560267448425293, 10.928833961486816]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 12.0, 9.0, 11.0, 21.0, 39.0, 45.0, 58.0, 78.0, 147.0, 202.0, 299.0, 508.0, 823.0, 1472.0, 2902.0, 6158.0, 16015.0, 52087.0, 226048.0, 520460.0, 158590.0, 39090.0, 12536.0, 5096.0, 2400.0, 1313.0, 739.0, 449.0, 326.0, 188.0, 130.0, 83.0, 66.0, 40.0, 35.0, 15.0, 15.0, 15.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-14.390625, -13.9462890625, -13.501953125, -13.0576171875, -12.61328125, -12.1689453125, -11.724609375, -11.2802734375, -10.8359375, -10.3916015625, -9.947265625, -9.5029296875, -9.05859375, -8.6142578125, -8.169921875, -7.7255859375, -7.28125, -6.8369140625, -6.392578125, -5.9482421875, -5.50390625, -5.0595703125, -4.615234375, -4.1708984375, -3.7265625, -3.2822265625, -2.837890625, -2.3935546875, -1.94921875, -1.5048828125, -1.060546875, -0.6162109375, -0.171875, 0.2724609375, 0.716796875, 1.1611328125, 1.60546875, 2.0498046875, 2.494140625, 2.9384765625, 3.3828125, 3.8271484375, 4.271484375, 4.7158203125, 5.16015625, 5.6044921875, 6.048828125, 6.4931640625, 6.9375, 7.3818359375, 7.826171875, 8.2705078125, 8.71484375, 9.1591796875, 9.603515625, 10.0478515625, 10.4921875, 10.9365234375, 11.380859375, 11.8251953125, 12.26953125, 12.7138671875, 13.158203125, 13.6025390625, 14.046875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 13.0, 13.0, 20.0, 28.0, 21.0, 53.0, 46.0, 73.0, 97.0, 92.0, 93.0, 94.0, 67.0, 70.0, 54.0, 45.0, 24.0, 23.0, 16.0, 10.0, 11.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.609375, -1.5593719482421875, -1.509368896484375, -1.4593658447265625, -1.40936279296875, -1.3593597412109375, -1.309356689453125, -1.2593536376953125, -1.2093505859375, -1.1593475341796875, -1.109344482421875, -1.0593414306640625, -1.00933837890625, -0.9593353271484375, -0.909332275390625, -0.8593292236328125, -0.809326171875, -0.7593231201171875, -0.709320068359375, -0.6593170166015625, -0.60931396484375, -0.5593109130859375, -0.509307861328125, -0.4593048095703125, -0.4093017578125, -0.3592987060546875, -0.309295654296875, -0.2592926025390625, -0.20928955078125, -0.1592864990234375, -0.109283447265625, -0.0592803955078125, -0.00927734375, 0.0407257080078125, 0.090728759765625, 0.1407318115234375, 0.19073486328125, 0.2407379150390625, 0.290740966796875, 0.3407440185546875, 0.3907470703125, 0.4407501220703125, 0.490753173828125, 0.5407562255859375, 0.59075927734375, 0.6407623291015625, 0.690765380859375, 0.7407684326171875, 0.790771484375, 0.8407745361328125, 0.890777587890625, 0.9407806396484375, 0.99078369140625, 1.0407867431640625, 1.090789794921875, 1.1407928466796875, 1.1907958984375, 1.2407989501953125, 1.290802001953125, 1.3408050537109375, 1.39080810546875, 1.4408111572265625, 1.490814208984375, 1.5408172607421875, 1.5908203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 2.0, 3.0, 3.0, 14.0, 16.0, 24.0, 25.0, 37.0, 65.0, 83.0, 134.0, 198.0, 280.0, 480.0, 786.0, 1380.0, 2688.0, 5112.0, 10677.0, 24967.0, 63447.0, 183584.0, 382351.0, 234066.0, 81278.0, 30560.0, 13097.0, 6028.0, 3080.0, 1691.0, 897.0, 490.0, 341.0, 228.0, 136.0, 91.0, 58.0, 42.0, 32.0, 21.0, 18.0, 11.0, 9.0, 7.0, 6.0, 5.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1640625, -6.93743896484375, -6.7108154296875, -6.48419189453125, -6.257568359375, -6.03094482421875, -5.8043212890625, -5.57769775390625, -5.35107421875, -5.12445068359375, -4.8978271484375, -4.67120361328125, -4.444580078125, -4.21795654296875, -3.9913330078125, -3.76470947265625, -3.5380859375, -3.31146240234375, -3.0848388671875, -2.85821533203125, -2.631591796875, -2.40496826171875, -2.1783447265625, -1.95172119140625, -1.72509765625, -1.49847412109375, -1.2718505859375, -1.04522705078125, -0.818603515625, -0.59197998046875, -0.3653564453125, -0.13873291015625, 0.087890625, 0.31451416015625, 0.5411376953125, 0.76776123046875, 0.994384765625, 1.22100830078125, 1.4476318359375, 1.67425537109375, 1.90087890625, 2.12750244140625, 2.3541259765625, 2.58074951171875, 2.807373046875, 3.03399658203125, 3.2606201171875, 3.48724365234375, 3.7138671875, 3.94049072265625, 4.1671142578125, 4.39373779296875, 4.620361328125, 4.84698486328125, 5.0736083984375, 5.30023193359375, 5.52685546875, 5.75347900390625, 5.9801025390625, 6.20672607421875, 6.433349609375, 6.65997314453125, 6.8865966796875, 7.11322021484375, 7.33984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 9.0, 11.0, 1.0, 10.0, 16.0, 16.0, 24.0, 13.0, 20.0, 27.0, 29.0, 21.0, 33.0, 33.0, 49.0, 39.0, 34.0, 53.0, 40.0, 36.0, 53.0, 40.0, 48.0, 42.0, 43.0, 43.0, 33.0, 19.0, 26.0, 29.0, 24.0, 13.0, 10.0, 10.0, 11.0, 12.0, 8.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78515625, -3.6435546875, -3.501953125, -3.3603515625, -3.21875, -3.0771484375, -2.935546875, -2.7939453125, -2.65234375, -2.5107421875, -2.369140625, -2.2275390625, -2.0859375, -1.9443359375, -1.802734375, -1.6611328125, -1.51953125, -1.3779296875, -1.236328125, -1.0947265625, -0.953125, -0.8115234375, -0.669921875, -0.5283203125, -0.38671875, -0.2451171875, -0.103515625, 0.0380859375, 0.1796875, 0.3212890625, 0.462890625, 0.6044921875, 0.74609375, 0.8876953125, 1.029296875, 1.1708984375, 1.3125, 1.4541015625, 1.595703125, 1.7373046875, 1.87890625, 2.0205078125, 2.162109375, 2.3037109375, 2.4453125, 2.5869140625, 2.728515625, 2.8701171875, 3.01171875, 3.1533203125, 3.294921875, 3.4365234375, 3.578125, 3.7197265625, 3.861328125, 4.0029296875, 4.14453125, 4.2861328125, 4.427734375, 4.5693359375, 4.7109375, 4.8525390625, 4.994140625, 5.1357421875, 5.27734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 13.0, 19.0, 18.0, 33.0, 78.0, 109.0, 230.0, 476.0, 1281.0, 3836.0, 16504.0, 118623.0, 681952.0, 193888.0, 23582.0, 5123.0, 1595.0, 639.0, 253.0, 119.0, 62.0, 43.0, 29.0, 16.0, 13.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9609375, -14.3985595703125, -13.836181640625, -13.2738037109375, -12.71142578125, -12.1490478515625, -11.586669921875, -11.0242919921875, -10.4619140625, -9.8995361328125, -9.337158203125, -8.7747802734375, -8.21240234375, -7.6500244140625, -7.087646484375, -6.5252685546875, -5.962890625, -5.4005126953125, -4.838134765625, -4.2757568359375, -3.71337890625, -3.1510009765625, -2.588623046875, -2.0262451171875, -1.4638671875, -0.9014892578125, -0.339111328125, 0.2232666015625, 0.78564453125, 1.3480224609375, 1.910400390625, 2.4727783203125, 3.03515625, 3.5975341796875, 4.159912109375, 4.7222900390625, 5.28466796875, 5.8470458984375, 6.409423828125, 6.9718017578125, 7.5341796875, 8.0965576171875, 8.658935546875, 9.2213134765625, 9.78369140625, 10.3460693359375, 10.908447265625, 11.4708251953125, 12.033203125, 12.5955810546875, 13.157958984375, 13.7203369140625, 14.28271484375, 14.8450927734375, 15.407470703125, 15.9698486328125, 16.5322265625, 17.0946044921875, 17.656982421875, 18.2193603515625, 18.78173828125, 19.3441162109375, 19.906494140625, 20.4688720703125, 21.03125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 8.0, 10.0, 18.0, 23.0, 51.0, 113.0, 168.0, 211.0, 170.0, 100.0, 51.0, 27.0, 11.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0018835067749023438, -0.0018330961465835571, -0.0017826855182647705, -0.0017322748899459839, -0.0016818642616271973, -0.0016314536333084106, -0.001581043004989624, -0.0015306323766708374, -0.0014802217483520508, -0.0014298111200332642, -0.0013794004917144775, -0.001328989863395691, -0.0012785792350769043, -0.0012281686067581177, -0.001177757978439331, -0.0011273473501205444, -0.0010769367218017578, -0.0010265260934829712, -0.0009761154651641846, -0.000925704836845398, -0.0008752942085266113, -0.0008248835802078247, -0.0007744729518890381, -0.0007240623235702515, -0.0006736516952514648, -0.0006232410669326782, -0.0005728304386138916, -0.000522419810295105, -0.00047200918197631836, -0.00042159855365753174, -0.0003711879253387451, -0.0003207772970199585, -0.0002703666687011719, -0.00021995604038238525, -0.00016954541206359863, -0.00011913478374481201, -6.872415542602539e-05, -1.831352710723877e-05, 3.209710121154785e-05, 8.250772953033447e-05, 0.0001329183578491211, 0.00018332898616790771, 0.00023373961448669434, 0.00028415024280548096, 0.0003345608711242676, 0.0003849714994430542, 0.0004353821277618408, 0.00048579275608062744, 0.0005362033843994141, 0.0005866140127182007, 0.0006370246410369873, 0.0006874352693557739, 0.0007378458976745605, 0.0007882565259933472, 0.0008386671543121338, 0.0008890777826309204, 0.000939488410949707, 0.0009898990392684937, 0.0010403096675872803, 0.001090720295906067, 0.0011411309242248535, 0.0011915415525436401, 0.0012419521808624268, 0.0012923628091812134, 0.0013427734375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 8.0, 4.0, 15.0, 17.0, 22.0, 34.0, 62.0, 75.0, 132.0, 196.0, 336.0, 577.0, 1057.0, 1986.0, 4257.0, 9796.0, 26024.0, 85984.0, 296461.0, 409349.0, 145188.0, 41003.0, 14199.0, 5888.0, 2693.0, 1362.0, 754.0, 430.0, 244.0, 153.0, 85.0, 55.0, 45.0, 25.0, 19.0, 7.0, 9.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.734375, -8.4246826171875, -8.114990234375, -7.8052978515625, -7.49560546875, -7.1859130859375, -6.876220703125, -6.5665283203125, -6.2568359375, -5.9471435546875, -5.637451171875, -5.3277587890625, -5.01806640625, -4.7083740234375, -4.398681640625, -4.0889892578125, -3.779296875, -3.4696044921875, -3.159912109375, -2.8502197265625, -2.54052734375, -2.2308349609375, -1.921142578125, -1.6114501953125, -1.3017578125, -0.9920654296875, -0.682373046875, -0.3726806640625, -0.06298828125, 0.2467041015625, 0.556396484375, 0.8660888671875, 1.17578125, 1.4854736328125, 1.795166015625, 2.1048583984375, 2.41455078125, 2.7242431640625, 3.033935546875, 3.3436279296875, 3.6533203125, 3.9630126953125, 4.272705078125, 4.5823974609375, 4.89208984375, 5.2017822265625, 5.511474609375, 5.8211669921875, 6.130859375, 6.4405517578125, 6.750244140625, 7.0599365234375, 7.36962890625, 7.6793212890625, 7.989013671875, 8.2987060546875, 8.6083984375, 8.9180908203125, 9.227783203125, 9.5374755859375, 9.84716796875, 10.1568603515625, 10.466552734375, 10.7762451171875, 11.0859375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 5.0, 4.0, 2.0, 5.0, 6.0, 9.0, 14.0, 14.0, 24.0, 24.0, 51.0, 38.0, 58.0, 60.0, 83.0, 91.0, 94.0, 93.0, 76.0, 54.0, 53.0, 33.0, 28.0, 19.0, 14.0, 8.0, 7.0, 12.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.34765625, -6.149658203125, -5.95166015625, -5.753662109375, -5.5556640625, -5.357666015625, -5.15966796875, -4.961669921875, -4.763671875, -4.565673828125, -4.36767578125, -4.169677734375, -3.9716796875, -3.773681640625, -3.57568359375, -3.377685546875, -3.1796875, -2.981689453125, -2.78369140625, -2.585693359375, -2.3876953125, -2.189697265625, -1.99169921875, -1.793701171875, -1.595703125, -1.397705078125, -1.19970703125, -1.001708984375, -0.8037109375, -0.605712890625, -0.40771484375, -0.209716796875, -0.01171875, 0.186279296875, 0.38427734375, 0.582275390625, 0.7802734375, 0.978271484375, 1.17626953125, 1.374267578125, 1.572265625, 1.770263671875, 1.96826171875, 2.166259765625, 2.3642578125, 2.562255859375, 2.76025390625, 2.958251953125, 3.15625, 3.354248046875, 3.55224609375, 3.750244140625, 3.9482421875, 4.146240234375, 4.34423828125, 4.542236328125, 4.740234375, 4.938232421875, 5.13623046875, 5.334228515625, 5.5322265625, 5.730224609375, 5.92822265625, 6.126220703125, 6.32421875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 5.0, 4.0, 7.0, 8.0, 27.0, 56.0, 124.0, 214.0, 277.0, 155.0, 70.0, 35.0, 12.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.39089965820312, -119.12557983398438, -115.8602523803711, -112.59493255615234, -109.32960510253906, -106.06428527832031, -102.79896545410156, -99.53364562988281, -96.26831817626953, -93.00299835205078, -89.7376708984375, -86.47235107421875, -83.20703125, -79.94170379638672, -76.67638397216797, -73.41105651855469, -70.14573669433594, -66.88041687011719, -63.615089416503906, -60.349769592285156, -57.08444595336914, -53.819122314453125, -50.553802490234375, -47.28847885131836, -44.023155212402344, -40.75783157348633, -37.49250793457031, -34.22718811035156, -30.961864471435547, -27.69654083251953, -24.43121910095215, -21.165897369384766, -17.90058135986328, -14.635258674621582, -11.369935989379883, -8.104613304138184, -4.839290618896484, -1.5739669799804688, 1.691354751586914, 4.956676483154297, 8.222000122070312, 11.487322807312012, 14.752645492553711, 18.017967224121094, 21.28329086303711, 24.548614501953125, 27.813936233520508, 31.07925796508789, 34.344581604003906, 37.60990524291992, 40.87522888183594, 44.14054870605469, 47.4058723449707, 50.67119598388672, 53.93651580810547, 57.201839447021484, 60.4671630859375, 63.732486724853516, 66.99781036376953, 70.26313018798828, 73.52845764160156, 76.79377746582031, 80.05909729003906, 83.32441711425781, 86.5897445678711]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 8.0, 6.0, 9.0, 20.0, 21.0, 31.0, 45.0, 39.0, 56.0, 64.0, 61.0, 82.0, 77.0, 67.0, 83.0, 69.0, 55.0, 45.0, 36.0, 25.0, 16.0, 22.0, 10.0, 6.0, 8.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-40.96773147583008, -39.429840087890625, -37.89194869995117, -36.35405731201172, -34.81616973876953, -33.27827835083008, -31.740386962890625, -30.202495574951172, -28.66460609436035, -27.1267147064209, -25.588825225830078, -24.050933837890625, -22.513042449951172, -20.97515296936035, -19.4372615814209, -17.899372100830078, -16.361480712890625, -14.823590278625488, -13.285699844360352, -11.747808456420898, -10.209918022155762, -8.672027587890625, -7.134136199951172, -5.596245765686035, -4.058355331420898, -2.5204646587371826, -0.9825739860534668, 0.5553169250488281, 2.093207359313965, 3.6310977935791016, 5.168989181518555, 6.706879615783691, 8.244773864746094, 9.78266429901123, 11.320554733276367, 12.85844612121582, 14.396336555480957, 15.934226989746094, 17.472118377685547, 19.010009765625, 20.54789924621582, 22.085790634155273, 23.623680114746094, 25.161571502685547, 26.699462890625, 28.23735237121582, 29.775243759155273, 31.313133239746094, 32.85102462768555, 34.388916015625, 35.92680740356445, 37.464698791503906, 39.002586364746094, 40.54047775268555, 42.078369140625, 43.61626052856445, 45.154151916503906, 46.69204330444336, 48.22993469238281, 49.767822265625, 51.30571365356445, 52.843605041503906, 54.38149642944336, 55.91938781738281, 57.457275390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 11.0, 17.0, 27.0, 33.0, 41.0, 67.0, 94.0, 138.0, 232.0, 317.0, 553.0, 950.0, 1862.0, 3941.0, 9819.0, 31282.0, 171358.0, 3517087.0, 385072.0, 49199.0, 13354.0, 4814.0, 1901.0, 939.0, 477.0, 256.0, 157.0, 109.0, 65.0, 33.0, 21.0, 14.0, 10.0, 8.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.34375, -34.405029296875, -33.46630859375, -32.527587890625, -31.5888671875, -30.650146484375, -29.71142578125, -28.772705078125, -27.833984375, -26.895263671875, -25.95654296875, -25.017822265625, -24.0791015625, -23.140380859375, -22.20166015625, -21.262939453125, -20.32421875, -19.385498046875, -18.44677734375, -17.508056640625, -16.5693359375, -15.630615234375, -14.69189453125, -13.753173828125, -12.814453125, -11.875732421875, -10.93701171875, -9.998291015625, -9.0595703125, -8.120849609375, -7.18212890625, -6.243408203125, -5.3046875, -4.365966796875, -3.42724609375, -2.488525390625, -1.5498046875, -0.611083984375, 0.32763671875, 1.266357421875, 2.205078125, 3.143798828125, 4.08251953125, 5.021240234375, 5.9599609375, 6.898681640625, 7.83740234375, 8.776123046875, 9.71484375, 10.653564453125, 11.59228515625, 12.531005859375, 13.4697265625, 14.408447265625, 15.34716796875, 16.285888671875, 17.224609375, 18.163330078125, 19.10205078125, 20.040771484375, 20.9794921875, 21.918212890625, 22.85693359375, 23.795654296875, 24.734375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 6.0, 6.0, 10.0, 22.0, 21.0, 35.0, 50.0, 54.0, 71.0, 59.0, 88.0, 98.0, 91.0, 83.0, 55.0, 51.0, 38.0, 42.0, 35.0, 27.0, 11.0, 10.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5830078125, -1.5342864990234375, -1.485565185546875, -1.4368438720703125, -1.38812255859375, -1.3394012451171875, -1.290679931640625, -1.2419586181640625, -1.1932373046875, -1.1445159912109375, -1.095794677734375, -1.0470733642578125, -0.99835205078125, -0.9496307373046875, -0.900909423828125, -0.8521881103515625, -0.803466796875, -0.7547454833984375, -0.706024169921875, -0.6573028564453125, -0.60858154296875, -0.5598602294921875, -0.511138916015625, -0.4624176025390625, -0.4136962890625, -0.3649749755859375, -0.316253662109375, -0.2675323486328125, -0.21881103515625, -0.1700897216796875, -0.121368408203125, -0.0726470947265625, -0.02392578125, 0.0247955322265625, 0.073516845703125, 0.1222381591796875, 0.17095947265625, 0.2196807861328125, 0.268402099609375, 0.3171234130859375, 0.3658447265625, 0.4145660400390625, 0.463287353515625, 0.5120086669921875, 0.56072998046875, 0.6094512939453125, 0.658172607421875, 0.7068939208984375, 0.755615234375, 0.8043365478515625, 0.853057861328125, 0.9017791748046875, 0.95050048828125, 0.9992218017578125, 1.047943115234375, 1.0966644287109375, 1.1453857421875, 1.1941070556640625, 1.242828369140625, 1.2915496826171875, 1.34027099609375, 1.3889923095703125, 1.437713623046875, 1.4864349365234375, 1.53515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 4.0, 13.0, 8.0, 15.0, 22.0, 40.0, 51.0, 73.0, 135.0, 262.0, 851.0, 5637.0, 125621.0, 3939726.0, 114882.0, 5384.0, 862.0, 287.0, 162.0, 63.0, 55.0, 47.0, 30.0, 23.0, 4.0, 8.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-78.5625, -76.6689453125, -74.775390625, -72.8818359375, -70.98828125, -69.0947265625, -67.201171875, -65.3076171875, -63.4140625, -61.5205078125, -59.626953125, -57.7333984375, -55.83984375, -53.9462890625, -52.052734375, -50.1591796875, -48.265625, -46.3720703125, -44.478515625, -42.5849609375, -40.69140625, -38.7978515625, -36.904296875, -35.0107421875, -33.1171875, -31.2236328125, -29.330078125, -27.4365234375, -25.54296875, -23.6494140625, -21.755859375, -19.8623046875, -17.96875, -16.0751953125, -14.181640625, -12.2880859375, -10.39453125, -8.5009765625, -6.607421875, -4.7138671875, -2.8203125, -0.9267578125, 0.966796875, 2.8603515625, 4.75390625, 6.6474609375, 8.541015625, 10.4345703125, 12.328125, 14.2216796875, 16.115234375, 18.0087890625, 19.90234375, 21.7958984375, 23.689453125, 25.5830078125, 27.4765625, 29.3701171875, 31.263671875, 33.1572265625, 35.05078125, 36.9443359375, 38.837890625, 40.7314453125, 42.625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 6.0, 8.0, 2.0, 3.0, 14.0, 20.0, 41.0, 32.0, 48.0, 85.0, 105.0, 182.0, 299.0, 478.0, 1160.0, 681.0, 336.0, 191.0, 120.0, 73.0, 63.0, 33.0, 36.0, 14.0, 14.0, 15.0, 6.0, 8.0, 3.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.25390625, -2.1331787109375, -2.012451171875, -1.8917236328125, -1.77099609375, -1.6502685546875, -1.529541015625, -1.4088134765625, -1.2880859375, -1.1673583984375, -1.046630859375, -0.9259033203125, -0.80517578125, -0.6844482421875, -0.563720703125, -0.4429931640625, -0.322265625, -0.2015380859375, -0.080810546875, 0.0399169921875, 0.16064453125, 0.2813720703125, 0.402099609375, 0.5228271484375, 0.6435546875, 0.7642822265625, 0.885009765625, 1.0057373046875, 1.12646484375, 1.2471923828125, 1.367919921875, 1.4886474609375, 1.609375, 1.7301025390625, 1.850830078125, 1.9715576171875, 2.09228515625, 2.2130126953125, 2.333740234375, 2.4544677734375, 2.5751953125, 2.6959228515625, 2.816650390625, 2.9373779296875, 3.05810546875, 3.1788330078125, 3.299560546875, 3.4202880859375, 3.541015625, 3.6617431640625, 3.782470703125, 3.9031982421875, 4.02392578125, 4.1446533203125, 4.265380859375, 4.3861083984375, 4.5068359375, 4.6275634765625, 4.748291015625, 4.8690185546875, 4.98974609375, 5.1104736328125, 5.231201171875, 5.3519287109375, 5.47265625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 13.0, 32.0, 95.0, 195.0, 274.0, 230.0, 99.0, 38.0, 14.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.01563262939453, -65.32146453857422, -63.627296447753906, -61.93312454223633, -60.238956451416016, -58.5447883605957, -56.850616455078125, -55.15644836425781, -53.4622802734375, -51.76811218261719, -50.073944091796875, -48.3797721862793, -46.685604095458984, -44.99143600463867, -43.297264099121094, -41.60309600830078, -39.90892791748047, -38.214759826660156, -36.520591735839844, -34.826419830322266, -33.13225173950195, -31.43808364868164, -29.743913650512695, -28.04974365234375, -26.355575561523438, -24.661407470703125, -22.96723747253418, -21.273067474365234, -19.578899383544922, -17.88473129272461, -16.190561294555664, -14.496392250061035, -12.80221939086914, -11.108050346374512, -9.413881301879883, -7.719712257385254, -6.025543212890625, -4.331374168395996, -2.637205123901367, -0.9430360794067383, 0.7511329650878906, 2.4453020095825195, 4.139471054077148, 5.833640098571777, 7.527809143066406, 9.221978187561035, 10.916147232055664, 12.610316276550293, 14.304485321044922, 15.99865436553955, 17.69282341003418, 19.386993408203125, 21.081161499023438, 22.77532958984375, 24.469499588012695, 26.16366958618164, 27.857837677001953, 29.552005767822266, 31.24617576599121, 32.940345764160156, 34.63451385498047, 36.32868194580078, 38.022850036621094, 39.71702194213867, 41.411190032958984]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 9.0, 9.0, 5.0, 12.0, 15.0, 23.0, 24.0, 25.0, 28.0, 42.0, 41.0, 54.0, 40.0, 49.0, 49.0, 55.0, 58.0, 53.0, 59.0, 58.0, 38.0, 39.0, 48.0, 41.0, 28.0, 16.0, 24.0, 12.0, 8.0, 10.0, 5.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.889745712280273, -13.383111000061035, -12.876477241516113, -12.369842529296875, -11.863208770751953, -11.356574058532715, -10.849939346313477, -10.343305587768555, -9.836670875549316, -9.330036163330078, -8.823402404785156, -8.316767692565918, -7.810133457183838, -7.303499221801758, -6.7968645095825195, -6.2902302742004395, -5.783596038818359, -5.276961803436279, -4.770327568054199, -4.263692855834961, -3.757058620452881, -3.250424385070801, -2.7437899112701416, -2.2371554374694824, -1.7305212020874023, -1.2238868474960327, -0.7172524929046631, -0.21061813831329346, 0.29601621627807617, 0.8026504516601562, 1.3092849254608154, 1.8159193992614746, 2.3225536346435547, 2.8291878700256348, 3.335822343826294, 3.842456817626953, 4.349091053009033, 4.855725288391113, 5.362360000610352, 5.868994235992432, 6.375628471374512, 6.882262706756592, 7.388896942138672, 7.89553165435791, 8.402166366577148, 8.90880012512207, 9.415434837341309, 9.922069549560547, 10.428703308105469, 10.935338020324707, 11.441971778869629, 11.948606491088867, 12.455240249633789, 12.961874961853027, 13.468509674072266, 13.975143432617188, 14.481778144836426, 14.988412857055664, 15.495046615600586, 16.001680374145508, 16.508316040039062, 17.014949798583984, 17.521583557128906, 18.02821922302246, 18.534852981567383]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 5.0, 11.0, 12.0, 15.0, 19.0, 21.0, 36.0, 37.0, 73.0, 82.0, 112.0, 171.0, 248.0, 312.0, 490.0, 813.0, 1337.0, 2583.0, 5392.0, 12289.0, 30722.0, 85097.0, 242379.0, 380915.0, 180528.0, 62449.0, 23179.0, 9411.0, 4290.0, 2110.0, 1172.0, 733.0, 457.0, 286.0, 210.0, 168.0, 107.0, 90.0, 50.0, 39.0, 26.0, 21.0, 18.0, 11.0, 8.0, 9.0, 5.0, 2.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-14.4375, -14.004638671875, -13.57177734375, -13.138916015625, -12.7060546875, -12.273193359375, -11.84033203125, -11.407470703125, -10.974609375, -10.541748046875, -10.10888671875, -9.676025390625, -9.2431640625, -8.810302734375, -8.37744140625, -7.944580078125, -7.51171875, -7.078857421875, -6.64599609375, -6.213134765625, -5.7802734375, -5.347412109375, -4.91455078125, -4.481689453125, -4.048828125, -3.615966796875, -3.18310546875, -2.750244140625, -2.3173828125, -1.884521484375, -1.45166015625, -1.018798828125, -0.5859375, -0.153076171875, 0.27978515625, 0.712646484375, 1.1455078125, 1.578369140625, 2.01123046875, 2.444091796875, 2.876953125, 3.309814453125, 3.74267578125, 4.175537109375, 4.6083984375, 5.041259765625, 5.47412109375, 5.906982421875, 6.33984375, 6.772705078125, 7.20556640625, 7.638427734375, 8.0712890625, 8.504150390625, 8.93701171875, 9.369873046875, 9.802734375, 10.235595703125, 10.66845703125, 11.101318359375, 11.5341796875, 11.967041015625, 12.39990234375, 12.832763671875, 13.265625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 8.0, 10.0, 14.0, 11.0, 13.0, 26.0, 37.0, 55.0, 73.0, 72.0, 89.0, 79.0, 77.0, 87.0, 64.0, 52.0, 53.0, 50.0, 24.0, 32.0, 17.0, 21.0, 12.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.501953125, -1.4537811279296875, -1.405609130859375, -1.3574371337890625, -1.30926513671875, -1.2610931396484375, -1.212921142578125, -1.1647491455078125, -1.1165771484375, -1.0684051513671875, -1.020233154296875, -0.9720611572265625, -0.92388916015625, -0.8757171630859375, -0.827545166015625, -0.7793731689453125, -0.731201171875, -0.6830291748046875, -0.634857177734375, -0.5866851806640625, -0.53851318359375, -0.4903411865234375, -0.442169189453125, -0.3939971923828125, -0.3458251953125, -0.2976531982421875, -0.249481201171875, -0.2013092041015625, -0.15313720703125, -0.1049652099609375, -0.056793212890625, -0.0086212158203125, 0.03955078125, 0.0877227783203125, 0.135894775390625, 0.1840667724609375, 0.23223876953125, 0.2804107666015625, 0.328582763671875, 0.3767547607421875, 0.4249267578125, 0.4730987548828125, 0.521270751953125, 0.5694427490234375, 0.61761474609375, 0.6657867431640625, 0.713958740234375, 0.7621307373046875, 0.810302734375, 0.8584747314453125, 0.906646728515625, 0.9548187255859375, 1.00299072265625, 1.0511627197265625, 1.099334716796875, 1.1475067138671875, 1.1956787109375, 1.2438507080078125, 1.292022705078125, 1.3401947021484375, 1.38836669921875, 1.4365386962890625, 1.484710693359375, 1.5328826904296875, 1.5810546875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 4.0, 7.0, 11.0, 20.0, 8.0, 29.0, 50.0, 69.0, 91.0, 198.0, 336.0, 632.0, 1410.0, 3288.0, 9417.0, 30370.0, 109789.0, 357170.0, 369956.0, 116744.0, 32311.0, 10053.0, 3612.0, 1472.0, 642.0, 304.0, 197.0, 122.0, 71.0, 43.0, 37.0, 26.0, 11.0, 10.0, 11.0, 8.0, 4.0, 4.0, 3.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-17.15625, -16.6519775390625, -16.147705078125, -15.6434326171875, -15.13916015625, -14.6348876953125, -14.130615234375, -13.6263427734375, -13.1220703125, -12.6177978515625, -12.113525390625, -11.6092529296875, -11.10498046875, -10.6007080078125, -10.096435546875, -9.5921630859375, -9.087890625, -8.5836181640625, -8.079345703125, -7.5750732421875, -7.07080078125, -6.5665283203125, -6.062255859375, -5.5579833984375, -5.0537109375, -4.5494384765625, -4.045166015625, -3.5408935546875, -3.03662109375, -2.5323486328125, -2.028076171875, -1.5238037109375, -1.01953125, -0.5152587890625, -0.010986328125, 0.4932861328125, 0.99755859375, 1.5018310546875, 2.006103515625, 2.5103759765625, 3.0146484375, 3.5189208984375, 4.023193359375, 4.5274658203125, 5.03173828125, 5.5360107421875, 6.040283203125, 6.5445556640625, 7.048828125, 7.5531005859375, 8.057373046875, 8.5616455078125, 9.06591796875, 9.5701904296875, 10.074462890625, 10.5787353515625, 11.0830078125, 11.5872802734375, 12.091552734375, 12.5958251953125, 13.10009765625, 13.6043701171875, 14.108642578125, 14.6129150390625, 15.1171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 1.0, 6.0, 9.0, 5.0, 16.0, 14.0, 23.0, 12.0, 20.0, 34.0, 20.0, 32.0, 46.0, 48.0, 52.0, 47.0, 67.0, 51.0, 50.0, 39.0, 58.0, 32.0, 33.0, 46.0, 35.0, 28.0, 19.0, 34.0, 19.0, 17.0, 18.0, 16.0, 5.0, 15.0, 4.0, 5.0, 7.0, 7.0, 3.0, 3.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.95703125, -6.7529296875, -6.548828125, -6.3447265625, -6.140625, -5.9365234375, -5.732421875, -5.5283203125, -5.32421875, -5.1201171875, -4.916015625, -4.7119140625, -4.5078125, -4.3037109375, -4.099609375, -3.8955078125, -3.69140625, -3.4873046875, -3.283203125, -3.0791015625, -2.875, -2.6708984375, -2.466796875, -2.2626953125, -2.05859375, -1.8544921875, -1.650390625, -1.4462890625, -1.2421875, -1.0380859375, -0.833984375, -0.6298828125, -0.42578125, -0.2216796875, -0.017578125, 0.1865234375, 0.390625, 0.5947265625, 0.798828125, 1.0029296875, 1.20703125, 1.4111328125, 1.615234375, 1.8193359375, 2.0234375, 2.2275390625, 2.431640625, 2.6357421875, 2.83984375, 3.0439453125, 3.248046875, 3.4521484375, 3.65625, 3.8603515625, 4.064453125, 4.2685546875, 4.47265625, 4.6767578125, 4.880859375, 5.0849609375, 5.2890625, 5.4931640625, 5.697265625, 5.9013671875, 6.10546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 9.0, 9.0, 19.0, 27.0, 38.0, 49.0, 87.0, 126.0, 177.0, 360.0, 483.0, 818.0, 1509.0, 2634.0, 5022.0, 10453.0, 24073.0, 63280.0, 213283.0, 460378.0, 172051.0, 53234.0, 20799.0, 9240.0, 4562.0, 2429.0, 1359.0, 777.0, 484.0, 262.0, 154.0, 111.0, 83.0, 47.0, 38.0, 16.0, 20.0, 16.0, 10.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.5078125, -15.0572509765625, -14.606689453125, -14.1561279296875, -13.70556640625, -13.2550048828125, -12.804443359375, -12.3538818359375, -11.9033203125, -11.4527587890625, -11.002197265625, -10.5516357421875, -10.10107421875, -9.6505126953125, -9.199951171875, -8.7493896484375, -8.298828125, -7.8482666015625, -7.397705078125, -6.9471435546875, -6.49658203125, -6.0460205078125, -5.595458984375, -5.1448974609375, -4.6943359375, -4.2437744140625, -3.793212890625, -3.3426513671875, -2.89208984375, -2.4415283203125, -1.990966796875, -1.5404052734375, -1.08984375, -0.6392822265625, -0.188720703125, 0.2618408203125, 0.71240234375, 1.1629638671875, 1.613525390625, 2.0640869140625, 2.5146484375, 2.9652099609375, 3.415771484375, 3.8663330078125, 4.31689453125, 4.7674560546875, 5.218017578125, 5.6685791015625, 6.119140625, 6.5697021484375, 7.020263671875, 7.4708251953125, 7.92138671875, 8.3719482421875, 8.822509765625, 9.2730712890625, 9.7236328125, 10.1741943359375, 10.624755859375, 11.0753173828125, 11.52587890625, 11.9764404296875, 12.427001953125, 12.8775634765625, 13.328125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 7.0, 4.0, 4.0, 7.0, 4.0, 8.0, 10.0, 13.0, 14.0, 23.0, 30.0, 50.0, 98.0, 143.0, 167.0, 147.0, 89.0, 47.0, 32.0, 26.0, 23.0, 15.0, 8.0, 9.0, 4.0, 4.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00293731689453125, -0.0028441548347473145, -0.002750992774963379, -0.0026578307151794434, -0.002564668655395508, -0.0024715065956115723, -0.0023783445358276367, -0.002285182476043701, -0.0021920204162597656, -0.00209885835647583, -0.0020056962966918945, -0.001912534236907959, -0.0018193721771240234, -0.0017262101173400879, -0.0016330480575561523, -0.0015398859977722168, -0.0014467239379882812, -0.0013535618782043457, -0.0012603998184204102, -0.0011672377586364746, -0.001074075698852539, -0.0009809136390686035, -0.000887751579284668, -0.0007945895195007324, -0.0007014274597167969, -0.0006082653999328613, -0.0005151033401489258, -0.00042194128036499023, -0.0003287792205810547, -0.00023561716079711914, -0.0001424551010131836, -4.929304122924805e-05, 4.38690185546875e-05, 0.00013703107833862305, 0.0002301931381225586, 0.00032335519790649414, 0.0004165172576904297, 0.0005096793174743652, 0.0006028413772583008, 0.0006960034370422363, 0.0007891654968261719, 0.0008823275566101074, 0.000975489616394043, 0.0010686516761779785, 0.001161813735961914, 0.0012549757957458496, 0.0013481378555297852, 0.0014412999153137207, 0.0015344619750976562, 0.0016276240348815918, 0.0017207860946655273, 0.0018139481544494629, 0.0019071102142333984, 0.002000272274017334, 0.0020934343338012695, 0.002186596393585205, 0.0022797584533691406, 0.002372920513153076, 0.0024660825729370117, 0.0025592446327209473, 0.002652406692504883, 0.0027455687522888184, 0.002838730812072754, 0.0029318928718566895, 0.003025054931640625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 7.0, 6.0, 7.0, 9.0, 20.0, 34.0, 38.0, 64.0, 89.0, 193.0, 336.0, 791.0, 1666.0, 4231.0, 11995.0, 41794.0, 225980.0, 616219.0, 106668.0, 25193.0, 7857.0, 2916.0, 1208.0, 549.0, 301.0, 137.0, 71.0, 59.0, 29.0, 19.0, 22.0, 5.0, 10.0, 11.0, 8.0, 2.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.953125, -24.1806640625, -23.408203125, -22.6357421875, -21.86328125, -21.0908203125, -20.318359375, -19.5458984375, -18.7734375, -18.0009765625, -17.228515625, -16.4560546875, -15.68359375, -14.9111328125, -14.138671875, -13.3662109375, -12.59375, -11.8212890625, -11.048828125, -10.2763671875, -9.50390625, -8.7314453125, -7.958984375, -7.1865234375, -6.4140625, -5.6416015625, -4.869140625, -4.0966796875, -3.32421875, -2.5517578125, -1.779296875, -1.0068359375, -0.234375, 0.5380859375, 1.310546875, 2.0830078125, 2.85546875, 3.6279296875, 4.400390625, 5.1728515625, 5.9453125, 6.7177734375, 7.490234375, 8.2626953125, 9.03515625, 9.8076171875, 10.580078125, 11.3525390625, 12.125, 12.8974609375, 13.669921875, 14.4423828125, 15.21484375, 15.9873046875, 16.759765625, 17.5322265625, 18.3046875, 19.0771484375, 19.849609375, 20.6220703125, 21.39453125, 22.1669921875, 22.939453125, 23.7119140625, 24.484375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 3.0, 6.0, 7.0, 4.0, 6.0, 7.0, 8.0, 12.0, 14.0, 13.0, 20.0, 30.0, 35.0, 48.0, 55.0, 85.0, 89.0, 93.0, 89.0, 85.0, 65.0, 52.0, 38.0, 14.0, 20.0, 19.0, 8.0, 15.0, 9.0, 10.0, 5.0, 4.0, 5.0, 7.0, 2.0, 8.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.0546875, -9.7437744140625, -9.432861328125, -9.1219482421875, -8.81103515625, -8.5001220703125, -8.189208984375, -7.8782958984375, -7.5673828125, -7.2564697265625, -6.945556640625, -6.6346435546875, -6.32373046875, -6.0128173828125, -5.701904296875, -5.3909912109375, -5.080078125, -4.7691650390625, -4.458251953125, -4.1473388671875, -3.83642578125, -3.5255126953125, -3.214599609375, -2.9036865234375, -2.5927734375, -2.2818603515625, -1.970947265625, -1.6600341796875, -1.34912109375, -1.0382080078125, -0.727294921875, -0.4163818359375, -0.10546875, 0.2054443359375, 0.516357421875, 0.8272705078125, 1.13818359375, 1.4490966796875, 1.760009765625, 2.0709228515625, 2.3818359375, 2.6927490234375, 3.003662109375, 3.3145751953125, 3.62548828125, 3.9364013671875, 4.247314453125, 4.5582275390625, 4.869140625, 5.1800537109375, 5.490966796875, 5.8018798828125, 6.11279296875, 6.4237060546875, 6.734619140625, 7.0455322265625, 7.3564453125, 7.6673583984375, 7.978271484375, 8.2891845703125, 8.60009765625, 8.9110107421875, 9.221923828125, 9.5328369140625, 9.84375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 27.0, 123.0, 387.0, 342.0, 103.0, 10.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.44189453125, -143.41519165039062, -131.3885040283203, -119.36180114746094, -107.3351058959961, -95.30841064453125, -83.28170776367188, -71.25501251220703, -59.22831726074219, -47.201622009277344, -35.174922943115234, -23.148223876953125, -11.121528625488281, 0.9051666259765625, 12.931869506835938, 24.95856475830078, 36.985260009765625, 49.01195526123047, 61.03865432739258, 73.06535339355469, 85.09204864501953, 97.11874389648438, 109.14544677734375, 121.1721420288086, 133.19883728027344, 145.2255401611328, 157.25222778320312, 169.2789306640625, 181.30563354492188, 193.3323211669922, 205.35902404785156, 217.38571166992188, 229.41241455078125, 241.43911743164062, 253.46580505371094, 265.49249267578125, 277.5191955566406, 289.5458984375, 301.5726013183594, 313.59930419921875, 325.6259765625, 337.6526794433594, 349.67938232421875, 361.7060546875, 373.7327575683594, 385.75946044921875, 397.7861633300781, 409.8128662109375, 421.8395690917969, 433.86627197265625, 445.8929748535156, 457.919677734375, 469.94635009765625, 481.9730529785156, 493.999755859375, 506.0264587402344, 518.0531616210938, 530.079833984375, 542.1065673828125, 554.1332397460938, 566.1599731445312, 578.1866455078125, 590.21337890625, 602.2400512695312, 614.2667236328125]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 6.0, 10.0, 8.0, 10.0, 14.0, 19.0, 17.0, 29.0, 22.0, 45.0, 36.0, 41.0, 52.0, 63.0, 73.0, 59.0, 58.0, 60.0, 56.0, 61.0, 49.0, 39.0, 19.0, 41.0, 28.0, 23.0, 20.0, 12.0, 8.0, 7.0, 4.0, 5.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.74826431274414, -60.60056686401367, -58.45287322998047, -56.30517578125, -54.15747833251953, -52.00978088378906, -49.862083435058594, -47.71438980102539, -45.56669235229492, -43.41899490356445, -41.27130126953125, -39.12360382080078, -36.97590637207031, -34.828208923339844, -32.680511474609375, -30.532817840576172, -28.385120391845703, -26.237422943115234, -24.0897274017334, -21.942031860351562, -19.794334411621094, -17.646636962890625, -15.498941421508789, -13.351244926452637, -11.203548431396484, -9.055851936340332, -6.90815544128418, -4.760458946228027, -2.612762451171875, -0.46506595611572266, 1.6826305389404297, 3.830327033996582, 5.978019714355469, 8.125716209411621, 10.273412704467773, 12.421109199523926, 14.568805694580078, 16.716503143310547, 18.864198684692383, 21.01189422607422, 23.159591674804688, 25.307289123535156, 27.454984664916992, 29.602680206298828, 31.750377655029297, 33.898075103759766, 36.04576873779297, 38.19346618652344, 40.341163635253906, 42.488861083984375, 44.636558532714844, 46.78425216674805, 48.931949615478516, 51.079647064208984, 53.22734069824219, 55.375038146972656, 57.522735595703125, 59.670433044433594, 61.81813049316406, 63.965824127197266, 66.113525390625, 68.26121520996094, 70.4089126586914, 72.55661010742188, 74.70430755615234]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 11.0, 14.0, 16.0, 14.0, 30.0, 37.0, 37.0, 51.0, 63.0, 91.0, 119.0, 163.0, 245.0, 349.0, 552.0, 828.0, 1403.0, 2474.0, 4924.0, 11049.0, 29564.0, 102348.0, 641936.0, 3088973.0, 221380.0, 54306.0, 18161.0, 7491.0, 3423.0, 1734.0, 956.0, 589.0, 318.0, 213.0, 123.0, 84.0, 67.0, 31.0, 38.0, 17.0, 18.0, 7.0, 10.0, 7.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.578125, -26.817138671875, -26.05615234375, -25.295166015625, -24.5341796875, -23.773193359375, -23.01220703125, -22.251220703125, -21.490234375, -20.729248046875, -19.96826171875, -19.207275390625, -18.4462890625, -17.685302734375, -16.92431640625, -16.163330078125, -15.40234375, -14.641357421875, -13.88037109375, -13.119384765625, -12.3583984375, -11.597412109375, -10.83642578125, -10.075439453125, -9.314453125, -8.553466796875, -7.79248046875, -7.031494140625, -6.2705078125, -5.509521484375, -4.74853515625, -3.987548828125, -3.2265625, -2.465576171875, -1.70458984375, -0.943603515625, -0.1826171875, 0.578369140625, 1.33935546875, 2.100341796875, 2.861328125, 3.622314453125, 4.38330078125, 5.144287109375, 5.9052734375, 6.666259765625, 7.42724609375, 8.188232421875, 8.94921875, 9.710205078125, 10.47119140625, 11.232177734375, 11.9931640625, 12.754150390625, 13.51513671875, 14.276123046875, 15.037109375, 15.798095703125, 16.55908203125, 17.320068359375, 18.0810546875, 18.842041015625, 19.60302734375, 20.364013671875, 21.125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 16.0, 16.0, 21.0, 16.0, 31.0, 40.0, 48.0, 46.0, 56.0, 73.0, 80.0, 68.0, 76.0, 66.0, 57.0, 54.0, 55.0, 42.0, 29.0, 26.0, 19.0, 10.0, 6.0, 11.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.048828125, -1.99273681640625, -1.9366455078125, -1.88055419921875, -1.824462890625, -1.76837158203125, -1.7122802734375, -1.65618896484375, -1.60009765625, -1.54400634765625, -1.4879150390625, -1.43182373046875, -1.375732421875, -1.31964111328125, -1.2635498046875, -1.20745849609375, -1.1513671875, -1.09527587890625, -1.0391845703125, -0.98309326171875, -0.927001953125, -0.87091064453125, -0.8148193359375, -0.75872802734375, -0.70263671875, -0.64654541015625, -0.5904541015625, -0.53436279296875, -0.478271484375, -0.42218017578125, -0.3660888671875, -0.30999755859375, -0.25390625, -0.19781494140625, -0.1417236328125, -0.08563232421875, -0.029541015625, 0.02655029296875, 0.0826416015625, 0.13873291015625, 0.19482421875, 0.25091552734375, 0.3070068359375, 0.36309814453125, 0.419189453125, 0.47528076171875, 0.5313720703125, 0.58746337890625, 0.6435546875, 0.69964599609375, 0.7557373046875, 0.81182861328125, 0.867919921875, 0.92401123046875, 0.9801025390625, 1.03619384765625, 1.09228515625, 1.14837646484375, 1.2044677734375, 1.26055908203125, 1.316650390625, 1.37274169921875, 1.4288330078125, 1.48492431640625, 1.541015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 6.0, 9.0, 7.0, 18.0, 21.0, 31.0, 42.0, 74.0, 133.0, 181.0, 342.0, 619.0, 1351.0, 3009.0, 7840.0, 22922.0, 84524.0, 462288.0, 3030754.0, 458895.0, 84499.0, 23118.0, 7654.0, 3055.0, 1325.0, 672.0, 329.0, 221.0, 110.0, 67.0, 53.0, 31.0, 27.0, 18.0, 10.0, 7.0, 10.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.578125, -23.7978515625, -23.017578125, -22.2373046875, -21.45703125, -20.6767578125, -19.896484375, -19.1162109375, -18.3359375, -17.5556640625, -16.775390625, -15.9951171875, -15.21484375, -14.4345703125, -13.654296875, -12.8740234375, -12.09375, -11.3134765625, -10.533203125, -9.7529296875, -8.97265625, -8.1923828125, -7.412109375, -6.6318359375, -5.8515625, -5.0712890625, -4.291015625, -3.5107421875, -2.73046875, -1.9501953125, -1.169921875, -0.3896484375, 0.390625, 1.1708984375, 1.951171875, 2.7314453125, 3.51171875, 4.2919921875, 5.072265625, 5.8525390625, 6.6328125, 7.4130859375, 8.193359375, 8.9736328125, 9.75390625, 10.5341796875, 11.314453125, 12.0947265625, 12.875, 13.6552734375, 14.435546875, 15.2158203125, 15.99609375, 16.7763671875, 17.556640625, 18.3369140625, 19.1171875, 19.8974609375, 20.677734375, 21.4580078125, 22.23828125, 23.0185546875, 23.798828125, 24.5791015625, 25.359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 8.0, 13.0, 19.0, 28.0, 38.0, 50.0, 65.0, 130.0, 165.0, 343.0, 602.0, 1345.0, 492.0, 303.0, 143.0, 88.0, 84.0, 40.0, 36.0, 17.0, 21.0, 11.0, 6.0, 7.0, 6.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.260009765625, -5.07470703125, -4.889404296875, -4.7041015625, -4.518798828125, -4.33349609375, -4.148193359375, -3.962890625, -3.777587890625, -3.59228515625, -3.406982421875, -3.2216796875, -3.036376953125, -2.85107421875, -2.665771484375, -2.48046875, -2.295166015625, -2.10986328125, -1.924560546875, -1.7392578125, -1.553955078125, -1.36865234375, -1.183349609375, -0.998046875, -0.812744140625, -0.62744140625, -0.442138671875, -0.2568359375, -0.071533203125, 0.11376953125, 0.299072265625, 0.484375, 0.669677734375, 0.85498046875, 1.040283203125, 1.2255859375, 1.410888671875, 1.59619140625, 1.781494140625, 1.966796875, 2.152099609375, 2.33740234375, 2.522705078125, 2.7080078125, 2.893310546875, 3.07861328125, 3.263916015625, 3.44921875, 3.634521484375, 3.81982421875, 4.005126953125, 4.1904296875, 4.375732421875, 4.56103515625, 4.746337890625, 4.931640625, 5.116943359375, 5.30224609375, 5.487548828125, 5.6728515625, 5.858154296875, 6.04345703125, 6.228759765625, 6.4140625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 14.0, 35.0, 116.0, 288.0, 342.0, 154.0, 43.0, 13.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-191.66848754882812, -188.0599365234375, -184.45138549804688, -180.84283447265625, -177.23426818847656, -173.62571716308594, -170.0171661376953, -166.4086151123047, -162.80006408691406, -159.19151306152344, -155.5829620361328, -151.97439575195312, -148.3658447265625, -144.75729370117188, -141.14874267578125, -137.54019165039062, -133.931640625, -130.32308959960938, -126.71453094482422, -123.1059799194336, -119.49742889404297, -115.88887023925781, -112.28031921386719, -108.67176818847656, -105.06320190429688, -101.45465087890625, -97.8460922241211, -94.23754119873047, -90.62899017333984, -87.02043151855469, -83.41188049316406, -79.80332946777344, -76.19478607177734, -72.58623504638672, -68.97767639160156, -65.36912536621094, -61.76057434082031, -58.15201950073242, -54.54346466064453, -50.934913635253906, -47.326358795166016, -43.717803955078125, -40.1092529296875, -36.50069808959961, -32.89214324951172, -29.283592224121094, -25.675037384033203, -22.066484451293945, -18.457931518554688, -14.84937858581543, -11.240824699401855, -7.632270812988281, -4.023717880249023, -0.4151649475097656, 3.193389892578125, 6.801942825317383, 10.41049575805664, 14.019048690795898, 17.627601623535156, 21.236156463623047, 24.844709396362305, 28.453262329101562, 32.06181716918945, 35.670372009277344, 39.27892303466797]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 7.0, 15.0, 23.0, 17.0, 25.0, 37.0, 22.0, 32.0, 35.0, 43.0, 40.0, 43.0, 51.0, 50.0, 55.0, 64.0, 70.0, 52.0, 44.0, 39.0, 33.0, 38.0, 41.0, 29.0, 17.0, 21.0, 16.0, 12.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.077171325683594, -25.220531463623047, -24.3638916015625, -23.507251739501953, -22.650611877441406, -21.79397201538086, -20.937332153320312, -20.080692291259766, -19.22405242919922, -18.367412567138672, -17.510772705078125, -16.654132843017578, -15.797492980957031, -14.940853118896484, -14.084214210510254, -13.227574348449707, -12.370935440063477, -11.51429557800293, -10.657655715942383, -9.801015853881836, -8.944375991821289, -8.087736129760742, -7.231097221374512, -6.374457359313965, -5.517817497253418, -4.661177635192871, -3.8045380115509033, -2.9478983879089355, -2.0912585258483887, -1.2346186637878418, -0.3779792785644531, 0.47866058349609375, 1.3353004455566406, 2.1919403076171875, 3.0485799312591553, 3.905219554901123, 4.76185941696167, 5.618499279022217, 6.4751386642456055, 7.331778526306152, 8.1884183883667, 9.045058250427246, 9.901698112487793, 10.758337020874023, 11.61497688293457, 12.471616744995117, 13.328256607055664, 14.184896469116211, 15.041536331176758, 15.898176193237305, 16.75481605529785, 17.6114559173584, 18.468095779418945, 19.324735641479492, 20.181373596191406, 21.038013458251953, 21.8946533203125, 22.751293182373047, 23.607933044433594, 24.46457290649414, 25.321212768554688, 26.177852630615234, 27.03449249267578, 27.891132354736328, 28.747772216796875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 13.0, 9.0, 11.0, 17.0, 30.0, 45.0, 52.0, 77.0, 111.0, 136.0, 216.0, 301.0, 443.0, 665.0, 1079.0, 1789.0, 3345.0, 6502.0, 13703.0, 30325.0, 67256.0, 144290.0, 259193.0, 254869.0, 140649.0, 65510.0, 29774.0, 13625.0, 6406.0, 3168.0, 1839.0, 1021.0, 648.0, 454.0, 292.0, 221.0, 125.0, 98.0, 62.0, 56.0, 36.0, 22.0, 20.0, 16.0, 9.0, 5.0, 4.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4296875, -11.060791015625, -10.69189453125, -10.322998046875, -9.9541015625, -9.585205078125, -9.21630859375, -8.847412109375, -8.478515625, -8.109619140625, -7.74072265625, -7.371826171875, -7.0029296875, -6.634033203125, -6.26513671875, -5.896240234375, -5.52734375, -5.158447265625, -4.78955078125, -4.420654296875, -4.0517578125, -3.682861328125, -3.31396484375, -2.945068359375, -2.576171875, -2.207275390625, -1.83837890625, -1.469482421875, -1.1005859375, -0.731689453125, -0.36279296875, 0.006103515625, 0.375, 0.743896484375, 1.11279296875, 1.481689453125, 1.8505859375, 2.219482421875, 2.58837890625, 2.957275390625, 3.326171875, 3.695068359375, 4.06396484375, 4.432861328125, 4.8017578125, 5.170654296875, 5.53955078125, 5.908447265625, 6.27734375, 6.646240234375, 7.01513671875, 7.384033203125, 7.7529296875, 8.121826171875, 8.49072265625, 8.859619140625, 9.228515625, 9.597412109375, 9.96630859375, 10.335205078125, 10.7041015625, 11.072998046875, 11.44189453125, 11.810791015625, 12.1796875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 13.0, 11.0, 17.0, 25.0, 30.0, 24.0, 38.0, 41.0, 42.0, 56.0, 70.0, 69.0, 69.0, 65.0, 74.0, 47.0, 59.0, 38.0, 39.0, 42.0, 28.0, 30.0, 12.0, 14.0, 11.0, 6.0, 4.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9609375, -1.896820068359375, -1.83270263671875, -1.768585205078125, -1.7044677734375, -1.640350341796875, -1.57623291015625, -1.512115478515625, -1.447998046875, -1.383880615234375, -1.31976318359375, -1.255645751953125, -1.1915283203125, -1.127410888671875, -1.06329345703125, -0.999176025390625, -0.93505859375, -0.870941162109375, -0.80682373046875, -0.742706298828125, -0.6785888671875, -0.614471435546875, -0.55035400390625, -0.486236572265625, -0.422119140625, -0.358001708984375, -0.29388427734375, -0.229766845703125, -0.1656494140625, -0.101531982421875, -0.03741455078125, 0.026702880859375, 0.0908203125, 0.154937744140625, 0.21905517578125, 0.283172607421875, 0.3472900390625, 0.411407470703125, 0.47552490234375, 0.539642333984375, 0.603759765625, 0.667877197265625, 0.73199462890625, 0.796112060546875, 0.8602294921875, 0.924346923828125, 0.98846435546875, 1.052581787109375, 1.11669921875, 1.180816650390625, 1.24493408203125, 1.309051513671875, 1.3731689453125, 1.437286376953125, 1.50140380859375, 1.565521240234375, 1.629638671875, 1.693756103515625, 1.75787353515625, 1.821990966796875, 1.8861083984375, 1.950225830078125, 2.01434326171875, 2.078460693359375, 2.142578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 13.0, 11.0, 18.0, 21.0, 25.0, 41.0, 74.0, 88.0, 153.0, 245.0, 361.0, 667.0, 1269.0, 2703.0, 5892.0, 14957.0, 42767.0, 129026.0, 354167.0, 322037.0, 112547.0, 37888.0, 13226.0, 5278.0, 2305.0, 1156.0, 641.0, 337.0, 227.0, 140.0, 88.0, 57.0, 39.0, 17.0, 23.0, 16.0, 10.0, 3.0, 4.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-20.375, -19.80810546875, -19.2412109375, -18.67431640625, -18.107421875, -17.54052734375, -16.9736328125, -16.40673828125, -15.83984375, -15.27294921875, -14.7060546875, -14.13916015625, -13.572265625, -13.00537109375, -12.4384765625, -11.87158203125, -11.3046875, -10.73779296875, -10.1708984375, -9.60400390625, -9.037109375, -8.47021484375, -7.9033203125, -7.33642578125, -6.76953125, -6.20263671875, -5.6357421875, -5.06884765625, -4.501953125, -3.93505859375, -3.3681640625, -2.80126953125, -2.234375, -1.66748046875, -1.1005859375, -0.53369140625, 0.033203125, 0.60009765625, 1.1669921875, 1.73388671875, 2.30078125, 2.86767578125, 3.4345703125, 4.00146484375, 4.568359375, 5.13525390625, 5.7021484375, 6.26904296875, 6.8359375, 7.40283203125, 7.9697265625, 8.53662109375, 9.103515625, 9.67041015625, 10.2373046875, 10.80419921875, 11.37109375, 11.93798828125, 12.5048828125, 13.07177734375, 13.638671875, 14.20556640625, 14.7724609375, 15.33935546875, 15.90625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 7.0, 5.0, 9.0, 1.0, 11.0, 9.0, 12.0, 13.0, 12.0, 20.0, 22.0, 37.0, 32.0, 32.0, 34.0, 30.0, 57.0, 55.0, 56.0, 48.0, 49.0, 51.0, 48.0, 49.0, 30.0, 40.0, 41.0, 36.0, 33.0, 23.0, 23.0, 13.0, 12.0, 7.0, 9.0, 7.0, 7.0, 5.0, 3.0, 6.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.7265625, -10.3955078125, -10.064453125, -9.7333984375, -9.40234375, -9.0712890625, -8.740234375, -8.4091796875, -8.078125, -7.7470703125, -7.416015625, -7.0849609375, -6.75390625, -6.4228515625, -6.091796875, -5.7607421875, -5.4296875, -5.0986328125, -4.767578125, -4.4365234375, -4.10546875, -3.7744140625, -3.443359375, -3.1123046875, -2.78125, -2.4501953125, -2.119140625, -1.7880859375, -1.45703125, -1.1259765625, -0.794921875, -0.4638671875, -0.1328125, 0.1982421875, 0.529296875, 0.8603515625, 1.19140625, 1.5224609375, 1.853515625, 2.1845703125, 2.515625, 2.8466796875, 3.177734375, 3.5087890625, 3.83984375, 4.1708984375, 4.501953125, 4.8330078125, 5.1640625, 5.4951171875, 5.826171875, 6.1572265625, 6.48828125, 6.8193359375, 7.150390625, 7.4814453125, 7.8125, 8.1435546875, 8.474609375, 8.8056640625, 9.13671875, 9.4677734375, 9.798828125, 10.1298828125, 10.4609375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 14.0, 15.0, 25.0, 47.0, 89.0, 146.0, 299.0, 617.0, 1197.0, 2877.0, 6556.0, 16159.0, 45645.0, 162947.0, 544793.0, 187025.0, 49784.0, 17621.0, 6957.0, 3144.0, 1333.0, 633.0, 313.0, 144.0, 68.0, 42.0, 23.0, 17.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9921875, -14.4669189453125, -13.941650390625, -13.4163818359375, -12.89111328125, -12.3658447265625, -11.840576171875, -11.3153076171875, -10.7900390625, -10.2647705078125, -9.739501953125, -9.2142333984375, -8.68896484375, -8.1636962890625, -7.638427734375, -7.1131591796875, -6.587890625, -6.0626220703125, -5.537353515625, -5.0120849609375, -4.48681640625, -3.9615478515625, -3.436279296875, -2.9110107421875, -2.3857421875, -1.8604736328125, -1.335205078125, -0.8099365234375, -0.28466796875, 0.2406005859375, 0.765869140625, 1.2911376953125, 1.81640625, 2.3416748046875, 2.866943359375, 3.3922119140625, 3.91748046875, 4.4427490234375, 4.968017578125, 5.4932861328125, 6.0185546875, 6.5438232421875, 7.069091796875, 7.5943603515625, 8.11962890625, 8.6448974609375, 9.170166015625, 9.6954345703125, 10.220703125, 10.7459716796875, 11.271240234375, 11.7965087890625, 12.32177734375, 12.8470458984375, 13.372314453125, 13.8975830078125, 14.4228515625, 14.9481201171875, 15.473388671875, 15.9986572265625, 16.52392578125, 17.0491943359375, 17.574462890625, 18.0997314453125, 18.625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 3.0, 7.0, 5.0, 13.0, 22.0, 19.0, 29.0, 54.0, 46.0, 78.0, 148.0, 173.0, 101.0, 84.0, 43.0, 38.0, 27.0, 22.0, 19.0, 12.0, 14.0, 9.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00264739990234375, -0.0025568604469299316, -0.0024663209915161133, -0.002375781536102295, -0.0022852420806884766, -0.002194702625274658, -0.00210416316986084, -0.0020136237144470215, -0.0019230842590332031, -0.0018325448036193848, -0.0017420053482055664, -0.001651465892791748, -0.0015609264373779297, -0.0014703869819641113, -0.001379847526550293, -0.0012893080711364746, -0.0011987686157226562, -0.0011082291603088379, -0.0010176897048950195, -0.0009271502494812012, -0.0008366107940673828, -0.0007460713386535645, -0.0006555318832397461, -0.0005649924278259277, -0.0004744529724121094, -0.000383913516998291, -0.00029337406158447266, -0.0002028346061706543, -0.00011229515075683594, -2.1755695343017578e-05, 6.878376007080078e-05, 0.00015932321548461914, 0.0002498626708984375, 0.00034040212631225586, 0.0004309415817260742, 0.0005214810371398926, 0.0006120204925537109, 0.0007025599479675293, 0.0007930994033813477, 0.000883638858795166, 0.0009741783142089844, 0.0010647177696228027, 0.001155257225036621, 0.0012457966804504395, 0.0013363361358642578, 0.0014268755912780762, 0.0015174150466918945, 0.0016079545021057129, 0.0016984939575195312, 0.0017890334129333496, 0.001879572868347168, 0.0019701123237609863, 0.0020606517791748047, 0.002151191234588623, 0.0022417306900024414, 0.0023322701454162598, 0.002422809600830078, 0.0025133490562438965, 0.002603888511657715, 0.002694427967071533, 0.0027849674224853516, 0.00287550687789917, 0.0029660463333129883, 0.0030565857887268066, 0.003147125244140625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 6.0, 13.0, 9.0, 21.0, 28.0, 37.0, 48.0, 62.0, 109.0, 144.0, 250.0, 436.0, 720.0, 1305.0, 2488.0, 5363.0, 12350.0, 32295.0, 104711.0, 503557.0, 280780.0, 64186.0, 21913.0, 9015.0, 4054.0, 2079.0, 1057.0, 578.0, 323.0, 197.0, 124.0, 82.0, 61.0, 42.0, 31.0, 16.0, 14.0, 12.0, 8.0, 10.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.84375, -16.259033203125, -15.67431640625, -15.089599609375, -14.5048828125, -13.920166015625, -13.33544921875, -12.750732421875, -12.166015625, -11.581298828125, -10.99658203125, -10.411865234375, -9.8271484375, -9.242431640625, -8.65771484375, -8.072998046875, -7.48828125, -6.903564453125, -6.31884765625, -5.734130859375, -5.1494140625, -4.564697265625, -3.97998046875, -3.395263671875, -2.810546875, -2.225830078125, -1.64111328125, -1.056396484375, -0.4716796875, 0.113037109375, 0.69775390625, 1.282470703125, 1.8671875, 2.451904296875, 3.03662109375, 3.621337890625, 4.2060546875, 4.790771484375, 5.37548828125, 5.960205078125, 6.544921875, 7.129638671875, 7.71435546875, 8.299072265625, 8.8837890625, 9.468505859375, 10.05322265625, 10.637939453125, 11.22265625, 11.807373046875, 12.39208984375, 12.976806640625, 13.5615234375, 14.146240234375, 14.73095703125, 15.315673828125, 15.900390625, 16.485107421875, 17.06982421875, 17.654541015625, 18.2392578125, 18.823974609375, 19.40869140625, 19.993408203125, 20.578125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 4.0, 10.0, 3.0, 9.0, 12.0, 9.0, 17.0, 18.0, 22.0, 26.0, 37.0, 52.0, 69.0, 107.0, 113.0, 100.0, 74.0, 63.0, 48.0, 40.0, 28.0, 16.0, 14.0, 12.0, 20.0, 16.0, 5.0, 6.0, 6.0, 2.0, 8.0, 6.0, 4.0, 5.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.640625, -10.29345703125, -9.9462890625, -9.59912109375, -9.251953125, -8.90478515625, -8.5576171875, -8.21044921875, -7.86328125, -7.51611328125, -7.1689453125, -6.82177734375, -6.474609375, -6.12744140625, -5.7802734375, -5.43310546875, -5.0859375, -4.73876953125, -4.3916015625, -4.04443359375, -3.697265625, -3.35009765625, -3.0029296875, -2.65576171875, -2.30859375, -1.96142578125, -1.6142578125, -1.26708984375, -0.919921875, -0.57275390625, -0.2255859375, 0.12158203125, 0.46875, 0.81591796875, 1.1630859375, 1.51025390625, 1.857421875, 2.20458984375, 2.5517578125, 2.89892578125, 3.24609375, 3.59326171875, 3.9404296875, 4.28759765625, 4.634765625, 4.98193359375, 5.3291015625, 5.67626953125, 6.0234375, 6.37060546875, 6.7177734375, 7.06494140625, 7.412109375, 7.75927734375, 8.1064453125, 8.45361328125, 8.80078125, 9.14794921875, 9.4951171875, 9.84228515625, 10.189453125, 10.53662109375, 10.8837890625, 11.23095703125, 11.578125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 4.0, 10.0, 11.0, 21.0, 49.0, 61.0, 116.0, 167.0, 160.0, 140.0, 123.0, 63.0, 24.0, 19.0, 11.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-184.5086669921875, -178.6202392578125, -172.7318115234375, -166.84336853027344, -160.95494079589844, -155.06651306152344, -149.17808532714844, -143.28964233398438, -137.40121459960938, -131.51278686523438, -125.62435150146484, -119.73592376708984, -113.84748840332031, -107.95906066894531, -102.07063293457031, -96.18219757080078, -90.29376983642578, -84.40534210205078, -78.51690673828125, -72.62847900390625, -66.74004364013672, -60.85161590576172, -54.96318435668945, -49.07475280761719, -43.18632125854492, -37.297889709472656, -31.40945816040039, -25.521028518676758, -19.632596969604492, -13.744165420532227, -7.855735778808594, -1.9673042297363281, 3.9211273193359375, 9.809558868408203, 15.697989463806152, 21.5864200592041, 27.474851608276367, 33.36328125, 39.251712799072266, 45.14014434814453, 51.0285758972168, 56.91700744628906, 62.80543899536133, 68.6938705444336, 74.5822982788086, 80.47073364257812, 86.35916137695312, 92.24758911132812, 98.13602447509766, 104.02445220947266, 109.91288757324219, 115.80131530761719, 121.68975067138672, 127.57817840576172, 133.46661376953125, 139.35504150390625, 145.24346923828125, 151.13189697265625, 157.02032470703125, 162.9087677001953, 168.7971954345703, 174.6856231689453, 180.5740509033203, 186.46249389648438, 192.35092163085938]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 6.0, 9.0, 12.0, 7.0, 9.0, 12.0, 10.0, 10.0, 24.0, 18.0, 29.0, 31.0, 34.0, 40.0, 46.0, 42.0, 49.0, 56.0, 46.0, 49.0, 42.0, 32.0, 45.0, 29.0, 48.0, 51.0, 35.0, 27.0, 36.0, 18.0, 13.0, 15.0, 17.0, 13.0, 7.0, 9.0, 8.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.49825286865234, -75.96744537353516, -73.43663024902344, -70.90582275390625, -68.37500762939453, -65.84420013427734, -63.31338882446289, -60.78257751464844, -58.251766204833984, -55.72095489501953, -53.19014358520508, -50.659332275390625, -48.12852478027344, -45.59770965576172, -43.06690216064453, -40.53609085083008, -38.005279541015625, -35.47446823120117, -32.94365692138672, -30.4128475189209, -27.882036209106445, -25.351224899291992, -22.820415496826172, -20.28960418701172, -17.758792877197266, -15.227981567382812, -12.697171211242676, -10.166360855102539, -7.635549545288086, -5.104738235473633, -2.573927879333496, -0.043117523193359375, 2.487701416015625, 5.01851224899292, 7.549323081970215, 10.080133438110352, 12.610944747924805, 15.141756057739258, 17.672565460205078, 20.20337677001953, 22.734188079833984, 25.264999389648438, 27.79581069946289, 30.32662010192871, 32.85742950439453, 35.38824462890625, 37.91905212402344, 40.44986343383789, 42.980674743652344, 45.5114860534668, 48.04229736328125, 50.5731086730957, 53.103919982910156, 55.634727478027344, 58.1655387878418, 60.69635009765625, 63.2271614074707, 65.75797271728516, 68.28878021240234, 70.81959533691406, 73.35040283203125, 75.88121795654297, 78.41202545166016, 80.94284057617188, 83.47364807128906]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 13.0, 8.0, 10.0, 27.0, 35.0, 41.0, 47.0, 91.0, 150.0, 291.0, 465.0, 962.0, 2151.0, 6124.0, 23506.0, 136392.0, 3568000.0, 392146.0, 47293.0, 10747.0, 3299.0, 1213.0, 549.0, 295.0, 140.0, 97.0, 60.0, 38.0, 29.0, 18.0, 12.0, 8.0, 6.0, 4.0, 4.0, 5.0, 0.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.0625, -32.02001953125, -30.9775390625, -29.93505859375, -28.892578125, -27.85009765625, -26.8076171875, -25.76513671875, -24.72265625, -23.68017578125, -22.6376953125, -21.59521484375, -20.552734375, -19.51025390625, -18.4677734375, -17.42529296875, -16.3828125, -15.34033203125, -14.2978515625, -13.25537109375, -12.212890625, -11.17041015625, -10.1279296875, -9.08544921875, -8.04296875, -7.00048828125, -5.9580078125, -4.91552734375, -3.873046875, -2.83056640625, -1.7880859375, -0.74560546875, 0.296875, 1.33935546875, 2.3818359375, 3.42431640625, 4.466796875, 5.50927734375, 6.5517578125, 7.59423828125, 8.63671875, 9.67919921875, 10.7216796875, 11.76416015625, 12.806640625, 13.84912109375, 14.8916015625, 15.93408203125, 16.9765625, 18.01904296875, 19.0615234375, 20.10400390625, 21.146484375, 22.18896484375, 23.2314453125, 24.27392578125, 25.31640625, 26.35888671875, 27.4013671875, 28.44384765625, 29.486328125, 30.52880859375, 31.5712890625, 32.61376953125, 33.65625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 8.0, 6.0, 12.0, 17.0, 18.0, 16.0, 26.0, 36.0, 40.0, 44.0, 47.0, 61.0, 64.0, 54.0, 63.0, 57.0, 62.0, 66.0, 46.0, 44.0, 50.0, 40.0, 24.0, 27.0, 9.0, 14.0, 15.0, 6.0, 4.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.390625, -2.309539794921875, -2.22845458984375, -2.147369384765625, -2.0662841796875, -1.985198974609375, -1.90411376953125, -1.823028564453125, -1.741943359375, -1.660858154296875, -1.57977294921875, -1.498687744140625, -1.4176025390625, -1.336517333984375, -1.25543212890625, -1.174346923828125, -1.09326171875, -1.012176513671875, -0.93109130859375, -0.850006103515625, -0.7689208984375, -0.687835693359375, -0.60675048828125, -0.525665283203125, -0.444580078125, -0.363494873046875, -0.28240966796875, -0.201324462890625, -0.1202392578125, -0.039154052734375, 0.04193115234375, 0.123016357421875, 0.2041015625, 0.285186767578125, 0.36627197265625, 0.447357177734375, 0.5284423828125, 0.609527587890625, 0.69061279296875, 0.771697998046875, 0.852783203125, 0.933868408203125, 1.01495361328125, 1.096038818359375, 1.1771240234375, 1.258209228515625, 1.33929443359375, 1.420379638671875, 1.50146484375, 1.582550048828125, 1.66363525390625, 1.744720458984375, 1.8258056640625, 1.906890869140625, 1.98797607421875, 2.069061279296875, 2.150146484375, 2.231231689453125, 2.31231689453125, 2.393402099609375, 2.4744873046875, 2.555572509765625, 2.63665771484375, 2.717742919921875, 2.798828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 8.0, 13.0, 16.0, 13.0, 26.0, 42.0, 82.0, 107.0, 170.0, 278.0, 439.0, 740.0, 1224.0, 2252.0, 4085.0, 7735.0, 16924.0, 40053.0, 113493.0, 419286.0, 2838692.0, 527776.0, 134266.0, 46969.0, 19549.0, 9013.0, 4648.0, 2541.0, 1443.0, 875.0, 555.0, 349.0, 195.0, 133.0, 89.0, 55.0, 39.0, 27.0, 25.0, 13.0, 9.0, 11.0, 7.0, 6.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.828125, -18.283447265625, -17.73876953125, -17.194091796875, -16.6494140625, -16.104736328125, -15.56005859375, -15.015380859375, -14.470703125, -13.926025390625, -13.38134765625, -12.836669921875, -12.2919921875, -11.747314453125, -11.20263671875, -10.657958984375, -10.11328125, -9.568603515625, -9.02392578125, -8.479248046875, -7.9345703125, -7.389892578125, -6.84521484375, -6.300537109375, -5.755859375, -5.211181640625, -4.66650390625, -4.121826171875, -3.5771484375, -3.032470703125, -2.48779296875, -1.943115234375, -1.3984375, -0.853759765625, -0.30908203125, 0.235595703125, 0.7802734375, 1.324951171875, 1.86962890625, 2.414306640625, 2.958984375, 3.503662109375, 4.04833984375, 4.593017578125, 5.1376953125, 5.682373046875, 6.22705078125, 6.771728515625, 7.31640625, 7.861083984375, 8.40576171875, 8.950439453125, 9.4951171875, 10.039794921875, 10.58447265625, 11.129150390625, 11.673828125, 12.218505859375, 12.76318359375, 13.307861328125, 13.8525390625, 14.397216796875, 14.94189453125, 15.486572265625, 16.03125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 10.0, 8.0, 9.0, 20.0, 19.0, 30.0, 40.0, 63.0, 97.0, 112.0, 178.0, 305.0, 767.0, 1257.0, 399.0, 225.0, 142.0, 104.0, 66.0, 56.0, 38.0, 24.0, 19.0, 22.0, 9.0, 9.0, 7.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.390625, -5.21746826171875, -5.0443115234375, -4.87115478515625, -4.697998046875, -4.52484130859375, -4.3516845703125, -4.17852783203125, -4.00537109375, -3.83221435546875, -3.6590576171875, -3.48590087890625, -3.312744140625, -3.13958740234375, -2.9664306640625, -2.79327392578125, -2.6201171875, -2.44696044921875, -2.2738037109375, -2.10064697265625, -1.927490234375, -1.75433349609375, -1.5811767578125, -1.40802001953125, -1.23486328125, -1.06170654296875, -0.8885498046875, -0.71539306640625, -0.542236328125, -0.36907958984375, -0.1959228515625, -0.02276611328125, 0.150390625, 0.32354736328125, 0.4967041015625, 0.66986083984375, 0.843017578125, 1.01617431640625, 1.1893310546875, 1.36248779296875, 1.53564453125, 1.70880126953125, 1.8819580078125, 2.05511474609375, 2.228271484375, 2.40142822265625, 2.5745849609375, 2.74774169921875, 2.9208984375, 3.09405517578125, 3.2672119140625, 3.44036865234375, 3.613525390625, 3.78668212890625, 3.9598388671875, 4.13299560546875, 4.30615234375, 4.47930908203125, 4.6524658203125, 4.82562255859375, 4.998779296875, 5.17193603515625, 5.3450927734375, 5.51824951171875, 5.69140625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 18.0, 34.0, 42.0, 66.0, 119.0, 132.0, 125.0, 175.0, 104.0, 69.0, 45.0, 28.0, 14.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.661224365234375, -53.9853401184082, -52.30945587158203, -50.633575439453125, -48.95769119262695, -47.28180694580078, -45.60592269897461, -43.93003845214844, -42.25415802001953, -40.57827377319336, -38.90238952636719, -37.22650909423828, -35.55062484741211, -33.87474060058594, -32.198856353759766, -30.522974014282227, -28.847089767456055, -27.171205520629883, -25.495323181152344, -23.819438934326172, -22.143556594848633, -20.46767234802246, -18.791790008544922, -17.11590576171875, -15.440022468566895, -13.764139175415039, -12.088255882263184, -10.412372589111328, -8.736488342285156, -7.060605049133301, -5.384721755981445, -3.70883846282959, -2.0329551696777344, -0.35707175731658936, 1.3188116550445557, 2.9946951866149902, 4.670578479766846, 6.346462249755859, 8.022345542907715, 9.69822883605957, 11.374112129211426, 13.049995422363281, 14.725878715515137, 16.401762008666992, 18.077646255493164, 19.753528594970703, 21.429412841796875, 23.105297088623047, 24.781179428100586, 26.457063674926758, 28.132946014404297, 29.80883026123047, 31.484712600708008, 33.16059875488281, 34.83647918701172, 36.51236343383789, 38.18824768066406, 39.864131927490234, 41.540016174316406, 43.21589660644531, 44.891780853271484, 46.567665100097656, 48.24354934692383, 49.91943359375, 51.595314025878906]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 11.0, 5.0, 3.0, 5.0, 9.0, 12.0, 12.0, 9.0, 29.0, 28.0, 28.0, 26.0, 37.0, 29.0, 57.0, 36.0, 35.0, 35.0, 46.0, 52.0, 51.0, 45.0, 40.0, 37.0, 54.0, 38.0, 29.0, 26.0, 32.0, 24.0, 23.0, 26.0, 15.0, 13.0, 14.0, 6.0, 6.0, 4.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.908897399902344, -19.228694915771484, -18.548490524291992, -17.868288040161133, -17.18808364868164, -16.50788116455078, -15.827676773071289, -15.14747428894043, -14.467269897460938, -13.787066459655762, -13.106863021850586, -12.42665958404541, -11.746456146240234, -11.066252708435059, -10.386049270629883, -9.705846786499023, -9.025643348693848, -8.345439910888672, -7.665236473083496, -6.98503303527832, -6.3048295974731445, -5.624626159667969, -4.944423198699951, -4.264219760894775, -3.5840163230895996, -2.903812885284424, -2.223609447479248, -1.5434062480926514, -0.8632028102874756, -0.1829993724822998, 0.4972038269042969, 1.1774072647094727, 1.8576107025146484, 2.537814140319824, 3.218017578125, 3.8982207775115967, 4.578424453735352, 5.258627891540527, 5.938830852508545, 6.619034290313721, 7.2992377281188965, 7.979441165924072, 8.65964412689209, 9.339847564697266, 10.020051002502441, 10.700254440307617, 11.380457878112793, 12.060661315917969, 12.740864753723145, 13.42106819152832, 14.101271629333496, 14.781475067138672, 15.461678504943848, 16.141881942749023, 16.822084426879883, 17.502288818359375, 18.182491302490234, 18.862693786621094, 19.542898178100586, 20.223100662231445, 20.903305053710938, 21.583507537841797, 22.26371192932129, 22.94391441345215, 23.62411880493164]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 26.0, 30.0, 43.0, 72.0, 116.0, 257.0, 461.0, 925.0, 1835.0, 4292.0, 9609.0, 24647.0, 63961.0, 162715.0, 315785.0, 267359.0, 119378.0, 46058.0, 17642.0, 7184.0, 3045.0, 1495.0, 770.0, 366.0, 203.0, 108.0, 64.0, 36.0, 23.0, 13.0, 9.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.8984375, -14.4580078125, -14.017578125, -13.5771484375, -13.13671875, -12.6962890625, -12.255859375, -11.8154296875, -11.375, -10.9345703125, -10.494140625, -10.0537109375, -9.61328125, -9.1728515625, -8.732421875, -8.2919921875, -7.8515625, -7.4111328125, -6.970703125, -6.5302734375, -6.08984375, -5.6494140625, -5.208984375, -4.7685546875, -4.328125, -3.8876953125, -3.447265625, -3.0068359375, -2.56640625, -2.1259765625, -1.685546875, -1.2451171875, -0.8046875, -0.3642578125, 0.076171875, 0.5166015625, 0.95703125, 1.3974609375, 1.837890625, 2.2783203125, 2.71875, 3.1591796875, 3.599609375, 4.0400390625, 4.48046875, 4.9208984375, 5.361328125, 5.8017578125, 6.2421875, 6.6826171875, 7.123046875, 7.5634765625, 8.00390625, 8.4443359375, 8.884765625, 9.3251953125, 9.765625, 10.2060546875, 10.646484375, 11.0869140625, 11.52734375, 11.9677734375, 12.408203125, 12.8486328125, 13.2890625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 1.0, 9.0, 5.0, 2.0, 13.0, 7.0, 21.0, 17.0, 20.0, 23.0, 41.0, 38.0, 36.0, 38.0, 42.0, 42.0, 47.0, 62.0, 57.0, 44.0, 62.0, 58.0, 44.0, 29.0, 32.0, 38.0, 29.0, 25.0, 25.0, 20.0, 16.0, 12.0, 9.0, 5.0, 10.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.162109375, -2.091339111328125, -2.02056884765625, -1.949798583984375, -1.8790283203125, -1.808258056640625, -1.73748779296875, -1.666717529296875, -1.595947265625, -1.525177001953125, -1.45440673828125, -1.383636474609375, -1.3128662109375, -1.242095947265625, -1.17132568359375, -1.100555419921875, -1.02978515625, -0.959014892578125, -0.88824462890625, -0.817474365234375, -0.7467041015625, -0.675933837890625, -0.60516357421875, -0.534393310546875, -0.463623046875, -0.392852783203125, -0.32208251953125, -0.251312255859375, -0.1805419921875, -0.109771728515625, -0.03900146484375, 0.031768798828125, 0.1025390625, 0.173309326171875, 0.24407958984375, 0.314849853515625, 0.3856201171875, 0.456390380859375, 0.52716064453125, 0.597930908203125, 0.668701171875, 0.739471435546875, 0.81024169921875, 0.881011962890625, 0.9517822265625, 1.022552490234375, 1.09332275390625, 1.164093017578125, 1.23486328125, 1.305633544921875, 1.37640380859375, 1.447174072265625, 1.5179443359375, 1.588714599609375, 1.65948486328125, 1.730255126953125, 1.801025390625, 1.871795654296875, 1.94256591796875, 2.013336181640625, 2.0841064453125, 2.154876708984375, 2.22564697265625, 2.296417236328125, 2.3671875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 9.0, 18.0, 18.0, 31.0, 54.0, 85.0, 107.0, 190.0, 297.0, 457.0, 799.0, 1414.0, 2571.0, 5031.0, 11144.0, 24637.0, 59792.0, 142180.0, 289654.0, 277916.0, 132978.0, 55606.0, 23001.0, 10043.0, 4844.0, 2365.0, 1317.0, 774.0, 454.0, 278.0, 157.0, 98.0, 74.0, 47.0, 37.0, 23.0, 13.0, 15.0, 9.0, 3.0, 1.0, 5.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.6484375, -14.2039794921875, -13.759521484375, -13.3150634765625, -12.87060546875, -12.4261474609375, -11.981689453125, -11.5372314453125, -11.0927734375, -10.6483154296875, -10.203857421875, -9.7593994140625, -9.31494140625, -8.8704833984375, -8.426025390625, -7.9815673828125, -7.537109375, -7.0926513671875, -6.648193359375, -6.2037353515625, -5.75927734375, -5.3148193359375, -4.870361328125, -4.4259033203125, -3.9814453125, -3.5369873046875, -3.092529296875, -2.6480712890625, -2.20361328125, -1.7591552734375, -1.314697265625, -0.8702392578125, -0.42578125, 0.0186767578125, 0.463134765625, 0.9075927734375, 1.35205078125, 1.7965087890625, 2.240966796875, 2.6854248046875, 3.1298828125, 3.5743408203125, 4.018798828125, 4.4632568359375, 4.90771484375, 5.3521728515625, 5.796630859375, 6.2410888671875, 6.685546875, 7.1300048828125, 7.574462890625, 8.0189208984375, 8.46337890625, 8.9078369140625, 9.352294921875, 9.7967529296875, 10.2412109375, 10.6856689453125, 11.130126953125, 11.5745849609375, 12.01904296875, 12.4635009765625, 12.907958984375, 13.3524169921875, 13.796875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 10.0, 8.0, 7.0, 14.0, 18.0, 22.0, 27.0, 18.0, 32.0, 31.0, 35.0, 40.0, 36.0, 40.0, 52.0, 40.0, 45.0, 40.0, 45.0, 32.0, 42.0, 31.0, 46.0, 37.0, 31.0, 31.0, 33.0, 22.0, 24.0, 21.0, 8.0, 13.0, 14.0, 12.0, 5.0, 7.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6875, -11.30322265625, -10.9189453125, -10.53466796875, -10.150390625, -9.76611328125, -9.3818359375, -8.99755859375, -8.61328125, -8.22900390625, -7.8447265625, -7.46044921875, -7.076171875, -6.69189453125, -6.3076171875, -5.92333984375, -5.5390625, -5.15478515625, -4.7705078125, -4.38623046875, -4.001953125, -3.61767578125, -3.2333984375, -2.84912109375, -2.46484375, -2.08056640625, -1.6962890625, -1.31201171875, -0.927734375, -0.54345703125, -0.1591796875, 0.22509765625, 0.609375, 0.99365234375, 1.3779296875, 1.76220703125, 2.146484375, 2.53076171875, 2.9150390625, 3.29931640625, 3.68359375, 4.06787109375, 4.4521484375, 4.83642578125, 5.220703125, 5.60498046875, 5.9892578125, 6.37353515625, 6.7578125, 7.14208984375, 7.5263671875, 7.91064453125, 8.294921875, 8.67919921875, 9.0634765625, 9.44775390625, 9.83203125, 10.21630859375, 10.6005859375, 10.98486328125, 11.369140625, 11.75341796875, 12.1376953125, 12.52197265625, 12.90625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 4.0, 12.0, 10.0, 22.0, 20.0, 33.0, 32.0, 61.0, 72.0, 105.0, 167.0, 275.0, 393.0, 689.0, 1223.0, 2217.0, 4261.0, 9038.0, 20786.0, 56581.0, 185108.0, 434892.0, 221172.0, 67129.0, 23685.0, 9980.0, 4736.0, 2441.0, 1312.0, 730.0, 484.0, 292.0, 183.0, 108.0, 67.0, 47.0, 44.0, 31.0, 26.0, 21.0, 19.0, 13.0, 4.0, 4.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.765625, -9.4658203125, -9.166015625, -8.8662109375, -8.56640625, -8.2666015625, -7.966796875, -7.6669921875, -7.3671875, -7.0673828125, -6.767578125, -6.4677734375, -6.16796875, -5.8681640625, -5.568359375, -5.2685546875, -4.96875, -4.6689453125, -4.369140625, -4.0693359375, -3.76953125, -3.4697265625, -3.169921875, -2.8701171875, -2.5703125, -2.2705078125, -1.970703125, -1.6708984375, -1.37109375, -1.0712890625, -0.771484375, -0.4716796875, -0.171875, 0.1279296875, 0.427734375, 0.7275390625, 1.02734375, 1.3271484375, 1.626953125, 1.9267578125, 2.2265625, 2.5263671875, 2.826171875, 3.1259765625, 3.42578125, 3.7255859375, 4.025390625, 4.3251953125, 4.625, 4.9248046875, 5.224609375, 5.5244140625, 5.82421875, 6.1240234375, 6.423828125, 6.7236328125, 7.0234375, 7.3232421875, 7.623046875, 7.9228515625, 8.22265625, 8.5224609375, 8.822265625, 9.1220703125, 9.421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 9.0, 8.0, 14.0, 24.0, 24.0, 30.0, 50.0, 61.0, 94.0, 150.0, 140.0, 126.0, 75.0, 51.0, 36.0, 27.0, 14.0, 11.0, 14.0, 7.0, 9.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027599334716796875, -0.00267106294631958, -0.0025821924209594727, -0.0024933218955993652, -0.002404451370239258, -0.0023155808448791504, -0.002226710319519043, -0.0021378397941589355, -0.002048969268798828, -0.0019600987434387207, -0.0018712282180786133, -0.0017823576927185059, -0.0016934871673583984, -0.001604616641998291, -0.0015157461166381836, -0.0014268755912780762, -0.0013380050659179688, -0.0012491345405578613, -0.001160264015197754, -0.0010713934898376465, -0.000982522964477539, -0.0008936524391174316, -0.0008047819137573242, -0.0007159113883972168, -0.0006270408630371094, -0.000538170337677002, -0.00044929981231689453, -0.0003604292869567871, -0.0002715587615966797, -0.00018268823623657227, -9.381771087646484e-05, -4.947185516357422e-06, 8.392333984375e-05, 0.00017279386520385742, 0.00026166439056396484, 0.00035053491592407227, 0.0004394054412841797, 0.0005282759666442871, 0.0006171464920043945, 0.000706017017364502, 0.0007948875427246094, 0.0008837580680847168, 0.0009726285934448242, 0.0010614991188049316, 0.001150369644165039, 0.0012392401695251465, 0.001328110694885254, 0.0014169812202453613, 0.0015058517456054688, 0.0015947222709655762, 0.0016835927963256836, 0.001772463321685791, 0.0018613338470458984, 0.0019502043724060059, 0.0020390748977661133, 0.0021279454231262207, 0.002216815948486328, 0.0023056864738464355, 0.002394556999206543, 0.0024834275245666504, 0.002572298049926758, 0.0026611685752868652, 0.0027500391006469727, 0.00283890962600708, 0.0029277801513671875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 13.0, 11.0, 25.0, 28.0, 36.0, 70.0, 100.0, 125.0, 231.0, 367.0, 568.0, 995.0, 1770.0, 3477.0, 7434.0, 16208.0, 41422.0, 135768.0, 478727.0, 251137.0, 65740.0, 23933.0, 10176.0, 4637.0, 2368.0, 1274.0, 692.0, 412.0, 264.0, 169.0, 106.0, 73.0, 48.0, 44.0, 22.0, 27.0, 12.0, 10.0, 10.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.640625, -11.2615966796875, -10.882568359375, -10.5035400390625, -10.12451171875, -9.7454833984375, -9.366455078125, -8.9874267578125, -8.6083984375, -8.2293701171875, -7.850341796875, -7.4713134765625, -7.09228515625, -6.7132568359375, -6.334228515625, -5.9552001953125, -5.576171875, -5.1971435546875, -4.818115234375, -4.4390869140625, -4.06005859375, -3.6810302734375, -3.302001953125, -2.9229736328125, -2.5439453125, -2.1649169921875, -1.785888671875, -1.4068603515625, -1.02783203125, -0.6488037109375, -0.269775390625, 0.1092529296875, 0.48828125, 0.8673095703125, 1.246337890625, 1.6253662109375, 2.00439453125, 2.3834228515625, 2.762451171875, 3.1414794921875, 3.5205078125, 3.8995361328125, 4.278564453125, 4.6575927734375, 5.03662109375, 5.4156494140625, 5.794677734375, 6.1737060546875, 6.552734375, 6.9317626953125, 7.310791015625, 7.6898193359375, 8.06884765625, 8.4478759765625, 8.826904296875, 9.2059326171875, 9.5849609375, 9.9639892578125, 10.343017578125, 10.7220458984375, 11.10107421875, 11.4801025390625, 11.859130859375, 12.2381591796875, 12.6171875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 2.0, 2.0, 3.0, 5.0, 10.0, 8.0, 10.0, 20.0, 27.0, 29.0, 33.0, 43.0, 63.0, 115.0, 104.0, 120.0, 96.0, 95.0, 49.0, 46.0, 24.0, 20.0, 15.0, 8.0, 15.0, 8.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.796875, -10.448974609375, -10.10107421875, -9.753173828125, -9.4052734375, -9.057373046875, -8.70947265625, -8.361572265625, -8.013671875, -7.665771484375, -7.31787109375, -6.969970703125, -6.6220703125, -6.274169921875, -5.92626953125, -5.578369140625, -5.23046875, -4.882568359375, -4.53466796875, -4.186767578125, -3.8388671875, -3.490966796875, -3.14306640625, -2.795166015625, -2.447265625, -2.099365234375, -1.75146484375, -1.403564453125, -1.0556640625, -0.707763671875, -0.35986328125, -0.011962890625, 0.3359375, 0.683837890625, 1.03173828125, 1.379638671875, 1.7275390625, 2.075439453125, 2.42333984375, 2.771240234375, 3.119140625, 3.467041015625, 3.81494140625, 4.162841796875, 4.5107421875, 4.858642578125, 5.20654296875, 5.554443359375, 5.90234375, 6.250244140625, 6.59814453125, 6.946044921875, 7.2939453125, 7.641845703125, 7.98974609375, 8.337646484375, 8.685546875, 9.033447265625, 9.38134765625, 9.729248046875, 10.0771484375, 10.425048828125, 10.77294921875, 11.120849609375, 11.46875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 6.0, 7.0, 21.0, 31.0, 56.0, 79.0, 106.0, 120.0, 151.0, 123.0, 112.0, 70.0, 50.0, 31.0, 18.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.38300323486328, -92.82000732421875, -88.25701904296875, -83.69402313232422, -79.13102722167969, -74.56803894042969, -70.00504302978516, -65.44204711914062, -60.87905502319336, -56.316062927246094, -51.75306701660156, -47.1900749206543, -42.62708282470703, -38.0640869140625, -33.501094818115234, -28.938100814819336, -24.375106811523438, -19.81211280822754, -15.249119758605957, -10.686126708984375, -6.123132705688477, -1.5601387023925781, 3.0028533935546875, 7.565847396850586, 12.128841400146484, 16.691835403442383, 21.25482940673828, 25.817821502685547, 30.380815505981445, 34.943809509277344, 39.50680160522461, 44.069793701171875, 48.63279724121094, 53.1957893371582, 57.758785247802734, 62.32177734375, 66.88477325439453, 71.44776916503906, 76.01075744628906, 80.5737533569336, 85.13674926757812, 89.69974517822266, 94.26273345947266, 98.82572937011719, 103.38872528076172, 107.95172119140625, 112.51470947265625, 117.07770538330078, 121.64069366455078, 126.20368957519531, 130.7666778564453, 135.32968139648438, 139.89266967773438, 144.45565795898438, 149.01864624023438, 153.58164978027344, 158.14463806152344, 162.70762634277344, 167.2706298828125, 171.8336181640625, 176.3966064453125, 180.95960998535156, 185.52259826660156, 190.08558654785156, 194.64859008789062]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 3.0, 0.0, 4.0, 3.0, 12.0, 8.0, 10.0, 13.0, 16.0, 20.0, 27.0, 42.0, 48.0, 31.0, 43.0, 45.0, 56.0, 51.0, 55.0, 50.0, 54.0, 53.0, 56.0, 47.0, 43.0, 37.0, 39.0, 19.0, 26.0, 23.0, 13.0, 11.0, 11.0, 7.0, 6.0, 10.0, 2.0, 8.0, 7.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.67121887207031, -68.75943756103516, -65.84766387939453, -62.935882568359375, -60.024105072021484, -57.112327575683594, -54.20054626464844, -51.28876876831055, -48.376991271972656, -45.465213775634766, -42.553436279296875, -39.64165496826172, -36.72987747192383, -33.81809997558594, -30.906320571899414, -27.99454116821289, -25.082763671875, -22.17098617553711, -19.259206771850586, -16.347427368164062, -13.435649871826172, -10.523871421813965, -7.612092971801758, -4.700313568115234, -1.7885360717773438, 1.1232423782348633, 4.03502082824707, 6.946799278259277, 9.858577728271484, 12.770356178283691, 15.682134628295898, 18.593914031982422, 21.50568389892578, 24.417461395263672, 27.329240798950195, 30.24102020263672, 33.15279769897461, 36.0645751953125, 38.976356506347656, 41.88813400268555, 44.79991149902344, 47.71168899536133, 50.62346649169922, 53.535247802734375, 56.447025299072266, 59.358802795410156, 62.27058410644531, 65.18235778808594, 68.0941390991211, 71.00592041015625, 73.91769409179688, 76.82947540283203, 79.74125671386719, 82.65303039550781, 85.56481170654297, 88.47659301757812, 91.38836669921875, 94.3001480102539, 97.21192169189453, 100.12370300292969, 103.03547668457031, 105.94725799560547, 108.85903930664062, 111.77081298828125, 114.6825942993164]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 9.0, 11.0, 14.0, 25.0, 37.0, 111.0, 210.0, 537.0, 1372.0, 4244.0, 16696.0, 105932.0, 3849198.0, 183662.0, 23444.0, 5670.0, 1867.0, 647.0, 280.0, 116.0, 77.0, 31.0, 28.0, 25.0, 12.0, 8.0, 9.0, 0.0, 7.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.4375, -19.39501953125, -18.3525390625, -17.31005859375, -16.267578125, -15.22509765625, -14.1826171875, -13.14013671875, -12.09765625, -11.05517578125, -10.0126953125, -8.97021484375, -7.927734375, -6.88525390625, -5.8427734375, -4.80029296875, -3.7578125, -2.71533203125, -1.6728515625, -0.63037109375, 0.412109375, 1.45458984375, 2.4970703125, 3.53955078125, 4.58203125, 5.62451171875, 6.6669921875, 7.70947265625, 8.751953125, 9.79443359375, 10.8369140625, 11.87939453125, 12.921875, 13.96435546875, 15.0068359375, 16.04931640625, 17.091796875, 18.13427734375, 19.1767578125, 20.21923828125, 21.26171875, 22.30419921875, 23.3466796875, 24.38916015625, 25.431640625, 26.47412109375, 27.5166015625, 28.55908203125, 29.6015625, 30.64404296875, 31.6865234375, 32.72900390625, 33.771484375, 34.81396484375, 35.8564453125, 36.89892578125, 37.94140625, 38.98388671875, 40.0263671875, 41.06884765625, 42.111328125, 43.15380859375, 44.1962890625, 45.23876953125, 46.28125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 1.0, 9.0, 18.0, 10.0, 18.0, 14.0, 22.0, 29.0, 45.0, 50.0, 78.0, 61.0, 68.0, 56.0, 75.0, 53.0, 62.0, 53.0, 62.0, 34.0, 40.0, 32.0, 21.0, 28.0, 18.0, 13.0, 4.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.01751708984375, -1.9178466796875, -1.81817626953125, -1.718505859375, -1.61883544921875, -1.5191650390625, -1.41949462890625, -1.31982421875, -1.22015380859375, -1.1204833984375, -1.02081298828125, -0.921142578125, -0.82147216796875, -0.7218017578125, -0.62213134765625, -0.5224609375, -0.42279052734375, -0.3231201171875, -0.22344970703125, -0.123779296875, -0.02410888671875, 0.0755615234375, 0.17523193359375, 0.27490234375, 0.37457275390625, 0.4742431640625, 0.57391357421875, 0.673583984375, 0.77325439453125, 0.8729248046875, 0.97259521484375, 1.072265625, 1.17193603515625, 1.2716064453125, 1.37127685546875, 1.470947265625, 1.57061767578125, 1.6702880859375, 1.76995849609375, 1.86962890625, 1.96929931640625, 2.0689697265625, 2.16864013671875, 2.268310546875, 2.36798095703125, 2.4676513671875, 2.56732177734375, 2.6669921875, 2.76666259765625, 2.8663330078125, 2.96600341796875, 3.065673828125, 3.16534423828125, 3.2650146484375, 3.36468505859375, 3.46435546875, 3.56402587890625, 3.6636962890625, 3.76336669921875, 3.863037109375, 3.96270751953125, 4.0623779296875, 4.16204833984375, 4.26171875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 8.0, 11.0, 13.0, 28.0, 34.0, 52.0, 61.0, 96.0, 169.0, 266.0, 505.0, 858.0, 1800.0, 3854.0, 9124.0, 24787.0, 83885.0, 466710.0, 3273951.0, 241555.0, 54833.0, 17875.0, 7165.0, 3067.0, 1499.0, 792.0, 471.0, 300.0, 183.0, 112.0, 79.0, 43.0, 35.0, 16.0, 14.0, 6.0, 11.0, 2.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0], "bins": [-25.640625, -24.971923828125, -24.30322265625, -23.634521484375, -22.9658203125, -22.297119140625, -21.62841796875, -20.959716796875, -20.291015625, -19.622314453125, -18.95361328125, -18.284912109375, -17.6162109375, -16.947509765625, -16.27880859375, -15.610107421875, -14.94140625, -14.272705078125, -13.60400390625, -12.935302734375, -12.2666015625, -11.597900390625, -10.92919921875, -10.260498046875, -9.591796875, -8.923095703125, -8.25439453125, -7.585693359375, -6.9169921875, -6.248291015625, -5.57958984375, -4.910888671875, -4.2421875, -3.573486328125, -2.90478515625, -2.236083984375, -1.5673828125, -0.898681640625, -0.22998046875, 0.438720703125, 1.107421875, 1.776123046875, 2.44482421875, 3.113525390625, 3.7822265625, 4.450927734375, 5.11962890625, 5.788330078125, 6.45703125, 7.125732421875, 7.79443359375, 8.463134765625, 9.1318359375, 9.800537109375, 10.46923828125, 11.137939453125, 11.806640625, 12.475341796875, 13.14404296875, 13.812744140625, 14.4814453125, 15.150146484375, 15.81884765625, 16.487548828125, 17.15625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 8.0, 7.0, 13.0, 14.0, 14.0, 38.0, 52.0, 74.0, 143.0, 218.0, 491.0, 1956.0, 507.0, 199.0, 113.0, 72.0, 42.0, 32.0, 16.0, 13.0, 13.0, 14.0, 5.0, 10.0, 0.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-8.6171875, -8.38739013671875, -8.1575927734375, -7.92779541015625, -7.697998046875, -7.46820068359375, -7.2384033203125, -7.00860595703125, -6.77880859375, -6.54901123046875, -6.3192138671875, -6.08941650390625, -5.859619140625, -5.62982177734375, -5.4000244140625, -5.17022705078125, -4.9404296875, -4.71063232421875, -4.4808349609375, -4.25103759765625, -4.021240234375, -3.79144287109375, -3.5616455078125, -3.33184814453125, -3.10205078125, -2.87225341796875, -2.6424560546875, -2.41265869140625, -2.182861328125, -1.95306396484375, -1.7232666015625, -1.49346923828125, -1.263671875, -1.03387451171875, -0.8040771484375, -0.57427978515625, -0.344482421875, -0.11468505859375, 0.1151123046875, 0.34490966796875, 0.57470703125, 0.80450439453125, 1.0343017578125, 1.26409912109375, 1.493896484375, 1.72369384765625, 1.9534912109375, 2.18328857421875, 2.4130859375, 2.64288330078125, 2.8726806640625, 3.10247802734375, 3.332275390625, 3.56207275390625, 3.7918701171875, 4.02166748046875, 4.25146484375, 4.48126220703125, 4.7110595703125, 4.94085693359375, 5.170654296875, 5.40045166015625, 5.6302490234375, 5.86004638671875, 6.08984375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 19.0, 99.0, 236.0, 336.0, 203.0, 81.0, 23.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-175.80752563476562, -172.45155334472656, -169.09559631347656, -165.7396240234375, -162.3836669921875, -159.02769470214844, -155.67172241210938, -152.31576538085938, -148.9597930908203, -145.60382080078125, -142.24786376953125, -138.8918914794922, -135.53591918945312, -132.17996215820312, -128.82398986816406, -125.46802520751953, -122.112060546875, -118.75609588623047, -115.40013122558594, -112.04415893554688, -108.68819427490234, -105.33222961425781, -101.97625732421875, -98.62029266357422, -95.26432800292969, -91.90836334228516, -88.55239868164062, -85.19642639160156, -81.84046173095703, -78.4844970703125, -75.12852478027344, -71.7725601196289, -68.41658782958984, -65.06062316894531, -61.704654693603516, -58.34868621826172, -54.99272155761719, -51.636756896972656, -48.28078842163086, -44.92481994628906, -41.56885528564453, -38.212890625, -34.8569221496582, -31.50095558166504, -28.144989013671875, -24.78902244567871, -21.433055877685547, -18.077089309692383, -14.721122741699219, -11.365156173706055, -8.00918960571289, -4.653223037719727, -1.2972564697265625, 2.0587100982666016, 5.414676666259766, 8.77064323425293, 12.126609802246094, 15.482576370239258, 18.838542938232422, 22.194509506225586, 25.55047607421875, 28.906442642211914, 32.26240921020508, 35.618377685546875, 38.974342346191406]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 8.0, 10.0, 10.0, 16.0, 26.0, 26.0, 36.0, 27.0, 52.0, 34.0, 49.0, 60.0, 58.0, 59.0, 56.0, 72.0, 59.0, 51.0, 60.0, 40.0, 34.0, 38.0, 28.0, 21.0, 26.0, 13.0, 11.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.22268295288086, -26.33050537109375, -25.43832778930664, -24.546152114868164, -23.653974533081055, -22.761796951293945, -21.86962127685547, -20.97744369506836, -20.08526611328125, -19.19308853149414, -18.30091094970703, -17.408735275268555, -16.516557693481445, -15.624380111694336, -14.732203483581543, -13.84002685546875, -12.94784927368164, -12.055671691894531, -11.163495063781738, -10.271318435668945, -9.379140853881836, -8.486963272094727, -7.594786643981934, -6.702609539031982, -5.810432434082031, -4.91825532913208, -4.026078224182129, -3.1339011192321777, -2.2417240142822266, -1.3495469093322754, -0.4573698043823242, 0.43480730056762695, 1.326986312866211, 2.219163417816162, 3.1113405227661133, 4.0035176277160645, 4.895694732666016, 5.787871837615967, 6.680048942565918, 7.572226047515869, 8.46440315246582, 9.35658073425293, 10.248757362365723, 11.140933990478516, 12.033111572265625, 12.925289154052734, 13.817465782165527, 14.70964241027832, 15.60181999206543, 16.49399757385254, 17.386173248291016, 18.278350830078125, 19.170528411865234, 20.062705993652344, 20.954883575439453, 21.84705924987793, 22.73923683166504, 23.63141441345215, 24.523590087890625, 25.415767669677734, 26.307945251464844, 27.200122833251953, 28.092300415039062, 28.98447608947754, 29.87665367126465]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 7.0, 6.0, 14.0, 12.0, 17.0, 28.0, 41.0, 67.0, 90.0, 125.0, 197.0, 281.0, 448.0, 739.0, 1126.0, 1949.0, 3263.0, 5886.0, 10637.0, 20026.0, 39120.0, 75308.0, 138131.0, 220089.0, 223712.0, 142359.0, 77756.0, 40372.0, 21138.0, 10983.0, 5922.0, 3383.0, 1970.0, 1234.0, 731.0, 472.0, 287.0, 219.0, 140.0, 83.0, 66.0, 41.0, 24.0, 15.0, 18.0, 7.0, 8.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-10.625, -10.312744140625, -10.00048828125, -9.688232421875, -9.3759765625, -9.063720703125, -8.75146484375, -8.439208984375, -8.126953125, -7.814697265625, -7.50244140625, -7.190185546875, -6.8779296875, -6.565673828125, -6.25341796875, -5.941162109375, -5.62890625, -5.316650390625, -5.00439453125, -4.692138671875, -4.3798828125, -4.067626953125, -3.75537109375, -3.443115234375, -3.130859375, -2.818603515625, -2.50634765625, -2.194091796875, -1.8818359375, -1.569580078125, -1.25732421875, -0.945068359375, -0.6328125, -0.320556640625, -0.00830078125, 0.303955078125, 0.6162109375, 0.928466796875, 1.24072265625, 1.552978515625, 1.865234375, 2.177490234375, 2.48974609375, 2.802001953125, 3.1142578125, 3.426513671875, 3.73876953125, 4.051025390625, 4.36328125, 4.675537109375, 4.98779296875, 5.300048828125, 5.6123046875, 5.924560546875, 6.23681640625, 6.549072265625, 6.861328125, 7.173583984375, 7.48583984375, 7.798095703125, 8.1103515625, 8.422607421875, 8.73486328125, 9.047119140625, 9.359375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 13.0, 11.0, 10.0, 8.0, 16.0, 12.0, 13.0, 26.0, 23.0, 34.0, 56.0, 49.0, 61.0, 40.0, 62.0, 50.0, 43.0, 48.0, 46.0, 46.0, 41.0, 46.0, 47.0, 29.0, 31.0, 23.0, 24.0, 11.0, 25.0, 11.0, 8.0, 4.0, 7.0, 6.0, 3.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3515625, -2.2694091796875, -2.187255859375, -2.1051025390625, -2.02294921875, -1.9407958984375, -1.858642578125, -1.7764892578125, -1.6943359375, -1.6121826171875, -1.530029296875, -1.4478759765625, -1.36572265625, -1.2835693359375, -1.201416015625, -1.1192626953125, -1.037109375, -0.9549560546875, -0.872802734375, -0.7906494140625, -0.70849609375, -0.6263427734375, -0.544189453125, -0.4620361328125, -0.3798828125, -0.2977294921875, -0.215576171875, -0.1334228515625, -0.05126953125, 0.0308837890625, 0.113037109375, 0.1951904296875, 0.27734375, 0.3594970703125, 0.441650390625, 0.5238037109375, 0.60595703125, 0.6881103515625, 0.770263671875, 0.8524169921875, 0.9345703125, 1.0167236328125, 1.098876953125, 1.1810302734375, 1.26318359375, 1.3453369140625, 1.427490234375, 1.5096435546875, 1.591796875, 1.6739501953125, 1.756103515625, 1.8382568359375, 1.92041015625, 2.0025634765625, 2.084716796875, 2.1668701171875, 2.2490234375, 2.3311767578125, 2.413330078125, 2.4954833984375, 2.57763671875, 2.6597900390625, 2.741943359375, 2.8240966796875, 2.90625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 5.0, 5.0, 11.0, 13.0, 23.0, 44.0, 50.0, 82.0, 120.0, 173.0, 311.0, 455.0, 762.0, 1457.0, 2792.0, 5680.0, 12820.0, 30683.0, 76469.0, 183724.0, 325850.0, 232504.0, 101763.0, 40869.0, 16912.0, 7379.0, 3461.0, 1770.0, 946.0, 517.0, 333.0, 195.0, 119.0, 89.0, 52.0, 30.0, 28.0, 14.0, 14.0, 7.0, 9.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-14.625, -14.2030029296875, -13.781005859375, -13.3590087890625, -12.93701171875, -12.5150146484375, -12.093017578125, -11.6710205078125, -11.2490234375, -10.8270263671875, -10.405029296875, -9.9830322265625, -9.56103515625, -9.1390380859375, -8.717041015625, -8.2950439453125, -7.873046875, -7.4510498046875, -7.029052734375, -6.6070556640625, -6.18505859375, -5.7630615234375, -5.341064453125, -4.9190673828125, -4.4970703125, -4.0750732421875, -3.653076171875, -3.2310791015625, -2.80908203125, -2.3870849609375, -1.965087890625, -1.5430908203125, -1.12109375, -0.6990966796875, -0.277099609375, 0.1448974609375, 0.56689453125, 0.9888916015625, 1.410888671875, 1.8328857421875, 2.2548828125, 2.6768798828125, 3.098876953125, 3.5208740234375, 3.94287109375, 4.3648681640625, 4.786865234375, 5.2088623046875, 5.630859375, 6.0528564453125, 6.474853515625, 6.8968505859375, 7.31884765625, 7.7408447265625, 8.162841796875, 8.5848388671875, 9.0068359375, 9.4288330078125, 9.850830078125, 10.2728271484375, 10.69482421875, 11.1168212890625, 11.538818359375, 11.9608154296875, 12.3828125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 6.0, 10.0, 7.0, 12.0, 9.0, 26.0, 11.0, 20.0, 25.0, 19.0, 30.0, 36.0, 24.0, 38.0, 48.0, 35.0, 45.0, 39.0, 40.0, 41.0, 46.0, 45.0, 37.0, 32.0, 32.0, 42.0, 33.0, 33.0, 22.0, 27.0, 27.0, 12.0, 11.0, 11.0, 10.0, 10.0, 16.0, 6.0, 5.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.6953125, -10.341064453125, -9.98681640625, -9.632568359375, -9.2783203125, -8.924072265625, -8.56982421875, -8.215576171875, -7.861328125, -7.507080078125, -7.15283203125, -6.798583984375, -6.4443359375, -6.090087890625, -5.73583984375, -5.381591796875, -5.02734375, -4.673095703125, -4.31884765625, -3.964599609375, -3.6103515625, -3.256103515625, -2.90185546875, -2.547607421875, -2.193359375, -1.839111328125, -1.48486328125, -1.130615234375, -0.7763671875, -0.422119140625, -0.06787109375, 0.286376953125, 0.640625, 0.994873046875, 1.34912109375, 1.703369140625, 2.0576171875, 2.411865234375, 2.76611328125, 3.120361328125, 3.474609375, 3.828857421875, 4.18310546875, 4.537353515625, 4.8916015625, 5.245849609375, 5.60009765625, 5.954345703125, 6.30859375, 6.662841796875, 7.01708984375, 7.371337890625, 7.7255859375, 8.079833984375, 8.43408203125, 8.788330078125, 9.142578125, 9.496826171875, 9.85107421875, 10.205322265625, 10.5595703125, 10.913818359375, 11.26806640625, 11.622314453125, 11.9765625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 13.0, 11.0, 29.0, 36.0, 106.0, 213.0, 565.0, 1609.0, 5390.0, 24394.0, 168229.0, 697901.0, 123894.0, 19492.0, 4447.0, 1348.0, 504.0, 196.0, 81.0, 36.0, 21.0, 13.0, 5.0, 6.0, 5.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.359375, -20.720458984375, -20.08154296875, -19.442626953125, -18.8037109375, -18.164794921875, -17.52587890625, -16.886962890625, -16.248046875, -15.609130859375, -14.97021484375, -14.331298828125, -13.6923828125, -13.053466796875, -12.41455078125, -11.775634765625, -11.13671875, -10.497802734375, -9.85888671875, -9.219970703125, -8.5810546875, -7.942138671875, -7.30322265625, -6.664306640625, -6.025390625, -5.386474609375, -4.74755859375, -4.108642578125, -3.4697265625, -2.830810546875, -2.19189453125, -1.552978515625, -0.9140625, -0.275146484375, 0.36376953125, 1.002685546875, 1.6416015625, 2.280517578125, 2.91943359375, 3.558349609375, 4.197265625, 4.836181640625, 5.47509765625, 6.114013671875, 6.7529296875, 7.391845703125, 8.03076171875, 8.669677734375, 9.30859375, 9.947509765625, 10.58642578125, 11.225341796875, 11.8642578125, 12.503173828125, 13.14208984375, 13.781005859375, 14.419921875, 15.058837890625, 15.69775390625, 16.336669921875, 16.9755859375, 17.614501953125, 18.25341796875, 18.892333984375, 19.53125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 8.0, 7.0, 9.0, 15.0, 10.0, 22.0, 24.0, 22.0, 50.0, 68.0, 95.0, 130.0, 134.0, 118.0, 55.0, 53.0, 37.0, 19.0, 32.0, 17.0, 16.0, 10.0, 14.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002506256103515625, -0.002411186695098877, -0.002316117286682129, -0.002221047878265381, -0.002125978469848633, -0.0020309090614318848, -0.0019358396530151367, -0.0018407702445983887, -0.0017457008361816406, -0.0016506314277648926, -0.0015555620193481445, -0.0014604926109313965, -0.0013654232025146484, -0.0012703537940979004, -0.0011752843856811523, -0.0010802149772644043, -0.0009851455688476562, -0.0008900761604309082, -0.0007950067520141602, -0.0006999373435974121, -0.0006048679351806641, -0.000509798526763916, -0.00041472911834716797, -0.0003196597099304199, -0.00022459030151367188, -0.00012952089309692383, -3.445148468017578e-05, 6.0617923736572266e-05, 0.0001556873321533203, 0.00025075674057006836, 0.0003458261489868164, 0.00044089555740356445, 0.0005359649658203125, 0.0006310343742370605, 0.0007261037826538086, 0.0008211731910705566, 0.0009162425994873047, 0.0010113120079040527, 0.0011063814163208008, 0.0012014508247375488, 0.0012965202331542969, 0.001391589641571045, 0.001486659049987793, 0.001581728458404541, 0.001676797866821289, 0.0017718672752380371, 0.0018669366836547852, 0.001962006092071533, 0.0020570755004882812, 0.0021521449089050293, 0.0022472143173217773, 0.0023422837257385254, 0.0024373531341552734, 0.0025324225425720215, 0.0026274919509887695, 0.0027225613594055176, 0.0028176307678222656, 0.0029127001762390137, 0.0030077695846557617, 0.0031028389930725098, 0.003197908401489258, 0.003292977809906006, 0.003388047218322754, 0.003483116626739502, 0.00357818603515625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 11.0, 11.0, 12.0, 22.0, 24.0, 45.0, 60.0, 111.0, 148.0, 294.0, 460.0, 848.0, 1808.0, 4002.0, 10839.0, 33331.0, 128178.0, 539091.0, 247397.0, 54526.0, 16321.0, 5908.0, 2394.0, 1156.0, 674.0, 328.0, 187.0, 113.0, 93.0, 49.0, 28.0, 26.0, 14.0, 13.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.5234375, -15.0760498046875, -14.628662109375, -14.1812744140625, -13.73388671875, -13.2864990234375, -12.839111328125, -12.3917236328125, -11.9443359375, -11.4969482421875, -11.049560546875, -10.6021728515625, -10.15478515625, -9.7073974609375, -9.260009765625, -8.8126220703125, -8.365234375, -7.9178466796875, -7.470458984375, -7.0230712890625, -6.57568359375, -6.1282958984375, -5.680908203125, -5.2335205078125, -4.7861328125, -4.3387451171875, -3.891357421875, -3.4439697265625, -2.99658203125, -2.5491943359375, -2.101806640625, -1.6544189453125, -1.20703125, -0.7596435546875, -0.312255859375, 0.1351318359375, 0.58251953125, 1.0299072265625, 1.477294921875, 1.9246826171875, 2.3720703125, 2.8194580078125, 3.266845703125, 3.7142333984375, 4.16162109375, 4.6090087890625, 5.056396484375, 5.5037841796875, 5.951171875, 6.3985595703125, 6.845947265625, 7.2933349609375, 7.74072265625, 8.1881103515625, 8.635498046875, 9.0828857421875, 9.5302734375, 9.9776611328125, 10.425048828125, 10.8724365234375, 11.31982421875, 11.7672119140625, 12.214599609375, 12.6619873046875, 13.109375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 5.0, 11.0, 13.0, 9.0, 24.0, 31.0, 40.0, 38.0, 49.0, 69.0, 94.0, 87.0, 85.0, 85.0, 92.0, 56.0, 42.0, 41.0, 29.0, 18.0, 22.0, 10.0, 17.0, 8.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.4140625, -11.0989990234375, -10.783935546875, -10.4688720703125, -10.15380859375, -9.8387451171875, -9.523681640625, -9.2086181640625, -8.8935546875, -8.5784912109375, -8.263427734375, -7.9483642578125, -7.63330078125, -7.3182373046875, -7.003173828125, -6.6881103515625, -6.373046875, -6.0579833984375, -5.742919921875, -5.4278564453125, -5.11279296875, -4.7977294921875, -4.482666015625, -4.1676025390625, -3.8525390625, -3.5374755859375, -3.222412109375, -2.9073486328125, -2.59228515625, -2.2772216796875, -1.962158203125, -1.6470947265625, -1.33203125, -1.0169677734375, -0.701904296875, -0.3868408203125, -0.07177734375, 0.2432861328125, 0.558349609375, 0.8734130859375, 1.1884765625, 1.5035400390625, 1.818603515625, 2.1336669921875, 2.44873046875, 2.7637939453125, 3.078857421875, 3.3939208984375, 3.708984375, 4.0240478515625, 4.339111328125, 4.6541748046875, 4.96923828125, 5.2843017578125, 5.599365234375, 5.9144287109375, 6.2294921875, 6.5445556640625, 6.859619140625, 7.1746826171875, 7.48974609375, 7.8048095703125, 8.119873046875, 8.4349365234375, 8.75]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 15.0, 16.0, 32.0, 55.0, 89.0, 114.0, 120.0, 127.0, 130.0, 100.0, 62.0, 45.0, 29.0, 21.0, 9.0, 13.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.07423400878906, -77.1078109741211, -73.14139556884766, -69.17497253417969, -65.20854949951172, -61.242130279541016, -57.27571105957031, -53.309288024902344, -49.342864990234375, -45.37644577026367, -41.4100227355957, -37.443603515625, -33.47718048095703, -29.510761260986328, -25.544340133666992, -21.577919006347656, -17.611499786376953, -13.645078659057617, -9.678657531738281, -5.712237358093262, -1.7458162307739258, 2.2206039428710938, 6.18702507019043, 10.153446197509766, 14.119867324829102, 18.086288452148438, 22.052709579467773, 26.01913070678711, 29.985549926757812, 33.95197296142578, 37.918392181396484, 41.88481140136719, 45.851234436035156, 49.81765365600586, 53.78407669067383, 57.75049591064453, 61.7169189453125, 65.68333435058594, 69.6497573852539, 73.61618041992188, 77.58260345458984, 81.54902648925781, 85.51544189453125, 89.48186492919922, 93.44828796386719, 97.41470336914062, 101.3811264038086, 105.34754943847656, 109.31396484375, 113.28038787841797, 117.2468032836914, 121.21322631835938, 125.17964935302734, 129.1460723876953, 133.11248779296875, 137.07891845703125, 141.0453338623047, 145.01174926757812, 148.97817993164062, 152.94459533691406, 156.9110107421875, 160.87744140625, 164.84385681152344, 168.81027221679688, 172.77670288085938]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 7.0, 3.0, 4.0, 8.0, 4.0, 11.0, 7.0, 6.0, 14.0, 13.0, 17.0, 14.0, 18.0, 25.0, 24.0, 25.0, 43.0, 23.0, 34.0, 38.0, 36.0, 39.0, 36.0, 41.0, 43.0, 42.0, 47.0, 44.0, 46.0, 35.0, 25.0, 29.0, 27.0, 24.0, 31.0, 24.0, 18.0, 9.0, 12.0, 6.0, 4.0, 17.0, 8.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-57.22677230834961, -55.3734130859375, -53.520050048828125, -51.666690826416016, -49.81332778930664, -47.95996856689453, -46.106605529785156, -44.25324630737305, -42.39988708496094, -40.54652786254883, -38.69316482543945, -36.839805603027344, -34.98644256591797, -33.13308334350586, -31.279722213745117, -29.426361083984375, -27.572999954223633, -25.71963882446289, -23.86627769470215, -22.012916564941406, -20.159557342529297, -18.306196212768555, -16.452835083007812, -14.599474906921387, -12.746113777160645, -10.892752647399902, -9.039392471313477, -7.186031341552734, -5.33267068862915, -3.4793100357055664, -1.6259489059448242, 0.22741127014160156, 2.0807723999023438, 3.9341330528259277, 5.787493705749512, 7.640854835510254, 9.49421501159668, 11.347576141357422, 13.200937271118164, 15.05429744720459, 16.907657623291016, 18.761018753051758, 20.6143798828125, 22.46773910522461, 24.32110023498535, 26.174461364746094, 28.027822494506836, 29.881183624267578, 31.73454475402832, 33.58790588378906, 35.44126510620117, 37.29462814331055, 39.147987365722656, 41.00135040283203, 42.85470962524414, 44.70806884765625, 46.561431884765625, 48.414791107177734, 50.26815414428711, 52.12151336669922, 53.974876403808594, 55.8282356262207, 57.68159484863281, 59.53495788574219, 61.3883171081543]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 9.0, 15.0, 14.0, 20.0, 26.0, 42.0, 62.0, 144.0, 214.0, 539.0, 1267.0, 3401.0, 10565.0, 40396.0, 233463.0, 3555086.0, 283022.0, 46720.0, 12257.0, 4030.0, 1639.0, 642.0, 307.0, 154.0, 92.0, 48.0, 29.0, 13.0, 21.0, 12.0, 8.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.46875, -20.689208984375, -19.90966796875, -19.130126953125, -18.3505859375, -17.571044921875, -16.79150390625, -16.011962890625, -15.232421875, -14.452880859375, -13.67333984375, -12.893798828125, -12.1142578125, -11.334716796875, -10.55517578125, -9.775634765625, -8.99609375, -8.216552734375, -7.43701171875, -6.657470703125, -5.8779296875, -5.098388671875, -4.31884765625, -3.539306640625, -2.759765625, -1.980224609375, -1.20068359375, -0.421142578125, 0.3583984375, 1.137939453125, 1.91748046875, 2.697021484375, 3.4765625, 4.256103515625, 5.03564453125, 5.815185546875, 6.5947265625, 7.374267578125, 8.15380859375, 8.933349609375, 9.712890625, 10.492431640625, 11.27197265625, 12.051513671875, 12.8310546875, 13.610595703125, 14.39013671875, 15.169677734375, 15.94921875, 16.728759765625, 17.50830078125, 18.287841796875, 19.0673828125, 19.846923828125, 20.62646484375, 21.406005859375, 22.185546875, 22.965087890625, 23.74462890625, 24.524169921875, 25.3037109375, 26.083251953125, 26.86279296875, 27.642333984375, 28.421875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 3.0, 3.0, 3.0, 9.0, 6.0, 8.0, 6.0, 16.0, 24.0, 26.0, 24.0, 28.0, 38.0, 35.0, 42.0, 41.0, 48.0, 48.0, 56.0, 47.0, 44.0, 36.0, 51.0, 49.0, 41.0, 34.0, 42.0, 27.0, 31.0, 20.0, 19.0, 15.0, 14.0, 13.0, 7.0, 9.0, 10.0, 8.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.455078125, -2.3778076171875, -2.300537109375, -2.2232666015625, -2.14599609375, -2.0687255859375, -1.991455078125, -1.9141845703125, -1.8369140625, -1.7596435546875, -1.682373046875, -1.6051025390625, -1.52783203125, -1.4505615234375, -1.373291015625, -1.2960205078125, -1.21875, -1.1414794921875, -1.064208984375, -0.9869384765625, -0.90966796875, -0.8323974609375, -0.755126953125, -0.6778564453125, -0.6005859375, -0.5233154296875, -0.446044921875, -0.3687744140625, -0.29150390625, -0.2142333984375, -0.136962890625, -0.0596923828125, 0.017578125, 0.0948486328125, 0.172119140625, 0.2493896484375, 0.32666015625, 0.4039306640625, 0.481201171875, 0.5584716796875, 0.6357421875, 0.7130126953125, 0.790283203125, 0.8675537109375, 0.94482421875, 1.0220947265625, 1.099365234375, 1.1766357421875, 1.25390625, 1.3311767578125, 1.408447265625, 1.4857177734375, 1.56298828125, 1.6402587890625, 1.717529296875, 1.7947998046875, 1.8720703125, 1.9493408203125, 2.026611328125, 2.1038818359375, 2.18115234375, 2.2584228515625, 2.335693359375, 2.4129638671875, 2.490234375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 10.0, 13.0, 20.0, 25.0, 36.0, 44.0, 83.0, 123.0, 167.0, 257.0, 411.0, 746.0, 1258.0, 2272.0, 4536.0, 9860.0, 23357.0, 62969.0, 212381.0, 1544281.0, 1993643.0, 226003.0, 66283.0, 24552.0, 10338.0, 4854.0, 2421.0, 1332.0, 728.0, 465.0, 265.0, 189.0, 114.0, 71.0, 45.0, 30.0, 23.0, 15.0, 14.0, 12.0, 8.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0], "bins": [-17.78125, -17.301025390625, -16.82080078125, -16.340576171875, -15.8603515625, -15.380126953125, -14.89990234375, -14.419677734375, -13.939453125, -13.459228515625, -12.97900390625, -12.498779296875, -12.0185546875, -11.538330078125, -11.05810546875, -10.577880859375, -10.09765625, -9.617431640625, -9.13720703125, -8.656982421875, -8.1767578125, -7.696533203125, -7.21630859375, -6.736083984375, -6.255859375, -5.775634765625, -5.29541015625, -4.815185546875, -4.3349609375, -3.854736328125, -3.37451171875, -2.894287109375, -2.4140625, -1.933837890625, -1.45361328125, -0.973388671875, -0.4931640625, -0.012939453125, 0.46728515625, 0.947509765625, 1.427734375, 1.907958984375, 2.38818359375, 2.868408203125, 3.3486328125, 3.828857421875, 4.30908203125, 4.789306640625, 5.26953125, 5.749755859375, 6.22998046875, 6.710205078125, 7.1904296875, 7.670654296875, 8.15087890625, 8.631103515625, 9.111328125, 9.591552734375, 10.07177734375, 10.552001953125, 11.0322265625, 11.512451171875, 11.99267578125, 12.472900390625, 12.953125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 11.0, 14.0, 12.0, 19.0, 21.0, 50.0, 54.0, 74.0, 106.0, 160.0, 258.0, 444.0, 1149.0, 707.0, 366.0, 183.0, 125.0, 88.0, 44.0, 41.0, 38.0, 21.0, 15.0, 13.0, 9.0, 7.0, 8.0, 8.0, 2.0, 5.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.56640625, -7.342529296875, -7.11865234375, -6.894775390625, -6.6708984375, -6.447021484375, -6.22314453125, -5.999267578125, -5.775390625, -5.551513671875, -5.32763671875, -5.103759765625, -4.8798828125, -4.656005859375, -4.43212890625, -4.208251953125, -3.984375, -3.760498046875, -3.53662109375, -3.312744140625, -3.0888671875, -2.864990234375, -2.64111328125, -2.417236328125, -2.193359375, -1.969482421875, -1.74560546875, -1.521728515625, -1.2978515625, -1.073974609375, -0.85009765625, -0.626220703125, -0.40234375, -0.178466796875, 0.04541015625, 0.269287109375, 0.4931640625, 0.717041015625, 0.94091796875, 1.164794921875, 1.388671875, 1.612548828125, 1.83642578125, 2.060302734375, 2.2841796875, 2.508056640625, 2.73193359375, 2.955810546875, 3.1796875, 3.403564453125, 3.62744140625, 3.851318359375, 4.0751953125, 4.299072265625, 4.52294921875, 4.746826171875, 4.970703125, 5.194580078125, 5.41845703125, 5.642333984375, 5.8662109375, 6.090087890625, 6.31396484375, 6.537841796875, 6.76171875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 11.0, 18.0, 46.0, 82.0, 119.0, 175.0, 178.0, 160.0, 96.0, 54.0, 33.0, 17.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.79619598388672, -123.09005737304688, -120.38392639160156, -117.67779541015625, -114.9716567993164, -112.26551818847656, -109.55938720703125, -106.85325622558594, -104.1471176147461, -101.44097900390625, -98.73484802246094, -96.02871704101562, -93.32257843017578, -90.61643981933594, -87.91030883789062, -85.20417785644531, -82.49803924560547, -79.79190063476562, -77.08576965332031, -74.379638671875, -71.67350006103516, -68.96736145019531, -66.26123046875, -63.55509567260742, -60.848960876464844, -58.142826080322266, -55.43669128417969, -52.73055648803711, -50.02442169189453, -47.31828689575195, -44.612152099609375, -41.9060173034668, -39.19988250732422, -36.49374771118164, -33.78761291503906, -31.081478118896484, -28.375343322753906, -25.669208526611328, -22.96307373046875, -20.256938934326172, -17.550804138183594, -14.844669342041016, -12.138534545898438, -9.43239974975586, -6.726264953613281, -4.020130157470703, -1.313995361328125, 1.3921394348144531, 4.098274230957031, 6.804409027099609, 9.510543823242188, 12.216678619384766, 14.922813415527344, 17.628948211669922, 20.3350830078125, 23.041217803955078, 25.747352600097656, 28.453487396240234, 31.159622192382812, 33.86575698852539, 36.57189178466797, 39.27802658081055, 41.984161376953125, 44.6902961730957, 47.39643096923828]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 1.0, 2.0, 2.0, 4.0, 2.0, 9.0, 8.0, 9.0, 14.0, 11.0, 20.0, 21.0, 24.0, 25.0, 41.0, 26.0, 41.0, 29.0, 30.0, 38.0, 34.0, 60.0, 41.0, 36.0, 37.0, 44.0, 41.0, 34.0, 38.0, 34.0, 37.0, 31.0, 30.0, 27.0, 23.0, 23.0, 13.0, 22.0, 8.0, 8.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.75122833251953, -30.80316734313965, -29.8551082611084, -28.907047271728516, -27.958986282348633, -27.01092529296875, -26.0628662109375, -25.114805221557617, -24.166744232177734, -23.21868324279785, -22.2706241607666, -21.32256317138672, -20.374502182006836, -19.426441192626953, -18.478382110595703, -17.53032112121582, -16.582260131835938, -15.634200096130371, -14.686139106750488, -13.738079071044922, -12.790018081665039, -11.841958045959473, -10.893898010253906, -9.945837020874023, -8.997777938842773, -8.049717903137207, -7.101656913757324, -6.153596878051758, -5.205535888671875, -4.257475852966309, -3.309415340423584, -2.3613548278808594, -1.4132938385009766, -0.46523338556289673, 0.4828270673751831, 1.4308874607086182, 2.3789479732513428, 3.3270082473754883, 4.275068759918213, 5.2231292724609375, 6.171189785003662, 7.119250297546387, 8.067310333251953, 9.015371322631836, 9.963431358337402, 10.911491394042969, 11.859552383422852, 12.807613372802734, 13.7556734085083, 14.703733444213867, 15.65179443359375, 16.599855422973633, 17.547914505004883, 18.495975494384766, 19.44403648376465, 20.39209747314453, 21.34015655517578, 22.288217544555664, 23.236276626586914, 24.184337615966797, 25.13239860534668, 26.080459594726562, 27.028518676757812, 27.976579666137695, 28.924640655517578]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 12.0, 12.0, 15.0, 26.0, 52.0, 105.0, 126.0, 284.0, 659.0, 1494.0, 3815.0, 11180.0, 36224.0, 120401.0, 370121.0, 344716.0, 109478.0, 33264.0, 10379.0, 3485.0, 1457.0, 599.0, 277.0, 149.0, 81.0, 47.0, 27.0, 28.0, 13.0, 10.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.71875, -24.01171875, -23.3046875, -22.59765625, -21.890625, -21.18359375, -20.4765625, -19.76953125, -19.0625, -18.35546875, -17.6484375, -16.94140625, -16.234375, -15.52734375, -14.8203125, -14.11328125, -13.40625, -12.69921875, -11.9921875, -11.28515625, -10.578125, -9.87109375, -9.1640625, -8.45703125, -7.75, -7.04296875, -6.3359375, -5.62890625, -4.921875, -4.21484375, -3.5078125, -2.80078125, -2.09375, -1.38671875, -0.6796875, 0.02734375, 0.734375, 1.44140625, 2.1484375, 2.85546875, 3.5625, 4.26953125, 4.9765625, 5.68359375, 6.390625, 7.09765625, 7.8046875, 8.51171875, 9.21875, 9.92578125, 10.6328125, 11.33984375, 12.046875, 12.75390625, 13.4609375, 14.16796875, 14.875, 15.58203125, 16.2890625, 16.99609375, 17.703125, 18.41015625, 19.1171875, 19.82421875, 20.53125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 7.0, 17.0, 12.0, 19.0, 25.0, 17.0, 23.0, 28.0, 36.0, 44.0, 49.0, 47.0, 43.0, 46.0, 48.0, 49.0, 44.0, 45.0, 49.0, 41.0, 28.0, 23.0, 32.0, 36.0, 23.0, 23.0, 16.0, 19.0, 20.0, 18.0, 6.0, 7.0, 7.0, 10.0, 5.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.47265625, -2.396820068359375, -2.32098388671875, -2.245147705078125, -2.1693115234375, -2.093475341796875, -2.01763916015625, -1.941802978515625, -1.865966796875, -1.790130615234375, -1.71429443359375, -1.638458251953125, -1.5626220703125, -1.486785888671875, -1.41094970703125, -1.335113525390625, -1.25927734375, -1.183441162109375, -1.10760498046875, -1.031768798828125, -0.9559326171875, -0.880096435546875, -0.80426025390625, -0.728424072265625, -0.652587890625, -0.576751708984375, -0.50091552734375, -0.425079345703125, -0.3492431640625, -0.273406982421875, -0.19757080078125, -0.121734619140625, -0.0458984375, 0.029937744140625, 0.10577392578125, 0.181610107421875, 0.2574462890625, 0.333282470703125, 0.40911865234375, 0.484954833984375, 0.560791015625, 0.636627197265625, 0.71246337890625, 0.788299560546875, 0.8641357421875, 0.939971923828125, 1.01580810546875, 1.091644287109375, 1.16748046875, 1.243316650390625, 1.31915283203125, 1.394989013671875, 1.4708251953125, 1.546661376953125, 1.62249755859375, 1.698333740234375, 1.774169921875, 1.850006103515625, 1.92584228515625, 2.001678466796875, 2.0775146484375, 2.153350830078125, 2.22918701171875, 2.305023193359375, 2.380859375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 9.0, 20.0, 11.0, 24.0, 42.0, 67.0, 98.0, 142.0, 209.0, 304.0, 532.0, 813.0, 1454.0, 2584.0, 4666.0, 9083.0, 18618.0, 39371.0, 84179.0, 178231.0, 297148.0, 213470.0, 103597.0, 48248.0, 22349.0, 10796.0, 5445.0, 2886.0, 1630.0, 990.0, 510.0, 342.0, 227.0, 156.0, 81.0, 75.0, 49.0, 27.0, 26.0, 14.0, 5.0, 10.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.46875, -11.0943603515625, -10.719970703125, -10.3455810546875, -9.97119140625, -9.5968017578125, -9.222412109375, -8.8480224609375, -8.4736328125, -8.0992431640625, -7.724853515625, -7.3504638671875, -6.97607421875, -6.6016845703125, -6.227294921875, -5.8529052734375, -5.478515625, -5.1041259765625, -4.729736328125, -4.3553466796875, -3.98095703125, -3.6065673828125, -3.232177734375, -2.8577880859375, -2.4833984375, -2.1090087890625, -1.734619140625, -1.3602294921875, -0.98583984375, -0.6114501953125, -0.237060546875, 0.1373291015625, 0.51171875, 0.8861083984375, 1.260498046875, 1.6348876953125, 2.00927734375, 2.3836669921875, 2.758056640625, 3.1324462890625, 3.5068359375, 3.8812255859375, 4.255615234375, 4.6300048828125, 5.00439453125, 5.3787841796875, 5.753173828125, 6.1275634765625, 6.501953125, 6.8763427734375, 7.250732421875, 7.6251220703125, 7.99951171875, 8.3739013671875, 8.748291015625, 9.1226806640625, 9.4970703125, 9.8714599609375, 10.245849609375, 10.6202392578125, 10.99462890625, 11.3690185546875, 11.743408203125, 12.1177978515625, 12.4921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 9.0, 4.0, 8.0, 12.0, 8.0, 7.0, 20.0, 20.0, 21.0, 19.0, 35.0, 26.0, 35.0, 42.0, 44.0, 63.0, 47.0, 30.0, 38.0, 45.0, 37.0, 50.0, 47.0, 50.0, 37.0, 33.0, 35.0, 33.0, 22.0, 28.0, 13.0, 15.0, 11.0, 16.0, 6.0, 9.0, 4.0, 5.0, 5.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.3203125, -12.9146728515625, -12.509033203125, -12.1033935546875, -11.69775390625, -11.2921142578125, -10.886474609375, -10.4808349609375, -10.0751953125, -9.6695556640625, -9.263916015625, -8.8582763671875, -8.45263671875, -8.0469970703125, -7.641357421875, -7.2357177734375, -6.830078125, -6.4244384765625, -6.018798828125, -5.6131591796875, -5.20751953125, -4.8018798828125, -4.396240234375, -3.9906005859375, -3.5849609375, -3.1793212890625, -2.773681640625, -2.3680419921875, -1.96240234375, -1.5567626953125, -1.151123046875, -0.7454833984375, -0.33984375, 0.0657958984375, 0.471435546875, 0.8770751953125, 1.28271484375, 1.6883544921875, 2.093994140625, 2.4996337890625, 2.9052734375, 3.3109130859375, 3.716552734375, 4.1221923828125, 4.52783203125, 4.9334716796875, 5.339111328125, 5.7447509765625, 6.150390625, 6.5560302734375, 6.961669921875, 7.3673095703125, 7.77294921875, 8.1785888671875, 8.584228515625, 8.9898681640625, 9.3955078125, 9.8011474609375, 10.206787109375, 10.6124267578125, 11.01806640625, 11.4237060546875, 11.829345703125, 12.2349853515625, 12.640625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 13.0, 10.0, 26.0, 31.0, 33.0, 58.0, 83.0, 143.0, 232.0, 323.0, 574.0, 881.0, 1577.0, 2716.0, 5274.0, 10403.0, 22957.0, 59866.0, 227940.0, 498978.0, 137863.0, 42821.0, 17596.0, 8113.0, 4256.0, 2289.0, 1328.0, 851.0, 498.0, 281.0, 198.0, 108.0, 78.0, 49.0, 27.0, 22.0, 18.0, 11.0, 12.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-13.9453125, -13.5391845703125, -13.133056640625, -12.7269287109375, -12.32080078125, -11.9146728515625, -11.508544921875, -11.1024169921875, -10.6962890625, -10.2901611328125, -9.884033203125, -9.4779052734375, -9.07177734375, -8.6656494140625, -8.259521484375, -7.8533935546875, -7.447265625, -7.0411376953125, -6.635009765625, -6.2288818359375, -5.82275390625, -5.4166259765625, -5.010498046875, -4.6043701171875, -4.1982421875, -3.7921142578125, -3.385986328125, -2.9798583984375, -2.57373046875, -2.1676025390625, -1.761474609375, -1.3553466796875, -0.94921875, -0.5430908203125, -0.136962890625, 0.2691650390625, 0.67529296875, 1.0814208984375, 1.487548828125, 1.8936767578125, 2.2998046875, 2.7059326171875, 3.112060546875, 3.5181884765625, 3.92431640625, 4.3304443359375, 4.736572265625, 5.1427001953125, 5.548828125, 5.9549560546875, 6.361083984375, 6.7672119140625, 7.17333984375, 7.5794677734375, 7.985595703125, 8.3917236328125, 8.7978515625, 9.2039794921875, 9.610107421875, 10.0162353515625, 10.42236328125, 10.8284912109375, 11.234619140625, 11.6407470703125, 12.046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 7.0, 13.0, 8.0, 14.0, 26.0, 33.0, 28.0, 44.0, 85.0, 139.0, 207.0, 141.0, 77.0, 29.0, 38.0, 31.0, 16.0, 15.0, 10.0, 13.0, 6.0, 6.0, 5.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034961700439453125, -0.003368884325027466, -0.003241598606109619, -0.0031143128871917725, -0.0029870271682739258, -0.002859741449356079, -0.0027324557304382324, -0.0026051700115203857, -0.002477884292602539, -0.0023505985736846924, -0.0022233128547668457, -0.002096027135848999, -0.0019687414169311523, -0.0018414556980133057, -0.001714169979095459, -0.0015868842601776123, -0.0014595985412597656, -0.001332312822341919, -0.0012050271034240723, -0.0010777413845062256, -0.0009504556655883789, -0.0008231699466705322, -0.0006958842277526855, -0.0005685985088348389, -0.0004413127899169922, -0.0003140270709991455, -0.00018674135208129883, -5.945563316345215e-05, 6.783008575439453e-05, 0.0001951158046722412, 0.0003224015235900879, 0.00044968724250793457, 0.0005769729614257812, 0.0007042586803436279, 0.0008315443992614746, 0.0009588301181793213, 0.001086115837097168, 0.0012134015560150146, 0.0013406872749328613, 0.001467972993850708, 0.0015952587127685547, 0.0017225444316864014, 0.001849830150604248, 0.0019771158695220947, 0.0021044015884399414, 0.002231687307357788, 0.0023589730262756348, 0.0024862587451934814, 0.002613544464111328, 0.002740830183029175, 0.0028681159019470215, 0.002995401620864868, 0.003122687339782715, 0.0032499730587005615, 0.003377258777618408, 0.003504544496536255, 0.0036318302154541016, 0.0037591159343719482, 0.003886401653289795, 0.004013687372207642, 0.004140973091125488, 0.004268258810043335, 0.004395544528961182, 0.004522830247879028, 0.004650115966796875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 1.0, 7.0, 6.0, 10.0, 16.0, 23.0, 36.0, 43.0, 69.0, 97.0, 138.0, 234.0, 334.0, 524.0, 926.0, 1413.0, 2392.0, 4330.0, 8102.0, 15262.0, 32345.0, 83943.0, 346653.0, 387688.0, 92949.0, 34666.0, 16392.0, 8612.0, 4600.0, 2687.0, 1515.0, 894.0, 515.0, 348.0, 238.0, 161.0, 115.0, 80.0, 55.0, 35.0, 28.0, 16.0, 17.0, 10.0, 8.0, 5.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.6328125, -11.269775390625, -10.90673828125, -10.543701171875, -10.1806640625, -9.817626953125, -9.45458984375, -9.091552734375, -8.728515625, -8.365478515625, -8.00244140625, -7.639404296875, -7.2763671875, -6.913330078125, -6.55029296875, -6.187255859375, -5.82421875, -5.461181640625, -5.09814453125, -4.735107421875, -4.3720703125, -4.009033203125, -3.64599609375, -3.282958984375, -2.919921875, -2.556884765625, -2.19384765625, -1.830810546875, -1.4677734375, -1.104736328125, -0.74169921875, -0.378662109375, -0.015625, 0.347412109375, 0.71044921875, 1.073486328125, 1.4365234375, 1.799560546875, 2.16259765625, 2.525634765625, 2.888671875, 3.251708984375, 3.61474609375, 3.977783203125, 4.3408203125, 4.703857421875, 5.06689453125, 5.429931640625, 5.79296875, 6.156005859375, 6.51904296875, 6.882080078125, 7.2451171875, 7.608154296875, 7.97119140625, 8.334228515625, 8.697265625, 9.060302734375, 9.42333984375, 9.786376953125, 10.1494140625, 10.512451171875, 10.87548828125, 11.238525390625, 11.6015625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 1.0, 6.0, 9.0, 4.0, 6.0, 13.0, 17.0, 15.0, 19.0, 33.0, 48.0, 55.0, 84.0, 95.0, 129.0, 136.0, 90.0, 56.0, 53.0, 23.0, 24.0, 12.0, 10.0, 11.0, 9.0, 11.0, 2.0, 6.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.5491943359375, -11.184326171875, -10.8194580078125, -10.45458984375, -10.0897216796875, -9.724853515625, -9.3599853515625, -8.9951171875, -8.6302490234375, -8.265380859375, -7.9005126953125, -7.53564453125, -7.1707763671875, -6.805908203125, -6.4410400390625, -6.076171875, -5.7113037109375, -5.346435546875, -4.9815673828125, -4.61669921875, -4.2518310546875, -3.886962890625, -3.5220947265625, -3.1572265625, -2.7923583984375, -2.427490234375, -2.0626220703125, -1.69775390625, -1.3328857421875, -0.968017578125, -0.6031494140625, -0.23828125, 0.1265869140625, 0.491455078125, 0.8563232421875, 1.22119140625, 1.5860595703125, 1.950927734375, 2.3157958984375, 2.6806640625, 3.0455322265625, 3.410400390625, 3.7752685546875, 4.14013671875, 4.5050048828125, 4.869873046875, 5.2347412109375, 5.599609375, 5.9644775390625, 6.329345703125, 6.6942138671875, 7.05908203125, 7.4239501953125, 7.788818359375, 8.1536865234375, 8.5185546875, 8.8834228515625, 9.248291015625, 9.6131591796875, 9.97802734375, 10.3428955078125, 10.707763671875, 11.0726318359375, 11.4375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 5.0, 18.0, 57.0, 132.0, 230.0, 243.0, 174.0, 77.0, 40.0, 14.0, 8.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-416.04974365234375, -407.0478820800781, -398.0460205078125, -389.044189453125, -380.0423278808594, -371.04046630859375, -362.0386047363281, -353.0367431640625, -344.034912109375, -335.0330505371094, -326.03118896484375, -317.02935791015625, -308.0274963378906, -299.025634765625, -290.0237731933594, -281.02191162109375, -272.0200500488281, -263.0181884765625, -254.01634216308594, -245.0144805908203, -236.01263427734375, -227.01077270507812, -218.0089111328125, -209.00704956054688, -200.0052032470703, -191.0033416748047, -182.00149536132812, -172.9996337890625, -163.99777221679688, -154.9959259033203, -145.9940643310547, -136.99221801757812, -127.99037170410156, -118.98851776123047, -109.98666381835938, -100.98480224609375, -91.98294830322266, -82.98109436035156, -73.97923278808594, -64.97737884521484, -55.97552490234375, -46.973670959472656, -37.9718132019043, -28.96995735168457, -19.968101501464844, -10.96624755859375, -1.9643898010253906, 7.037467956542969, 16.039321899414062, 25.04117774963379, 34.043033599853516, 43.044891357421875, 52.04674530029297, 61.04859924316406, 70.05046081542969, 79.05231475830078, 88.05416870117188, 97.05602264404297, 106.05787658691406, 115.05973815917969, 124.06159210205078, 133.06344604492188, 142.0653076171875, 151.06716918945312, 160.0690155029297]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 2.0, 6.0, 8.0, 13.0, 4.0, 10.0, 11.0, 16.0, 14.0, 21.0, 20.0, 29.0, 30.0, 35.0, 29.0, 37.0, 30.0, 39.0, 46.0, 49.0, 53.0, 49.0, 37.0, 35.0, 39.0, 43.0, 30.0, 35.0, 35.0, 23.0, 26.0, 28.0, 18.0, 21.0, 9.0, 14.0, 13.0, 7.0, 5.0, 7.0, 6.0, 3.0, 7.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.68264770507812, -72.4303970336914, -70.17814636230469, -67.92589569091797, -65.67364501953125, -63.421390533447266, -61.16913604736328, -58.91688537597656, -56.664634704589844, -54.412384033203125, -52.160133361816406, -49.90787887573242, -47.6556282043457, -45.403377532958984, -43.151123046875, -40.89887237548828, -38.64662170410156, -36.394371032714844, -34.142120361328125, -31.88986587524414, -29.637615203857422, -27.385364532470703, -25.13311195373535, -22.880859375, -20.62860870361328, -18.376358032226562, -16.12410545349121, -13.871853828430176, -11.61960220336914, -9.367350578308105, -7.11509895324707, -4.862847328186035, -2.610595703125, -0.35834407806396484, 1.8939075469970703, 4.1461591720581055, 6.398410797119141, 8.650662422180176, 10.902914047241211, 13.155165672302246, 15.407417297363281, 17.65966796875, 19.91192054748535, 22.164173126220703, 24.416423797607422, 26.66867446899414, 28.920927047729492, 31.173179626464844, 33.42543029785156, 35.67768096923828, 37.929931640625, 40.182186126708984, 42.4344367980957, 44.68668746948242, 46.938941955566406, 49.191192626953125, 51.443443298339844, 53.69569396972656, 55.94794464111328, 58.200199127197266, 60.452449798583984, 62.7047004699707, 64.95695495605469, 67.2092056274414, 69.46145629882812]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 10.0, 13.0, 17.0, 26.0, 71.0, 94.0, 191.0, 437.0, 1054.0, 2893.0, 8800.0, 36381.0, 340907.0, 3686628.0, 91786.0, 17183.0, 4826.0, 1654.0, 664.0, 322.0, 142.0, 68.0, 32.0, 23.0, 16.0, 13.0, 7.0, 8.0, 9.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.09375, -26.16748046875, -25.2412109375, -24.31494140625, -23.388671875, -22.46240234375, -21.5361328125, -20.60986328125, -19.68359375, -18.75732421875, -17.8310546875, -16.90478515625, -15.978515625, -15.05224609375, -14.1259765625, -13.19970703125, -12.2734375, -11.34716796875, -10.4208984375, -9.49462890625, -8.568359375, -7.64208984375, -6.7158203125, -5.78955078125, -4.86328125, -3.93701171875, -3.0107421875, -2.08447265625, -1.158203125, -0.23193359375, 0.6943359375, 1.62060546875, 2.546875, 3.47314453125, 4.3994140625, 5.32568359375, 6.251953125, 7.17822265625, 8.1044921875, 9.03076171875, 9.95703125, 10.88330078125, 11.8095703125, 12.73583984375, 13.662109375, 14.58837890625, 15.5146484375, 16.44091796875, 17.3671875, 18.29345703125, 19.2197265625, 20.14599609375, 21.072265625, 21.99853515625, 22.9248046875, 23.85107421875, 24.77734375, 25.70361328125, 26.6298828125, 27.55615234375, 28.482421875, 29.40869140625, 30.3349609375, 31.26123046875, 32.1875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 7.0, 9.0, 9.0, 14.0, 22.0, 22.0, 27.0, 26.0, 31.0, 29.0, 30.0, 41.0, 46.0, 42.0, 36.0, 42.0, 49.0, 37.0, 45.0, 55.0, 36.0, 33.0, 38.0, 30.0, 33.0, 29.0, 29.0, 14.0, 19.0, 20.0, 17.0, 11.0, 9.0, 8.0, 13.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.3828125, -2.303802490234375, -2.22479248046875, -2.145782470703125, -2.0667724609375, -1.987762451171875, -1.90875244140625, -1.829742431640625, -1.750732421875, -1.671722412109375, -1.59271240234375, -1.513702392578125, -1.4346923828125, -1.355682373046875, -1.27667236328125, -1.197662353515625, -1.11865234375, -1.039642333984375, -0.96063232421875, -0.881622314453125, -0.8026123046875, -0.723602294921875, -0.64459228515625, -0.565582275390625, -0.486572265625, -0.407562255859375, -0.32855224609375, -0.249542236328125, -0.1705322265625, -0.091522216796875, -0.01251220703125, 0.066497802734375, 0.1455078125, 0.224517822265625, 0.30352783203125, 0.382537841796875, 0.4615478515625, 0.540557861328125, 0.61956787109375, 0.698577880859375, 0.777587890625, 0.856597900390625, 0.93560791015625, 1.014617919921875, 1.0936279296875, 1.172637939453125, 1.25164794921875, 1.330657958984375, 1.40966796875, 1.488677978515625, 1.56768798828125, 1.646697998046875, 1.7257080078125, 1.804718017578125, 1.88372802734375, 1.962738037109375, 2.041748046875, 2.120758056640625, 2.19976806640625, 2.278778076171875, 2.3577880859375, 2.436798095703125, 2.51580810546875, 2.594818115234375, 2.673828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 4.0, 11.0, 21.0, 16.0, 28.0, 55.0, 83.0, 129.0, 202.0, 313.0, 539.0, 904.0, 1644.0, 3262.0, 6652.0, 15689.0, 42366.0, 166435.0, 2988183.0, 811267.0, 103378.0, 30452.0, 11558.0, 5073.0, 2682.0, 1362.0, 771.0, 437.0, 262.0, 176.0, 118.0, 54.0, 45.0, 38.0, 29.0, 12.0, 7.0, 10.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.875, -21.208984375, -20.54296875, -19.876953125, -19.2109375, -18.544921875, -17.87890625, -17.212890625, -16.546875, -15.880859375, -15.21484375, -14.548828125, -13.8828125, -13.216796875, -12.55078125, -11.884765625, -11.21875, -10.552734375, -9.88671875, -9.220703125, -8.5546875, -7.888671875, -7.22265625, -6.556640625, -5.890625, -5.224609375, -4.55859375, -3.892578125, -3.2265625, -2.560546875, -1.89453125, -1.228515625, -0.5625, 0.103515625, 0.76953125, 1.435546875, 2.1015625, 2.767578125, 3.43359375, 4.099609375, 4.765625, 5.431640625, 6.09765625, 6.763671875, 7.4296875, 8.095703125, 8.76171875, 9.427734375, 10.09375, 10.759765625, 11.42578125, 12.091796875, 12.7578125, 13.423828125, 14.08984375, 14.755859375, 15.421875, 16.087890625, 16.75390625, 17.419921875, 18.0859375, 18.751953125, 19.41796875, 20.083984375, 20.75]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 5.0, 5.0, 9.0, 7.0, 6.0, 12.0, 16.0, 23.0, 26.0, 34.0, 60.0, 104.0, 133.0, 259.0, 700.0, 1666.0, 426.0, 218.0, 112.0, 62.0, 45.0, 38.0, 19.0, 19.0, 20.0, 11.0, 11.0, 10.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48046875, -5.23468017578125, -4.9888916015625, -4.74310302734375, -4.497314453125, -4.25152587890625, -4.0057373046875, -3.75994873046875, -3.51416015625, -3.26837158203125, -3.0225830078125, -2.77679443359375, -2.531005859375, -2.28521728515625, -2.0394287109375, -1.79364013671875, -1.5478515625, -1.30206298828125, -1.0562744140625, -0.81048583984375, -0.564697265625, -0.31890869140625, -0.0731201171875, 0.17266845703125, 0.41845703125, 0.66424560546875, 0.9100341796875, 1.15582275390625, 1.401611328125, 1.64739990234375, 1.8931884765625, 2.13897705078125, 2.384765625, 2.63055419921875, 2.8763427734375, 3.12213134765625, 3.367919921875, 3.61370849609375, 3.8594970703125, 4.10528564453125, 4.35107421875, 4.59686279296875, 4.8426513671875, 5.08843994140625, 5.334228515625, 5.58001708984375, 5.8258056640625, 6.07159423828125, 6.3173828125, 6.56317138671875, 6.8089599609375, 7.05474853515625, 7.300537109375, 7.54632568359375, 7.7921142578125, 8.03790283203125, 8.28369140625, 8.52947998046875, 8.7752685546875, 9.02105712890625, 9.266845703125, 9.51263427734375, 9.7584228515625, 10.00421142578125, 10.25]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 10.0, 11.0, 15.0, 14.0, 32.0, 46.0, 56.0, 67.0, 94.0, 89.0, 109.0, 86.0, 91.0, 76.0, 68.0, 34.0, 32.0, 34.0, 16.0, 6.0, 2.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.06221008300781, -60.53546905517578, -59.008731842041016, -57.481990814208984, -55.95525360107422, -54.42851257324219, -52.901771545410156, -51.375030517578125, -49.84829330444336, -48.32155227661133, -46.79481506347656, -45.26807403564453, -43.7413330078125, -42.214595794677734, -40.6878547668457, -39.16111755371094, -37.634376525878906, -36.107635498046875, -34.58089828491211, -33.05415725708008, -31.52741813659668, -30.00067901611328, -28.47393798828125, -26.94719886779785, -25.420459747314453, -23.893720626831055, -22.366981506347656, -20.840240478515625, -19.313501358032227, -17.786762237548828, -16.260021209716797, -14.733282089233398, -13.20654296875, -11.679803848266602, -10.153063774108887, -8.626323699951172, -7.099584579467773, -5.572844982147217, -4.04610538482666, -2.5193653106689453, -0.9926261901855469, 0.5341134071350098, 2.0608530044555664, 3.587592601776123, 5.11433219909668, 6.641071796417236, 8.167811393737793, 9.694551467895508, 11.221290588378906, 12.748029708862305, 14.27476978302002, 15.801509857177734, 17.328248977661133, 18.85498809814453, 20.381729125976562, 21.90846824645996, 23.43520736694336, 24.961946487426758, 26.488685607910156, 28.015426635742188, 29.542165756225586, 31.068904876708984, 32.595645904541016, 34.12238311767578, 35.64912414550781]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 6.0, 5.0, 6.0, 8.0, 8.0, 13.0, 17.0, 22.0, 23.0, 36.0, 29.0, 33.0, 36.0, 40.0, 51.0, 42.0, 42.0, 43.0, 50.0, 53.0, 47.0, 37.0, 43.0, 54.0, 32.0, 38.0, 28.0, 29.0, 31.0, 19.0, 16.0, 12.0, 13.0, 9.0, 8.0, 8.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.675498962402344, -30.72734260559082, -29.77918815612793, -28.831031799316406, -27.882877349853516, -26.934720993041992, -25.98656463623047, -25.038410186767578, -24.090255737304688, -23.142099380493164, -22.193944931030273, -21.24578857421875, -20.29763412475586, -19.349477767944336, -18.401321411132812, -17.453166961669922, -16.5050106048584, -15.556855201721191, -14.608699798583984, -13.660543441772461, -12.71238899230957, -11.764232635498047, -10.81607723236084, -9.867921829223633, -8.919766426086426, -7.971611022949219, -7.023455619812012, -6.0752997398376465, -5.1271443367004395, -4.178988933563232, -3.230833053588867, -2.28267765045166, -1.3345203399658203, -0.38636481761932373, 0.5617907047271729, 1.509946346282959, 2.458101749420166, 3.406257152557373, 4.354413032531738, 5.302568435668945, 6.250723838806152, 7.198879241943359, 8.147034645080566, 9.095190048217773, 10.043346405029297, 10.991500854492188, 11.939657211303711, 12.887812614440918, 13.835968017578125, 14.784123420715332, 15.732278823852539, 16.680435180664062, 17.628589630126953, 18.576745986938477, 19.52490234375, 20.47305679321289, 21.42121124267578, 22.369367599487305, 23.317522048950195, 24.26567840576172, 25.21383285522461, 26.161989212036133, 27.110145568847656, 28.058300018310547, 29.00645637512207]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 12.0, 13.0, 8.0, 26.0, 35.0, 51.0, 73.0, 126.0, 206.0, 296.0, 462.0, 764.0, 1311.0, 2301.0, 3905.0, 7098.0, 12875.0, 24889.0, 46846.0, 88059.0, 161587.0, 241891.0, 203603.0, 117416.0, 62538.0, 33349.0, 17510.0, 9180.0, 5109.0, 2826.0, 1652.0, 972.0, 553.0, 357.0, 234.0, 136.0, 95.0, 57.0, 41.0, 24.0, 20.0, 16.0, 9.0, 7.0, 6.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.7578125, -11.3485107421875, -10.939208984375, -10.5299072265625, -10.12060546875, -9.7113037109375, -9.302001953125, -8.8927001953125, -8.4833984375, -8.0740966796875, -7.664794921875, -7.2554931640625, -6.84619140625, -6.4368896484375, -6.027587890625, -5.6182861328125, -5.208984375, -4.7996826171875, -4.390380859375, -3.9810791015625, -3.57177734375, -3.1624755859375, -2.753173828125, -2.3438720703125, -1.9345703125, -1.5252685546875, -1.115966796875, -0.7066650390625, -0.29736328125, 0.1119384765625, 0.521240234375, 0.9305419921875, 1.33984375, 1.7491455078125, 2.158447265625, 2.5677490234375, 2.97705078125, 3.3863525390625, 3.795654296875, 4.2049560546875, 4.6142578125, 5.0235595703125, 5.432861328125, 5.8421630859375, 6.25146484375, 6.6607666015625, 7.070068359375, 7.4793701171875, 7.888671875, 8.2979736328125, 8.707275390625, 9.1165771484375, 9.52587890625, 9.9351806640625, 10.344482421875, 10.7537841796875, 11.1630859375, 11.5723876953125, 11.981689453125, 12.3909912109375, 12.80029296875, 13.2095947265625, 13.618896484375, 14.0281982421875, 14.4375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 14.0, 5.0, 15.0, 6.0, 18.0, 12.0, 23.0, 20.0, 24.0, 30.0, 37.0, 33.0, 47.0, 43.0, 38.0, 35.0, 44.0, 49.0, 34.0, 38.0, 48.0, 49.0, 43.0, 36.0, 41.0, 28.0, 21.0, 26.0, 20.0, 17.0, 22.0, 10.0, 9.0, 11.0, 5.0, 5.0, 9.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.73828125, -2.652679443359375, -2.56707763671875, -2.481475830078125, -2.3958740234375, -2.310272216796875, -2.22467041015625, -2.139068603515625, -2.053466796875, -1.967864990234375, -1.88226318359375, -1.796661376953125, -1.7110595703125, -1.625457763671875, -1.53985595703125, -1.454254150390625, -1.36865234375, -1.283050537109375, -1.19744873046875, -1.111846923828125, -1.0262451171875, -0.940643310546875, -0.85504150390625, -0.769439697265625, -0.683837890625, -0.598236083984375, -0.51263427734375, -0.427032470703125, -0.3414306640625, -0.255828857421875, -0.17022705078125, -0.084625244140625, 0.0009765625, 0.086578369140625, 0.17218017578125, 0.257781982421875, 0.3433837890625, 0.428985595703125, 0.51458740234375, 0.600189208984375, 0.685791015625, 0.771392822265625, 0.85699462890625, 0.942596435546875, 1.0281982421875, 1.113800048828125, 1.19940185546875, 1.285003662109375, 1.37060546875, 1.456207275390625, 1.54180908203125, 1.627410888671875, 1.7130126953125, 1.798614501953125, 1.88421630859375, 1.969818115234375, 2.055419921875, 2.141021728515625, 2.22662353515625, 2.312225341796875, 2.3978271484375, 2.483428955078125, 2.56903076171875, 2.654632568359375, 2.740234375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 7.0, 6.0, 6.0, 15.0, 21.0, 27.0, 27.0, 41.0, 61.0, 93.0, 124.0, 169.0, 251.0, 329.0, 587.0, 945.0, 1521.0, 2737.0, 5064.0, 9963.0, 19994.0, 40800.0, 85489.0, 177633.0, 295647.0, 208212.0, 101115.0, 48504.0, 23562.0, 11595.0, 6008.0, 3279.0, 1801.0, 991.0, 644.0, 410.0, 275.0, 170.0, 137.0, 97.0, 36.0, 38.0, 39.0, 25.0, 22.0, 10.0, 11.0, 6.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4609375, -13.03515625, -12.609375, -12.18359375, -11.7578125, -11.33203125, -10.90625, -10.48046875, -10.0546875, -9.62890625, -9.203125, -8.77734375, -8.3515625, -7.92578125, -7.5, -7.07421875, -6.6484375, -6.22265625, -5.796875, -5.37109375, -4.9453125, -4.51953125, -4.09375, -3.66796875, -3.2421875, -2.81640625, -2.390625, -1.96484375, -1.5390625, -1.11328125, -0.6875, -0.26171875, 0.1640625, 0.58984375, 1.015625, 1.44140625, 1.8671875, 2.29296875, 2.71875, 3.14453125, 3.5703125, 3.99609375, 4.421875, 4.84765625, 5.2734375, 5.69921875, 6.125, 6.55078125, 6.9765625, 7.40234375, 7.828125, 8.25390625, 8.6796875, 9.10546875, 9.53125, 9.95703125, 10.3828125, 10.80859375, 11.234375, 11.66015625, 12.0859375, 12.51171875, 12.9375, 13.36328125, 13.7890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 6.0, 5.0, 7.0, 8.0, 10.0, 13.0, 17.0, 16.0, 22.0, 27.0, 14.0, 35.0, 35.0, 31.0, 33.0, 36.0, 40.0, 52.0, 35.0, 40.0, 59.0, 51.0, 34.0, 43.0, 46.0, 37.0, 32.0, 29.0, 30.0, 26.0, 28.0, 24.0, 11.0, 15.0, 9.0, 10.0, 10.0, 6.0, 7.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.828125, -14.3494873046875, -13.870849609375, -13.3922119140625, -12.91357421875, -12.4349365234375, -11.956298828125, -11.4776611328125, -10.9990234375, -10.5203857421875, -10.041748046875, -9.5631103515625, -9.08447265625, -8.6058349609375, -8.127197265625, -7.6485595703125, -7.169921875, -6.6912841796875, -6.212646484375, -5.7340087890625, -5.25537109375, -4.7767333984375, -4.298095703125, -3.8194580078125, -3.3408203125, -2.8621826171875, -2.383544921875, -1.9049072265625, -1.42626953125, -0.9476318359375, -0.468994140625, 0.0096435546875, 0.48828125, 0.9669189453125, 1.445556640625, 1.9241943359375, 2.40283203125, 2.8814697265625, 3.360107421875, 3.8387451171875, 4.3173828125, 4.7960205078125, 5.274658203125, 5.7532958984375, 6.23193359375, 6.7105712890625, 7.189208984375, 7.6678466796875, 8.146484375, 8.6251220703125, 9.103759765625, 9.5823974609375, 10.06103515625, 10.5396728515625, 11.018310546875, 11.4969482421875, 11.9755859375, 12.4542236328125, 12.932861328125, 13.4114990234375, 13.89013671875, 14.3687744140625, 14.847412109375, 15.3260498046875, 15.8046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 8.0, 12.0, 11.0, 11.0, 26.0, 39.0, 44.0, 59.0, 104.0, 163.0, 274.0, 474.0, 756.0, 1289.0, 2324.0, 4724.0, 9892.0, 23415.0, 60132.0, 207239.0, 490990.0, 158714.0, 49973.0, 20046.0, 8692.0, 4105.0, 2187.0, 1103.0, 646.0, 419.0, 247.0, 142.0, 99.0, 60.0, 46.0, 29.0, 19.0, 16.0, 8.0, 8.0, 11.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.4765625, -15.0133056640625, -14.550048828125, -14.0867919921875, -13.62353515625, -13.1602783203125, -12.697021484375, -12.2337646484375, -11.7705078125, -11.3072509765625, -10.843994140625, -10.3807373046875, -9.91748046875, -9.4542236328125, -8.990966796875, -8.5277099609375, -8.064453125, -7.6011962890625, -7.137939453125, -6.6746826171875, -6.21142578125, -5.7481689453125, -5.284912109375, -4.8216552734375, -4.3583984375, -3.8951416015625, -3.431884765625, -2.9686279296875, -2.50537109375, -2.0421142578125, -1.578857421875, -1.1156005859375, -0.65234375, -0.1890869140625, 0.274169921875, 0.7374267578125, 1.20068359375, 1.6639404296875, 2.127197265625, 2.5904541015625, 3.0537109375, 3.5169677734375, 3.980224609375, 4.4434814453125, 4.90673828125, 5.3699951171875, 5.833251953125, 6.2965087890625, 6.759765625, 7.2230224609375, 7.686279296875, 8.1495361328125, 8.61279296875, 9.0760498046875, 9.539306640625, 10.0025634765625, 10.4658203125, 10.9290771484375, 11.392333984375, 11.8555908203125, 12.31884765625, 12.7821044921875, 13.245361328125, 13.7086181640625, 14.171875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 12.0, 9.0, 20.0, 17.0, 26.0, 35.0, 40.0, 49.0, 95.0, 126.0, 168.0, 107.0, 65.0, 46.0, 34.0, 39.0, 33.0, 16.0, 12.0, 11.0, 5.0, 5.0, 6.0, 3.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00421905517578125, -0.00408405065536499, -0.0039490461349487305, -0.0038140416145324707, -0.003679037094116211, -0.003544032573699951, -0.0034090280532836914, -0.0032740235328674316, -0.003139019012451172, -0.003004014492034912, -0.0028690099716186523, -0.0027340054512023926, -0.002599000930786133, -0.002463996410369873, -0.0023289918899536133, -0.0021939873695373535, -0.0020589828491210938, -0.001923978328704834, -0.0017889738082885742, -0.0016539692878723145, -0.0015189647674560547, -0.001383960247039795, -0.0012489557266235352, -0.0011139512062072754, -0.0009789466857910156, -0.0008439421653747559, -0.0007089376449584961, -0.0005739331245422363, -0.00043892860412597656, -0.0003039240837097168, -0.00016891956329345703, -3.3915042877197266e-05, 0.0001010894775390625, 0.00023609399795532227, 0.00037109851837158203, 0.0005061030387878418, 0.0006411075592041016, 0.0007761120796203613, 0.0009111166000366211, 0.0010461211204528809, 0.0011811256408691406, 0.0013161301612854004, 0.0014511346817016602, 0.00158613920211792, 0.0017211437225341797, 0.0018561482429504395, 0.0019911527633666992, 0.002126157283782959, 0.0022611618041992188, 0.0023961663246154785, 0.0025311708450317383, 0.002666175365447998, 0.002801179885864258, 0.0029361844062805176, 0.0030711889266967773, 0.003206193447113037, 0.003341197967529297, 0.0034762024879455566, 0.0036112070083618164, 0.003746211528778076, 0.003881216049194336, 0.004016220569610596, 0.0041512250900268555, 0.004286229610443115, 0.004421234130859375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 3.0, 6.0, 13.0, 25.0, 22.0, 53.0, 73.0, 109.0, 193.0, 326.0, 642.0, 1273.0, 2502.0, 5511.0, 12860.0, 33892.0, 112896.0, 560409.0, 230413.0, 53543.0, 19067.0, 7695.0, 3439.0, 1716.0, 820.0, 438.0, 237.0, 149.0, 79.0, 51.0, 32.0, 21.0, 8.0, 11.0, 6.0, 3.0, 4.0, 0.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.3125, -18.756103515625, -18.19970703125, -17.643310546875, -17.0869140625, -16.530517578125, -15.97412109375, -15.417724609375, -14.861328125, -14.304931640625, -13.74853515625, -13.192138671875, -12.6357421875, -12.079345703125, -11.52294921875, -10.966552734375, -10.41015625, -9.853759765625, -9.29736328125, -8.740966796875, -8.1845703125, -7.628173828125, -7.07177734375, -6.515380859375, -5.958984375, -5.402587890625, -4.84619140625, -4.289794921875, -3.7333984375, -3.177001953125, -2.62060546875, -2.064208984375, -1.5078125, -0.951416015625, -0.39501953125, 0.161376953125, 0.7177734375, 1.274169921875, 1.83056640625, 2.386962890625, 2.943359375, 3.499755859375, 4.05615234375, 4.612548828125, 5.1689453125, 5.725341796875, 6.28173828125, 6.838134765625, 7.39453125, 7.950927734375, 8.50732421875, 9.063720703125, 9.6201171875, 10.176513671875, 10.73291015625, 11.289306640625, 11.845703125, 12.402099609375, 12.95849609375, 13.514892578125, 14.0712890625, 14.627685546875, 15.18408203125, 15.740478515625, 16.296875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 5.0, 7.0, 7.0, 11.0, 11.0, 8.0, 18.0, 22.0, 17.0, 26.0, 29.0, 52.0, 82.0, 100.0, 111.0, 123.0, 80.0, 68.0, 44.0, 29.0, 29.0, 16.0, 17.0, 15.0, 14.0, 8.0, 7.0, 9.0, 5.0, 8.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.71875, -13.32421875, -12.9296875, -12.53515625, -12.140625, -11.74609375, -11.3515625, -10.95703125, -10.5625, -10.16796875, -9.7734375, -9.37890625, -8.984375, -8.58984375, -8.1953125, -7.80078125, -7.40625, -7.01171875, -6.6171875, -6.22265625, -5.828125, -5.43359375, -5.0390625, -4.64453125, -4.25, -3.85546875, -3.4609375, -3.06640625, -2.671875, -2.27734375, -1.8828125, -1.48828125, -1.09375, -0.69921875, -0.3046875, 0.08984375, 0.484375, 0.87890625, 1.2734375, 1.66796875, 2.0625, 2.45703125, 2.8515625, 3.24609375, 3.640625, 4.03515625, 4.4296875, 4.82421875, 5.21875, 5.61328125, 6.0078125, 6.40234375, 6.796875, 7.19140625, 7.5859375, 7.98046875, 8.375, 8.76953125, 9.1640625, 9.55859375, 9.953125, 10.34765625, 10.7421875, 11.13671875, 11.53125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 4.0, 13.0, 19.0, 34.0, 47.0, 65.0, 87.0, 102.0, 126.0, 127.0, 102.0, 96.0, 62.0, 41.0, 13.0, 22.0, 12.0, 7.0, 5.0, 2.0, 7.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-177.1421661376953, -171.5607452392578, -165.97933959960938, -160.39791870117188, -154.81649780273438, -149.23507690429688, -143.65365600585938, -138.07225036621094, -132.49082946777344, -126.90940856933594, -121.32799530029297, -115.74658203125, -110.1651611328125, -104.583740234375, -99.00232696533203, -93.42091369628906, -87.83949279785156, -82.25807189941406, -76.6766586303711, -71.09524536132812, -65.51382446289062, -59.93240737915039, -54.350990295410156, -48.76957321166992, -43.18815612792969, -37.60673904418945, -32.02532196044922, -26.443904876708984, -20.86248779296875, -15.281070709228516, -9.699653625488281, -4.118236541748047, 1.46319580078125, 7.044612884521484, 12.626029968261719, 18.207447052001953, 23.788864135742188, 29.370281219482422, 34.951698303222656, 40.53311538696289, 46.114532470703125, 51.69594955444336, 57.277366638183594, 62.85878372192383, 68.44020080566406, 74.02162170410156, 79.60303497314453, 85.1844482421875, 90.765869140625, 96.3472900390625, 101.92870330810547, 107.51011657714844, 113.09153747558594, 118.67295837402344, 124.2543716430664, 129.83578491210938, 135.41720581054688, 140.99862670898438, 146.58004760742188, 152.1614532470703, 157.7428741455078, 163.3242950439453, 168.90570068359375, 174.48712158203125, 180.06854248046875]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 6.0, 2.0, 4.0, 7.0, 16.0, 12.0, 18.0, 10.0, 21.0, 23.0, 26.0, 38.0, 33.0, 39.0, 31.0, 35.0, 36.0, 46.0, 47.0, 44.0, 48.0, 36.0, 39.0, 42.0, 25.0, 39.0, 42.0, 35.0, 31.0, 27.0, 27.0, 22.0, 16.0, 18.0, 12.0, 9.0, 7.0, 8.0, 10.0, 3.0, 8.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-88.88740539550781, -86.19448852539062, -83.50157928466797, -80.80866241455078, -78.11575317382812, -75.42283630371094, -72.72992706298828, -70.0370101928711, -67.34410095214844, -64.65118408203125, -61.958274841308594, -59.26536178588867, -56.57244873046875, -53.87953567504883, -51.186622619628906, -48.49370574951172, -45.8007926940918, -43.107879638671875, -40.41496658325195, -37.72205352783203, -35.02914047241211, -32.33622741699219, -29.643312454223633, -26.95039939880371, -24.25748634338379, -21.564573287963867, -18.871660232543945, -16.17874526977539, -13.485833168029785, -10.792920112609863, -8.100006103515625, -5.407093048095703, -2.7141799926757812, -0.021266698837280273, 2.6716465950012207, 5.364560127258301, 8.057473182678223, 10.750386238098145, 13.443300247192383, 16.136213302612305, 18.829126358032227, 21.52203941345215, 24.21495246887207, 26.907867431640625, 29.600780487060547, 32.29369354248047, 34.98660659790039, 37.67951965332031, 40.372432708740234, 43.065345764160156, 45.75825881958008, 48.451171875, 51.14408493041992, 53.836997985839844, 56.52991485595703, 59.22282409667969, 61.915740966796875, 64.60865783691406, 67.30156707763672, 69.9944839477539, 72.68739318847656, 75.38031005859375, 78.0732192993164, 80.7661361694336, 83.45904541015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 12.0, 15.0, 28.0, 36.0, 67.0, 113.0, 183.0, 294.0, 571.0, 1116.0, 2356.0, 4994.0, 12271.0, 34586.0, 126741.0, 2600409.0, 1248922.0, 110593.0, 30738.0, 11240.0, 4628.0, 2102.0, 1025.0, 519.0, 277.0, 159.0, 86.0, 73.0, 45.0, 20.0, 17.0, 10.0, 6.0, 5.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.71875, -16.048828125, -15.37890625, -14.708984375, -14.0390625, -13.369140625, -12.69921875, -12.029296875, -11.359375, -10.689453125, -10.01953125, -9.349609375, -8.6796875, -8.009765625, -7.33984375, -6.669921875, -6.0, -5.330078125, -4.66015625, -3.990234375, -3.3203125, -2.650390625, -1.98046875, -1.310546875, -0.640625, 0.029296875, 0.69921875, 1.369140625, 2.0390625, 2.708984375, 3.37890625, 4.048828125, 4.71875, 5.388671875, 6.05859375, 6.728515625, 7.3984375, 8.068359375, 8.73828125, 9.408203125, 10.078125, 10.748046875, 11.41796875, 12.087890625, 12.7578125, 13.427734375, 14.09765625, 14.767578125, 15.4375, 16.107421875, 16.77734375, 17.447265625, 18.1171875, 18.787109375, 19.45703125, 20.126953125, 20.796875, 21.466796875, 22.13671875, 22.806640625, 23.4765625, 24.146484375, 24.81640625, 25.486328125, 26.15625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 5.0, 2.0, 5.0, 7.0, 11.0, 18.0, 18.0, 18.0, 18.0, 32.0, 46.0, 28.0, 38.0, 41.0, 48.0, 25.0, 47.0, 51.0, 46.0, 45.0, 57.0, 41.0, 37.0, 34.0, 34.0, 43.0, 33.0, 27.0, 23.0, 20.0, 19.0, 18.0, 16.0, 10.0, 9.0, 8.0, 10.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.833984375, -2.736328125, -2.638671875, -2.541015625, -2.443359375, -2.345703125, -2.248046875, -2.150390625, -2.052734375, -1.955078125, -1.857421875, -1.759765625, -1.662109375, -1.564453125, -1.466796875, -1.369140625, -1.271484375, -1.173828125, -1.076171875, -0.978515625, -0.880859375, -0.783203125, -0.685546875, -0.587890625, -0.490234375, -0.392578125, -0.294921875, -0.197265625, -0.099609375, -0.001953125, 0.095703125, 0.193359375, 0.291015625, 0.388671875, 0.486328125, 0.583984375, 0.681640625, 0.779296875, 0.876953125, 0.974609375, 1.072265625, 1.169921875, 1.267578125, 1.365234375, 1.462890625, 1.560546875, 1.658203125, 1.755859375, 1.853515625, 1.951171875, 2.048828125, 2.146484375, 2.244140625, 2.341796875, 2.439453125, 2.537109375, 2.634765625, 2.732421875, 2.830078125, 2.927734375, 3.025390625, 3.123046875, 3.220703125, 3.318359375, 3.416015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 10.0, 17.0, 32.0, 27.0, 60.0, 119.0, 194.0, 377.0, 762.0, 1471.0, 3189.0, 7062.0, 17671.0, 49779.0, 183279.0, 2116916.0, 1564445.0, 170636.0, 48203.0, 17181.0, 6822.0, 2985.0, 1442.0, 733.0, 373.0, 221.0, 95.0, 75.0, 46.0, 14.0, 12.0, 13.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.359375, -13.734375, -13.109375, -12.484375, -11.859375, -11.234375, -10.609375, -9.984375, -9.359375, -8.734375, -8.109375, -7.484375, -6.859375, -6.234375, -5.609375, -4.984375, -4.359375, -3.734375, -3.109375, -2.484375, -1.859375, -1.234375, -0.609375, 0.015625, 0.640625, 1.265625, 1.890625, 2.515625, 3.140625, 3.765625, 4.390625, 5.015625, 5.640625, 6.265625, 6.890625, 7.515625, 8.140625, 8.765625, 9.390625, 10.015625, 10.640625, 11.265625, 11.890625, 12.515625, 13.140625, 13.765625, 14.390625, 15.015625, 15.640625, 16.265625, 16.890625, 17.515625, 18.140625, 18.765625, 19.390625, 20.015625, 20.640625, 21.265625, 21.890625, 22.515625, 23.140625, 23.765625, 24.390625, 25.015625, 25.640625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 14.0, 4.0, 17.0, 14.0, 27.0, 38.0, 62.0, 72.0, 117.0, 175.0, 270.0, 455.0, 1224.0, 600.0, 293.0, 185.0, 124.0, 87.0, 63.0, 59.0, 41.0, 20.0, 15.0, 20.0, 14.0, 7.0, 6.0, 9.0, 9.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-8.7421875, -8.4969482421875, -8.251708984375, -8.0064697265625, -7.76123046875, -7.5159912109375, -7.270751953125, -7.0255126953125, -6.7802734375, -6.5350341796875, -6.289794921875, -6.0445556640625, -5.79931640625, -5.5540771484375, -5.308837890625, -5.0635986328125, -4.818359375, -4.5731201171875, -4.327880859375, -4.0826416015625, -3.83740234375, -3.5921630859375, -3.346923828125, -3.1016845703125, -2.8564453125, -2.6112060546875, -2.365966796875, -2.1207275390625, -1.87548828125, -1.6302490234375, -1.385009765625, -1.1397705078125, -0.89453125, -0.6492919921875, -0.404052734375, -0.1588134765625, 0.08642578125, 0.3316650390625, 0.576904296875, 0.8221435546875, 1.0673828125, 1.3126220703125, 1.557861328125, 1.8031005859375, 2.04833984375, 2.2935791015625, 2.538818359375, 2.7840576171875, 3.029296875, 3.2745361328125, 3.519775390625, 3.7650146484375, 4.01025390625, 4.2554931640625, 4.500732421875, 4.7459716796875, 4.9912109375, 5.2364501953125, 5.481689453125, 5.7269287109375, 5.97216796875, 6.2174072265625, 6.462646484375, 6.7078857421875, 6.953125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 16.0, 29.0, 52.0, 90.0, 133.0, 161.0, 165.0, 115.0, 98.0, 67.0, 35.0, 13.0, 9.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.73023986816406, -73.04025268554688, -70.35027313232422, -67.66028594970703, -64.97030639648438, -62.28031921386719, -59.59033203125, -56.90034866333008, -54.210365295410156, -51.520381927490234, -48.83039855957031, -46.140411376953125, -43.4504280090332, -40.76044464111328, -38.070457458496094, -35.38047409057617, -32.69049072265625, -30.000507354736328, -27.310522079467773, -24.62053680419922, -21.930553436279297, -19.240570068359375, -16.55058479309082, -13.860599517822266, -11.170616149902344, -8.480631828308105, -5.790647506713867, -3.100663185119629, -0.4106788635253906, 2.2793054580688477, 4.969289779663086, 7.659275054931641, 10.349266052246094, 13.039250373840332, 15.72923469543457, 18.419219970703125, 21.109203338623047, 23.79918670654297, 26.489171981811523, 29.179157257080078, 31.869140625, 34.55912399291992, 37.249107360839844, 39.93909454345703, 42.62907791137695, 45.319061279296875, 48.00904846191406, 50.699031829833984, 53.389015197753906, 56.07899856567383, 58.76898193359375, 61.45896911621094, 64.14895629882812, 66.83893585205078, 69.52892303466797, 72.21890258789062, 74.90888977050781, 77.598876953125, 80.28885650634766, 82.97884368896484, 85.6688232421875, 88.35881042480469, 91.04879760742188, 93.73878479003906, 96.42876434326172]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 9.0, 10.0, 11.0, 8.0, 10.0, 17.0, 12.0, 13.0, 22.0, 17.0, 16.0, 33.0, 32.0, 31.0, 41.0, 45.0, 49.0, 37.0, 40.0, 35.0, 49.0, 45.0, 34.0, 48.0, 40.0, 35.0, 37.0, 27.0, 26.0, 22.0, 25.0, 20.0, 23.0, 18.0, 11.0, 12.0, 10.0, 1.0, 6.0, 4.0, 9.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-32.12439727783203, -31.17691993713379, -30.229442596435547, -29.281965255737305, -28.334487915039062, -27.38701057434082, -26.439533233642578, -25.492055892944336, -24.544578552246094, -23.59710121154785, -22.64962387084961, -21.702146530151367, -20.754669189453125, -19.807191848754883, -18.85971450805664, -17.9122371673584, -16.964759826660156, -16.017282485961914, -15.069805145263672, -14.12232780456543, -13.174850463867188, -12.227373123168945, -11.279895782470703, -10.332418441772461, -9.384943008422852, -8.43746566772461, -7.489988327026367, -6.542510986328125, -5.595033645629883, -4.647556781768799, -3.7000794410705566, -2.7526021003723145, -1.805124282836914, -0.8576470017433167, 0.08983027935028076, 1.0373075008392334, 1.9847848415374756, 2.9322619438171387, 3.879739284515381, 4.827216625213623, 5.774693965911865, 6.722171306610107, 7.66964864730835, 8.617125511169434, 9.564602851867676, 10.512080192565918, 11.45955753326416, 12.407034873962402, 13.354512214660645, 14.301989555358887, 15.249466896057129, 16.196943283081055, 17.144420623779297, 18.09189796447754, 19.03937530517578, 19.986852645874023, 20.934329986572266, 21.881807327270508, 22.82928466796875, 23.776762008666992, 24.724239349365234, 25.671716690063477, 26.61919403076172, 27.56667137145996, 28.514148712158203]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 4.0, 9.0, 10.0, 9.0, 16.0, 27.0, 45.0, 66.0, 94.0, 140.0, 210.0, 373.0, 524.0, 960.0, 1614.0, 2728.0, 4881.0, 8943.0, 17660.0, 36470.0, 81228.0, 213430.0, 377425.0, 170431.0, 67331.0, 30738.0, 15020.0, 7851.0, 4216.0, 2451.0, 1405.0, 819.0, 496.0, 302.0, 236.0, 116.0, 84.0, 50.0, 42.0, 38.0, 18.0, 11.0, 10.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.828125, -16.30859375, -15.7890625, -15.26953125, -14.75, -14.23046875, -13.7109375, -13.19140625, -12.671875, -12.15234375, -11.6328125, -11.11328125, -10.59375, -10.07421875, -9.5546875, -9.03515625, -8.515625, -7.99609375, -7.4765625, -6.95703125, -6.4375, -5.91796875, -5.3984375, -4.87890625, -4.359375, -3.83984375, -3.3203125, -2.80078125, -2.28125, -1.76171875, -1.2421875, -0.72265625, -0.203125, 0.31640625, 0.8359375, 1.35546875, 1.875, 2.39453125, 2.9140625, 3.43359375, 3.953125, 4.47265625, 4.9921875, 5.51171875, 6.03125, 6.55078125, 7.0703125, 7.58984375, 8.109375, 8.62890625, 9.1484375, 9.66796875, 10.1875, 10.70703125, 11.2265625, 11.74609375, 12.265625, 12.78515625, 13.3046875, 13.82421875, 14.34375, 14.86328125, 15.3828125, 15.90234375, 16.421875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 10.0, 7.0, 3.0, 11.0, 25.0, 28.0, 25.0, 24.0, 26.0, 22.0, 33.0, 43.0, 27.0, 42.0, 25.0, 44.0, 43.0, 39.0, 46.0, 44.0, 38.0, 35.0, 36.0, 28.0, 41.0, 24.0, 27.0, 23.0, 27.0, 15.0, 13.0, 18.0, 14.0, 15.0, 9.0, 8.0, 16.0, 4.0, 6.0, 5.0, 6.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.919921875, -2.831573486328125, -2.74322509765625, -2.654876708984375, -2.5665283203125, -2.478179931640625, -2.38983154296875, -2.301483154296875, -2.213134765625, -2.124786376953125, -2.03643798828125, -1.948089599609375, -1.8597412109375, -1.771392822265625, -1.68304443359375, -1.594696044921875, -1.50634765625, -1.417999267578125, -1.32965087890625, -1.241302490234375, -1.1529541015625, -1.064605712890625, -0.97625732421875, -0.887908935546875, -0.799560546875, -0.711212158203125, -0.62286376953125, -0.534515380859375, -0.4461669921875, -0.357818603515625, -0.26947021484375, -0.181121826171875, -0.0927734375, -0.004425048828125, 0.08392333984375, 0.172271728515625, 0.2606201171875, 0.348968505859375, 0.43731689453125, 0.525665283203125, 0.614013671875, 0.702362060546875, 0.79071044921875, 0.879058837890625, 0.9674072265625, 1.055755615234375, 1.14410400390625, 1.232452392578125, 1.32080078125, 1.409149169921875, 1.49749755859375, 1.585845947265625, 1.6741943359375, 1.762542724609375, 1.85089111328125, 1.939239501953125, 2.027587890625, 2.115936279296875, 2.20428466796875, 2.292633056640625, 2.3809814453125, 2.469329833984375, 2.55767822265625, 2.646026611328125, 2.734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 7.0, 14.0, 16.0, 14.0, 28.0, 17.0, 30.0, 52.0, 67.0, 97.0, 161.0, 244.0, 423.0, 749.0, 1401.0, 2973.0, 6376.0, 15391.0, 41125.0, 139531.0, 541202.0, 208781.0, 54695.0, 19530.0, 7951.0, 3698.0, 1738.0, 915.0, 513.0, 265.0, 177.0, 120.0, 66.0, 48.0, 44.0, 25.0, 22.0, 11.0, 12.0, 9.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.671875, -17.970703125, -17.26953125, -16.568359375, -15.8671875, -15.166015625, -14.46484375, -13.763671875, -13.0625, -12.361328125, -11.66015625, -10.958984375, -10.2578125, -9.556640625, -8.85546875, -8.154296875, -7.453125, -6.751953125, -6.05078125, -5.349609375, -4.6484375, -3.947265625, -3.24609375, -2.544921875, -1.84375, -1.142578125, -0.44140625, 0.259765625, 0.9609375, 1.662109375, 2.36328125, 3.064453125, 3.765625, 4.466796875, 5.16796875, 5.869140625, 6.5703125, 7.271484375, 7.97265625, 8.673828125, 9.375, 10.076171875, 10.77734375, 11.478515625, 12.1796875, 12.880859375, 13.58203125, 14.283203125, 14.984375, 15.685546875, 16.38671875, 17.087890625, 17.7890625, 18.490234375, 19.19140625, 19.892578125, 20.59375, 21.294921875, 21.99609375, 22.697265625, 23.3984375, 24.099609375, 24.80078125, 25.501953125, 26.203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 4.0, 7.0, 7.0, 12.0, 15.0, 12.0, 9.0, 26.0, 15.0, 16.0, 31.0, 34.0, 40.0, 50.0, 47.0, 61.0, 42.0, 52.0, 52.0, 42.0, 51.0, 48.0, 42.0, 41.0, 33.0, 38.0, 37.0, 20.0, 27.0, 8.0, 12.0, 14.0, 4.0, 11.0, 6.0, 1.0, 6.0, 7.0, 2.0, 1.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-17.640625, -17.09228515625, -16.5439453125, -15.99560546875, -15.447265625, -14.89892578125, -14.3505859375, -13.80224609375, -13.25390625, -12.70556640625, -12.1572265625, -11.60888671875, -11.060546875, -10.51220703125, -9.9638671875, -9.41552734375, -8.8671875, -8.31884765625, -7.7705078125, -7.22216796875, -6.673828125, -6.12548828125, -5.5771484375, -5.02880859375, -4.48046875, -3.93212890625, -3.3837890625, -2.83544921875, -2.287109375, -1.73876953125, -1.1904296875, -0.64208984375, -0.09375, 0.45458984375, 1.0029296875, 1.55126953125, 2.099609375, 2.64794921875, 3.1962890625, 3.74462890625, 4.29296875, 4.84130859375, 5.3896484375, 5.93798828125, 6.486328125, 7.03466796875, 7.5830078125, 8.13134765625, 8.6796875, 9.22802734375, 9.7763671875, 10.32470703125, 10.873046875, 11.42138671875, 11.9697265625, 12.51806640625, 13.06640625, 13.61474609375, 14.1630859375, 14.71142578125, 15.259765625, 15.80810546875, 16.3564453125, 16.90478515625, 17.453125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 11.0, 20.0, 32.0, 62.0, 127.0, 319.0, 803.0, 3049.0, 16371.0, 113289.0, 803203.0, 93412.0, 13870.0, 2674.0, 739.0, 261.0, 134.0, 75.0, 36.0, 23.0, 19.0, 6.0, 8.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.78125, -31.950439453125, -31.11962890625, -30.288818359375, -29.4580078125, -28.627197265625, -27.79638671875, -26.965576171875, -26.134765625, -25.303955078125, -24.47314453125, -23.642333984375, -22.8115234375, -21.980712890625, -21.14990234375, -20.319091796875, -19.48828125, -18.657470703125, -17.82666015625, -16.995849609375, -16.1650390625, -15.334228515625, -14.50341796875, -13.672607421875, -12.841796875, -12.010986328125, -11.18017578125, -10.349365234375, -9.5185546875, -8.687744140625, -7.85693359375, -7.026123046875, -6.1953125, -5.364501953125, -4.53369140625, -3.702880859375, -2.8720703125, -2.041259765625, -1.21044921875, -0.379638671875, 0.451171875, 1.281982421875, 2.11279296875, 2.943603515625, 3.7744140625, 4.605224609375, 5.43603515625, 6.266845703125, 7.09765625, 7.928466796875, 8.75927734375, 9.590087890625, 10.4208984375, 11.251708984375, 12.08251953125, 12.913330078125, 13.744140625, 14.574951171875, 15.40576171875, 16.236572265625, 17.0673828125, 17.898193359375, 18.72900390625, 19.559814453125, 20.390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 5.0, 5.0, 2.0, 6.0, 16.0, 8.0, 17.0, 19.0, 21.0, 40.0, 47.0, 98.0, 158.0, 164.0, 130.0, 61.0, 33.0, 33.0, 15.0, 23.0, 15.0, 8.0, 12.0, 9.0, 9.0, 3.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.003582000732421875, -0.003480374813079834, -0.003378748893737793, -0.003277122974395752, -0.003175497055053711, -0.00307387113571167, -0.002972245216369629, -0.002870619297027588, -0.002768993377685547, -0.002667367458343506, -0.002565741539001465, -0.002464115619659424, -0.002362489700317383, -0.002260863780975342, -0.0021592378616333008, -0.0020576119422912598, -0.0019559860229492188, -0.0018543601036071777, -0.0017527341842651367, -0.0016511082649230957, -0.0015494823455810547, -0.0014478564262390137, -0.0013462305068969727, -0.0012446045875549316, -0.0011429786682128906, -0.0010413527488708496, -0.0009397268295288086, -0.0008381009101867676, -0.0007364749908447266, -0.0006348490715026855, -0.0005332231521606445, -0.0004315972328186035, -0.0003299713134765625, -0.00022834539413452148, -0.00012671947479248047, -2.5093555450439453e-05, 7.653236389160156e-05, 0.00017815828323364258, 0.0002797842025756836, 0.0003814101219177246, 0.0004830360412597656, 0.0005846619606018066, 0.0006862878799438477, 0.0007879137992858887, 0.0008895397186279297, 0.0009911656379699707, 0.0010927915573120117, 0.0011944174766540527, 0.0012960433959960938, 0.0013976693153381348, 0.0014992952346801758, 0.0016009211540222168, 0.0017025470733642578, 0.0018041729927062988, 0.0019057989120483398, 0.002007424831390381, 0.002109050750732422, 0.002210676670074463, 0.002312302589416504, 0.002413928508758545, 0.002515554428100586, 0.002617180347442627, 0.002718806266784668, 0.002820432186126709, 0.00292205810546875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 13.0, 9.0, 12.0, 16.0, 29.0, 44.0, 88.0, 117.0, 216.0, 389.0, 708.0, 1784.0, 4917.0, 19016.0, 100055.0, 784166.0, 107904.0, 20364.0, 5169.0, 1756.0, 774.0, 430.0, 227.0, 139.0, 79.0, 41.0, 25.0, 14.0, 10.0, 14.0, 9.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.4375, -22.73828125, -22.0390625, -21.33984375, -20.640625, -19.94140625, -19.2421875, -18.54296875, -17.84375, -17.14453125, -16.4453125, -15.74609375, -15.046875, -14.34765625, -13.6484375, -12.94921875, -12.25, -11.55078125, -10.8515625, -10.15234375, -9.453125, -8.75390625, -8.0546875, -7.35546875, -6.65625, -5.95703125, -5.2578125, -4.55859375, -3.859375, -3.16015625, -2.4609375, -1.76171875, -1.0625, -0.36328125, 0.3359375, 1.03515625, 1.734375, 2.43359375, 3.1328125, 3.83203125, 4.53125, 5.23046875, 5.9296875, 6.62890625, 7.328125, 8.02734375, 8.7265625, 9.42578125, 10.125, 10.82421875, 11.5234375, 12.22265625, 12.921875, 13.62109375, 14.3203125, 15.01953125, 15.71875, 16.41796875, 17.1171875, 17.81640625, 18.515625, 19.21484375, 19.9140625, 20.61328125, 21.3125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 4.0, 9.0, 14.0, 7.0, 17.0, 12.0, 33.0, 40.0, 57.0, 118.0, 191.0, 173.0, 100.0, 57.0, 39.0, 22.0, 18.0, 18.0, 12.0, 8.0, 10.0, 4.0, 4.0, 6.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.3648681640625, -10.925048828125, -10.4852294921875, -10.04541015625, -9.6055908203125, -9.165771484375, -8.7259521484375, -8.2861328125, -7.8463134765625, -7.406494140625, -6.9666748046875, -6.52685546875, -6.0870361328125, -5.647216796875, -5.2073974609375, -4.767578125, -4.3277587890625, -3.887939453125, -3.4481201171875, -3.00830078125, -2.5684814453125, -2.128662109375, -1.6888427734375, -1.2490234375, -0.8092041015625, -0.369384765625, 0.0704345703125, 0.51025390625, 0.9500732421875, 1.389892578125, 1.8297119140625, 2.26953125, 2.7093505859375, 3.149169921875, 3.5889892578125, 4.02880859375, 4.4686279296875, 4.908447265625, 5.3482666015625, 5.7880859375, 6.2279052734375, 6.667724609375, 7.1075439453125, 7.54736328125, 7.9871826171875, 8.427001953125, 8.8668212890625, 9.306640625, 9.7464599609375, 10.186279296875, 10.6260986328125, 11.06591796875, 11.5057373046875, 11.945556640625, 12.3853759765625, 12.8251953125, 13.2650146484375, 13.704833984375, 14.1446533203125, 14.58447265625, 15.0242919921875, 15.464111328125, 15.9039306640625, 16.34375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 9.0, 21.0, 45.0, 80.0, 134.0, 218.0, 200.0, 119.0, 86.0, 43.0, 24.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-179.44461059570312, -171.34413146972656, -163.24366760253906, -155.1431884765625, -147.042724609375, -138.94224548339844, -130.84176635742188, -122.74130249023438, -114.64083099365234, -106.54035949707031, -98.43988800048828, -90.33941650390625, -82.23893737792969, -74.13847351074219, -66.03799438476562, -57.937522888183594, -49.83705139160156, -41.73657989501953, -33.6361083984375, -25.535633087158203, -17.435161590576172, -9.33469009399414, -1.2342147827148438, 6.8662567138671875, 14.966728210449219, 23.06719970703125, 31.167673110961914, 39.26814651489258, 47.36861801147461, 55.46908950805664, 63.56956481933594, 71.67003631591797, 79.7705078125, 87.87097930908203, 95.97145080566406, 104.07192993164062, 112.17239379882812, 120.27287292480469, 128.37335205078125, 136.47381591796875, 144.57427978515625, 152.6747589111328, 160.7752227783203, 168.87570190429688, 176.97616577148438, 185.07664489746094, 193.1771240234375, 201.277587890625, 209.37806701660156, 217.47854614257812, 225.57901000976562, 233.6794891357422, 241.7799530029297, 249.88043212890625, 257.98089599609375, 266.08135986328125, 274.1818542480469, 282.2823181152344, 290.3828125, 298.4832763671875, 306.583740234375, 314.6842041015625, 322.7846984863281, 330.8851623535156, 338.9856262207031]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 7.0, 7.0, 6.0, 9.0, 13.0, 11.0, 28.0, 15.0, 20.0, 20.0, 26.0, 39.0, 24.0, 34.0, 29.0, 28.0, 46.0, 47.0, 52.0, 54.0, 39.0, 44.0, 43.0, 46.0, 37.0, 35.0, 37.0, 29.0, 38.0, 22.0, 19.0, 11.0, 14.0, 18.0, 12.0, 13.0, 10.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-92.78024291992188, -89.91456604003906, -87.04888916015625, -84.1832046508789, -81.3175277709961, -78.45185089111328, -75.58616638183594, -72.72048950195312, -69.85481262207031, -66.9891357421875, -64.12345886230469, -61.257774353027344, -58.39209747314453, -55.52642059326172, -52.66073989868164, -49.79505920410156, -46.92938232421875, -44.06370544433594, -41.19802474975586, -38.33234405517578, -35.46666717529297, -32.600990295410156, -29.735309600830078, -26.869630813598633, -24.003952026367188, -21.138273239135742, -18.272594451904297, -15.406915664672852, -12.541236877441406, -9.675558090209961, -6.809879302978516, -3.9442005157470703, -1.078521728515625, 1.7871570587158203, 4.652835845947266, 7.518514633178711, 10.384193420410156, 13.249872207641602, 16.115550994873047, 18.981229782104492, 21.846908569335938, 24.712587356567383, 27.578266143798828, 30.443944931030273, 33.30962371826172, 36.17530059814453, 39.04098129272461, 41.90666198730469, 44.7723388671875, 47.63801574707031, 50.50369644165039, 53.36937713623047, 56.23505401611328, 59.100730895996094, 61.96641159057617, 64.83209228515625, 67.69776916503906, 70.56344604492188, 73.42912292480469, 76.29480743408203, 79.16048431396484, 82.02616119384766, 84.891845703125, 87.75752258300781, 90.62319946289062]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 13.0, 14.0, 27.0, 45.0, 52.0, 136.0, 216.0, 429.0, 853.0, 1893.0, 4382.0, 12165.0, 39820.0, 217237.0, 3643797.0, 213581.0, 39093.0, 12214.0, 4625.0, 1872.0, 847.0, 456.0, 216.0, 113.0, 68.0, 41.0, 19.0, 15.0, 11.0, 10.0, 2.0, 4.0, 4.0, 1.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.828125, -30.8779296875, -29.927734375, -28.9775390625, -28.02734375, -27.0771484375, -26.126953125, -25.1767578125, -24.2265625, -23.2763671875, -22.326171875, -21.3759765625, -20.42578125, -19.4755859375, -18.525390625, -17.5751953125, -16.625, -15.6748046875, -14.724609375, -13.7744140625, -12.82421875, -11.8740234375, -10.923828125, -9.9736328125, -9.0234375, -8.0732421875, -7.123046875, -6.1728515625, -5.22265625, -4.2724609375, -3.322265625, -2.3720703125, -1.421875, -0.4716796875, 0.478515625, 1.4287109375, 2.37890625, 3.3291015625, 4.279296875, 5.2294921875, 6.1796875, 7.1298828125, 8.080078125, 9.0302734375, 9.98046875, 10.9306640625, 11.880859375, 12.8310546875, 13.78125, 14.7314453125, 15.681640625, 16.6318359375, 17.58203125, 18.5322265625, 19.482421875, 20.4326171875, 21.3828125, 22.3330078125, 23.283203125, 24.2333984375, 25.18359375, 26.1337890625, 27.083984375, 28.0341796875, 28.984375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 8.0, 7.0, 8.0, 4.0, 9.0, 14.0, 21.0, 23.0, 18.0, 31.0, 30.0, 34.0, 37.0, 50.0, 67.0, 54.0, 56.0, 46.0, 54.0, 46.0, 50.0, 56.0, 34.0, 34.0, 29.0, 32.0, 22.0, 24.0, 14.0, 22.0, 14.0, 15.0, 8.0, 13.0, 6.0, 1.0, 5.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.24609375, -4.116943359375, -3.98779296875, -3.858642578125, -3.7294921875, -3.600341796875, -3.47119140625, -3.342041015625, -3.212890625, -3.083740234375, -2.95458984375, -2.825439453125, -2.6962890625, -2.567138671875, -2.43798828125, -2.308837890625, -2.1796875, -2.050537109375, -1.92138671875, -1.792236328125, -1.6630859375, -1.533935546875, -1.40478515625, -1.275634765625, -1.146484375, -1.017333984375, -0.88818359375, -0.759033203125, -0.6298828125, -0.500732421875, -0.37158203125, -0.242431640625, -0.11328125, 0.015869140625, 0.14501953125, 0.274169921875, 0.4033203125, 0.532470703125, 0.66162109375, 0.790771484375, 0.919921875, 1.049072265625, 1.17822265625, 1.307373046875, 1.4365234375, 1.565673828125, 1.69482421875, 1.823974609375, 1.953125, 2.082275390625, 2.21142578125, 2.340576171875, 2.4697265625, 2.598876953125, 2.72802734375, 2.857177734375, 2.986328125, 3.115478515625, 3.24462890625, 3.373779296875, 3.5029296875, 3.632080078125, 3.76123046875, 3.890380859375, 4.01953125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 8.0, 9.0, 28.0, 27.0, 35.0, 40.0, 66.0, 99.0, 163.0, 200.0, 305.0, 386.0, 595.0, 997.0, 1527.0, 2770.0, 5114.0, 9919.0, 21197.0, 52553.0, 169172.0, 1506181.0, 2137915.0, 184023.0, 55608.0, 22327.0, 10274.0, 5246.0, 2731.0, 1704.0, 988.0, 667.0, 400.0, 292.0, 194.0, 140.0, 111.0, 71.0, 55.0, 35.0, 40.0, 20.0, 23.0, 8.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-19.3125, -18.727783203125, -18.14306640625, -17.558349609375, -16.9736328125, -16.388916015625, -15.80419921875, -15.219482421875, -14.634765625, -14.050048828125, -13.46533203125, -12.880615234375, -12.2958984375, -11.711181640625, -11.12646484375, -10.541748046875, -9.95703125, -9.372314453125, -8.78759765625, -8.202880859375, -7.6181640625, -7.033447265625, -6.44873046875, -5.864013671875, -5.279296875, -4.694580078125, -4.10986328125, -3.525146484375, -2.9404296875, -2.355712890625, -1.77099609375, -1.186279296875, -0.6015625, -0.016845703125, 0.56787109375, 1.152587890625, 1.7373046875, 2.322021484375, 2.90673828125, 3.491455078125, 4.076171875, 4.660888671875, 5.24560546875, 5.830322265625, 6.4150390625, 6.999755859375, 7.58447265625, 8.169189453125, 8.75390625, 9.338623046875, 9.92333984375, 10.508056640625, 11.0927734375, 11.677490234375, 12.26220703125, 12.846923828125, 13.431640625, 14.016357421875, 14.60107421875, 15.185791015625, 15.7705078125, 16.355224609375, 16.93994140625, 17.524658203125, 18.109375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 0.0, 3.0, 3.0, 7.0, 14.0, 15.0, 16.0, 27.0, 37.0, 69.0, 96.0, 172.0, 354.0, 1496.0, 999.0, 335.0, 144.0, 95.0, 61.0, 39.0, 23.0, 24.0, 19.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.90625, -9.5382080078125, -9.170166015625, -8.8021240234375, -8.43408203125, -8.0660400390625, -7.697998046875, -7.3299560546875, -6.9619140625, -6.5938720703125, -6.225830078125, -5.8577880859375, -5.48974609375, -5.1217041015625, -4.753662109375, -4.3856201171875, -4.017578125, -3.6495361328125, -3.281494140625, -2.9134521484375, -2.54541015625, -2.1773681640625, -1.809326171875, -1.4412841796875, -1.0732421875, -0.7052001953125, -0.337158203125, 0.0308837890625, 0.39892578125, 0.7669677734375, 1.135009765625, 1.5030517578125, 1.87109375, 2.2391357421875, 2.607177734375, 2.9752197265625, 3.34326171875, 3.7113037109375, 4.079345703125, 4.4473876953125, 4.8154296875, 5.1834716796875, 5.551513671875, 5.9195556640625, 6.28759765625, 6.6556396484375, 7.023681640625, 7.3917236328125, 7.759765625, 8.1278076171875, 8.495849609375, 8.8638916015625, 9.23193359375, 9.5999755859375, 9.968017578125, 10.3360595703125, 10.7041015625, 11.0721435546875, 11.440185546875, 11.8082275390625, 12.17626953125, 12.5443115234375, 12.912353515625, 13.2803955078125, 13.6484375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 11.0, 13.0, 19.0, 37.0, 32.0, 64.0, 66.0, 96.0, 68.0, 83.0, 102.0, 95.0, 89.0, 62.0, 44.0, 45.0, 31.0, 19.0, 6.0, 4.0, 3.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-77.00627899169922, -75.25033569335938, -73.49440002441406, -71.73845672607422, -69.98251342773438, -68.22657012939453, -66.47063446044922, -64.71469116210938, -62.95874786376953, -61.20280838012695, -59.44686508178711, -57.69092559814453, -55.93498229980469, -54.17904281616211, -52.423099517822266, -50.66716003417969, -48.911216735839844, -47.155277252197266, -45.39933395385742, -43.643394470214844, -41.887451171875, -40.13151168823242, -38.37556838989258, -36.61962890625, -34.86368942260742, -33.107749938964844, -31.351806640625, -29.59586524963379, -27.839923858642578, -26.083984375, -24.328041076660156, -22.572101593017578, -20.816158294677734, -19.060216903686523, -17.304275512695312, -15.548334121704102, -13.79239273071289, -12.036452293395996, -10.280510902404785, -8.524569511413574, -6.768628120422363, -5.012686729431152, -3.2567455768585205, -1.5008044242858887, 0.25513696670532227, 2.011077880859375, 3.767019271850586, 5.522960662841797, 7.278902053833008, 9.034843444824219, 10.79078483581543, 12.54672622680664, 14.302667617797852, 16.058609008789062, 17.81454849243164, 19.570491790771484, 21.326431274414062, 23.082372665405273, 24.838314056396484, 26.594255447387695, 28.350196838378906, 30.106136322021484, 31.862079620361328, 33.618019104003906, 35.37396240234375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 10.0, 8.0, 10.0, 11.0, 16.0, 17.0, 24.0, 25.0, 27.0, 35.0, 34.0, 34.0, 36.0, 25.0, 29.0, 35.0, 48.0, 43.0, 47.0, 27.0, 38.0, 43.0, 38.0, 34.0, 36.0, 31.0, 34.0, 32.0, 15.0, 22.0, 16.0, 15.0, 14.0, 14.0, 13.0, 9.0, 8.0, 3.0, 9.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.550039291381836, -27.657567977905273, -26.765094757080078, -25.872623443603516, -24.980152130126953, -24.087678909301758, -23.195207595825195, -22.302734375, -21.410263061523438, -20.517791748046875, -19.62531852722168, -18.732847213745117, -17.840373992919922, -16.94790267944336, -16.055431365966797, -15.162959098815918, -14.270486831665039, -13.37801456451416, -12.485542297363281, -11.593070983886719, -10.70059871673584, -9.808126449584961, -8.915655136108398, -8.02318286895752, -7.130710601806641, -6.238238334655762, -5.345766544342041, -4.45329475402832, -3.5608224868774414, -2.6683502197265625, -1.7758784294128418, -0.8834066390991211, 0.009063720703125, 0.9015357494354248, 1.7940077781677246, 2.6864798069000244, 3.578951835632324, 4.471424102783203, 5.363895893096924, 6.2563676834106445, 7.148839950561523, 8.041312217712402, 8.933784484863281, 9.826255798339844, 10.718728065490723, 11.611200332641602, 12.503671646118164, 13.396143913269043, 14.288616180419922, 15.1810884475708, 16.07356071472168, 16.966032028198242, 17.858505249023438, 18.7509765625, 19.643447875976562, 20.535919189453125, 21.42839241027832, 22.320863723754883, 23.213336944580078, 24.10580825805664, 24.998279571533203, 25.8907527923584, 26.78322410583496, 27.675697326660156, 28.56816864013672]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 12.0, 10.0, 7.0, 17.0, 29.0, 41.0, 63.0, 86.0, 165.0, 277.0, 462.0, 911.0, 1858.0, 3757.0, 8356.0, 18583.0, 43353.0, 112738.0, 361413.0, 325034.0, 100430.0, 39117.0, 16901.0, 7816.0, 3504.0, 1688.0, 846.0, 465.0, 238.0, 135.0, 84.0, 72.0, 30.0, 17.0, 11.0, 8.0, 7.0, 6.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-21.890625, -21.298095703125, -20.70556640625, -20.113037109375, -19.5205078125, -18.927978515625, -18.33544921875, -17.742919921875, -17.150390625, -16.557861328125, -15.96533203125, -15.372802734375, -14.7802734375, -14.187744140625, -13.59521484375, -13.002685546875, -12.41015625, -11.817626953125, -11.22509765625, -10.632568359375, -10.0400390625, -9.447509765625, -8.85498046875, -8.262451171875, -7.669921875, -7.077392578125, -6.48486328125, -5.892333984375, -5.2998046875, -4.707275390625, -4.11474609375, -3.522216796875, -2.9296875, -2.337158203125, -1.74462890625, -1.152099609375, -0.5595703125, 0.032958984375, 0.62548828125, 1.218017578125, 1.810546875, 2.403076171875, 2.99560546875, 3.588134765625, 4.1806640625, 4.773193359375, 5.36572265625, 5.958251953125, 6.55078125, 7.143310546875, 7.73583984375, 8.328369140625, 8.9208984375, 9.513427734375, 10.10595703125, 10.698486328125, 11.291015625, 11.883544921875, 12.47607421875, 13.068603515625, 13.6611328125, 14.253662109375, 14.84619140625, 15.438720703125, 16.03125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 7.0, 9.0, 8.0, 8.0, 15.0, 22.0, 19.0, 25.0, 27.0, 27.0, 30.0, 44.0, 42.0, 47.0, 34.0, 52.0, 43.0, 56.0, 44.0, 59.0, 47.0, 49.0, 34.0, 26.0, 35.0, 32.0, 26.0, 25.0, 24.0, 22.0, 11.0, 11.0, 4.0, 10.0, 10.0, 10.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-4.80078125, -4.6734619140625, -4.546142578125, -4.4188232421875, -4.29150390625, -4.1641845703125, -4.036865234375, -3.9095458984375, -3.7822265625, -3.6549072265625, -3.527587890625, -3.4002685546875, -3.27294921875, -3.1456298828125, -3.018310546875, -2.8909912109375, -2.763671875, -2.6363525390625, -2.509033203125, -2.3817138671875, -2.25439453125, -2.1270751953125, -1.999755859375, -1.8724365234375, -1.7451171875, -1.6177978515625, -1.490478515625, -1.3631591796875, -1.23583984375, -1.1085205078125, -0.981201171875, -0.8538818359375, -0.7265625, -0.5992431640625, -0.471923828125, -0.3446044921875, -0.21728515625, -0.0899658203125, 0.037353515625, 0.1646728515625, 0.2919921875, 0.4193115234375, 0.546630859375, 0.6739501953125, 0.80126953125, 0.9285888671875, 1.055908203125, 1.1832275390625, 1.310546875, 1.4378662109375, 1.565185546875, 1.6925048828125, 1.81982421875, 1.9471435546875, 2.074462890625, 2.2017822265625, 2.3291015625, 2.4564208984375, 2.583740234375, 2.7110595703125, 2.83837890625, 2.9656982421875, 3.093017578125, 3.2203369140625, 3.34765625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 13.0, 18.0, 12.0, 27.0, 38.0, 58.0, 82.0, 175.0, 230.0, 425.0, 798.0, 1539.0, 3027.0, 6741.0, 14731.0, 34909.0, 103319.0, 469351.0, 297018.0, 68603.0, 25707.0, 11330.0, 5167.0, 2429.0, 1236.0, 637.0, 344.0, 194.0, 128.0, 86.0, 47.0, 39.0, 29.0, 15.0, 10.0, 10.0, 8.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-19.421875, -18.811767578125, -18.20166015625, -17.591552734375, -16.9814453125, -16.371337890625, -15.76123046875, -15.151123046875, -14.541015625, -13.930908203125, -13.32080078125, -12.710693359375, -12.1005859375, -11.490478515625, -10.88037109375, -10.270263671875, -9.66015625, -9.050048828125, -8.43994140625, -7.829833984375, -7.2197265625, -6.609619140625, -5.99951171875, -5.389404296875, -4.779296875, -4.169189453125, -3.55908203125, -2.948974609375, -2.3388671875, -1.728759765625, -1.11865234375, -0.508544921875, 0.1015625, 0.711669921875, 1.32177734375, 1.931884765625, 2.5419921875, 3.152099609375, 3.76220703125, 4.372314453125, 4.982421875, 5.592529296875, 6.20263671875, 6.812744140625, 7.4228515625, 8.032958984375, 8.64306640625, 9.253173828125, 9.86328125, 10.473388671875, 11.08349609375, 11.693603515625, 12.3037109375, 12.913818359375, 13.52392578125, 14.134033203125, 14.744140625, 15.354248046875, 15.96435546875, 16.574462890625, 17.1845703125, 17.794677734375, 18.40478515625, 19.014892578125, 19.625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 4.0, 3.0, 14.0, 13.0, 18.0, 21.0, 25.0, 31.0, 39.0, 60.0, 58.0, 84.0, 76.0, 69.0, 63.0, 62.0, 74.0, 52.0, 54.0, 45.0, 31.0, 23.0, 16.0, 17.0, 11.0, 12.0, 4.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.625, -23.849853515625, -23.07470703125, -22.299560546875, -21.5244140625, -20.749267578125, -19.97412109375, -19.198974609375, -18.423828125, -17.648681640625, -16.87353515625, -16.098388671875, -15.3232421875, -14.548095703125, -13.77294921875, -12.997802734375, -12.22265625, -11.447509765625, -10.67236328125, -9.897216796875, -9.1220703125, -8.346923828125, -7.57177734375, -6.796630859375, -6.021484375, -5.246337890625, -4.47119140625, -3.696044921875, -2.9208984375, -2.145751953125, -1.37060546875, -0.595458984375, 0.1796875, 0.954833984375, 1.72998046875, 2.505126953125, 3.2802734375, 4.055419921875, 4.83056640625, 5.605712890625, 6.380859375, 7.156005859375, 7.93115234375, 8.706298828125, 9.4814453125, 10.256591796875, 11.03173828125, 11.806884765625, 12.58203125, 13.357177734375, 14.13232421875, 14.907470703125, 15.6826171875, 16.457763671875, 17.23291015625, 18.008056640625, 18.783203125, 19.558349609375, 20.33349609375, 21.108642578125, 21.8837890625, 22.658935546875, 23.43408203125, 24.209228515625, 24.984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 8.0, 12.0, 13.0, 24.0, 29.0, 68.0, 79.0, 136.0, 242.0, 449.0, 823.0, 1731.0, 3867.0, 8545.0, 19278.0, 46536.0, 178658.0, 584743.0, 132343.0, 39791.0, 16887.0, 7493.0, 3460.0, 1579.0, 760.0, 403.0, 239.0, 122.0, 79.0, 52.0, 27.0, 25.0, 14.0, 12.0, 9.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.96875, -9.6612548828125, -9.353759765625, -9.0462646484375, -8.73876953125, -8.4312744140625, -8.123779296875, -7.8162841796875, -7.5087890625, -7.2012939453125, -6.893798828125, -6.5863037109375, -6.27880859375, -5.9713134765625, -5.663818359375, -5.3563232421875, -5.048828125, -4.7413330078125, -4.433837890625, -4.1263427734375, -3.81884765625, -3.5113525390625, -3.203857421875, -2.8963623046875, -2.5888671875, -2.2813720703125, -1.973876953125, -1.6663818359375, -1.35888671875, -1.0513916015625, -0.743896484375, -0.4364013671875, -0.12890625, 0.1785888671875, 0.486083984375, 0.7935791015625, 1.10107421875, 1.4085693359375, 1.716064453125, 2.0235595703125, 2.3310546875, 2.6385498046875, 2.946044921875, 3.2535400390625, 3.56103515625, 3.8685302734375, 4.176025390625, 4.4835205078125, 4.791015625, 5.0985107421875, 5.406005859375, 5.7135009765625, 6.02099609375, 6.3284912109375, 6.635986328125, 6.9434814453125, 7.2509765625, 7.5584716796875, 7.865966796875, 8.1734619140625, 8.48095703125, 8.7884521484375, 9.095947265625, 9.4034423828125, 9.7109375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 16.0, 12.0, 9.0, 16.0, 20.0, 52.0, 101.0, 281.0, 273.0, 80.0, 34.0, 21.0, 15.0, 12.0, 11.0, 6.0, 6.0, 11.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006015777587890625, -0.0058481693267822266, -0.005680561065673828, -0.00551295280456543, -0.005345344543457031, -0.005177736282348633, -0.005010128021240234, -0.004842519760131836, -0.0046749114990234375, -0.004507303237915039, -0.004339694976806641, -0.004172086715698242, -0.004004478454589844, -0.0038368701934814453, -0.003669261932373047, -0.0035016536712646484, -0.00333404541015625, -0.0031664371490478516, -0.002998828887939453, -0.0028312206268310547, -0.0026636123657226562, -0.002496004104614258, -0.0023283958435058594, -0.002160787582397461, -0.0019931793212890625, -0.001825571060180664, -0.0016579627990722656, -0.0014903545379638672, -0.0013227462768554688, -0.0011551380157470703, -0.0009875297546386719, -0.0008199214935302734, -0.000652313232421875, -0.00048470497131347656, -0.0003170967102050781, -0.0001494884490966797, 1.811981201171875e-05, 0.0001857280731201172, 0.0003533363342285156, 0.0005209445953369141, 0.0006885528564453125, 0.0008561611175537109, 0.0010237693786621094, 0.0011913776397705078, 0.0013589859008789062, 0.0015265941619873047, 0.0016942024230957031, 0.0018618106842041016, 0.0020294189453125, 0.0021970272064208984, 0.002364635467529297, 0.0025322437286376953, 0.0026998519897460938, 0.002867460250854492, 0.0030350685119628906, 0.003202676773071289, 0.0033702850341796875, 0.003537893295288086, 0.0037055015563964844, 0.003873109817504883, 0.004040718078613281, 0.00420832633972168, 0.004375934600830078, 0.0045435428619384766, 0.004711151123046875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 6.0, 14.0, 16.0, 21.0, 29.0, 40.0, 60.0, 93.0, 136.0, 247.0, 401.0, 779.0, 1461.0, 2849.0, 6095.0, 12785.0, 30155.0, 89384.0, 555803.0, 258130.0, 51613.0, 20315.0, 9180.0, 4336.0, 2053.0, 1060.0, 608.0, 302.0, 200.0, 101.0, 74.0, 50.0, 36.0, 34.0, 23.0, 17.0, 12.0, 13.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.5859375, -9.2843017578125, -8.982666015625, -8.6810302734375, -8.37939453125, -8.0777587890625, -7.776123046875, -7.4744873046875, -7.1728515625, -6.8712158203125, -6.569580078125, -6.2679443359375, -5.96630859375, -5.6646728515625, -5.363037109375, -5.0614013671875, -4.759765625, -4.4581298828125, -4.156494140625, -3.8548583984375, -3.55322265625, -3.2515869140625, -2.949951171875, -2.6483154296875, -2.3466796875, -2.0450439453125, -1.743408203125, -1.4417724609375, -1.14013671875, -0.8385009765625, -0.536865234375, -0.2352294921875, 0.06640625, 0.3680419921875, 0.669677734375, 0.9713134765625, 1.27294921875, 1.5745849609375, 1.876220703125, 2.1778564453125, 2.4794921875, 2.7811279296875, 3.082763671875, 3.3843994140625, 3.68603515625, 3.9876708984375, 4.289306640625, 4.5909423828125, 4.892578125, 5.1942138671875, 5.495849609375, 5.7974853515625, 6.09912109375, 6.4007568359375, 6.702392578125, 7.0040283203125, 7.3056640625, 7.6072998046875, 7.908935546875, 8.2105712890625, 8.51220703125, 8.8138427734375, 9.115478515625, 9.4171142578125, 9.71875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 7.0, 6.0, 11.0, 18.0, 18.0, 19.0, 16.0, 37.0, 34.0, 68.0, 96.0, 128.0, 125.0, 114.0, 72.0, 51.0, 37.0, 16.0, 17.0, 12.0, 10.0, 8.0, 7.0, 4.0, 8.0, 7.0, 6.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7578125, -7.50146484375, -7.2451171875, -6.98876953125, -6.732421875, -6.47607421875, -6.2197265625, -5.96337890625, -5.70703125, -5.45068359375, -5.1943359375, -4.93798828125, -4.681640625, -4.42529296875, -4.1689453125, -3.91259765625, -3.65625, -3.39990234375, -3.1435546875, -2.88720703125, -2.630859375, -2.37451171875, -2.1181640625, -1.86181640625, -1.60546875, -1.34912109375, -1.0927734375, -0.83642578125, -0.580078125, -0.32373046875, -0.0673828125, 0.18896484375, 0.4453125, 0.70166015625, 0.9580078125, 1.21435546875, 1.470703125, 1.72705078125, 1.9833984375, 2.23974609375, 2.49609375, 2.75244140625, 3.0087890625, 3.26513671875, 3.521484375, 3.77783203125, 4.0341796875, 4.29052734375, 4.546875, 4.80322265625, 5.0595703125, 5.31591796875, 5.572265625, 5.82861328125, 6.0849609375, 6.34130859375, 6.59765625, 6.85400390625, 7.1103515625, 7.36669921875, 7.623046875, 7.87939453125, 8.1357421875, 8.39208984375, 8.6484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 14.0, 28.0, 36.0, 62.0, 83.0, 100.0, 127.0, 123.0, 114.0, 94.0, 63.0, 58.0, 40.0, 17.0, 11.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-222.4858856201172, -217.77609252929688, -213.06629943847656, -208.35650634765625, -203.64671325683594, -198.93692016601562, -194.22711181640625, -189.51731872558594, -184.80752563476562, -180.0977325439453, -175.387939453125, -170.6781463623047, -165.96835327148438, -161.258544921875, -156.54876708984375, -151.83895874023438, -147.12918090820312, -142.4193878173828, -137.7095947265625, -132.9998016357422, -128.29000854492188, -123.58020782470703, -118.87041473388672, -114.16061401367188, -109.45082092285156, -104.74102783203125, -100.03123474121094, -95.32144165039062, -90.61164093017578, -85.90184783935547, -81.19205474853516, -76.48225402832031, -71.7724609375, -67.06266784667969, -62.35287094116211, -57.6430778503418, -52.93328094482422, -48.223487854003906, -43.513694763183594, -38.803897857666016, -34.0941047668457, -29.384309768676758, -24.674514770507812, -19.9647216796875, -15.254926681518555, -10.54513168334961, -5.835338592529297, -1.1255416870117188, 3.5842514038085938, 8.294046401977539, 13.003840446472168, 17.713634490966797, 22.423429489135742, 27.133224487304688, 31.843017578125, 36.55281448364258, 41.26260757446289, 45.9724006652832, 50.68219757080078, 55.391990661621094, 60.101783752441406, 64.81158447265625, 69.52137756347656, 74.23117065429688, 78.94096374511719]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 13.0, 5.0, 14.0, 12.0, 18.0, 13.0, 15.0, 18.0, 37.0, 28.0, 30.0, 24.0, 27.0, 29.0, 33.0, 32.0, 53.0, 51.0, 46.0, 33.0, 54.0, 41.0, 39.0, 47.0, 38.0, 34.0, 23.0, 33.0, 31.0, 22.0, 20.0, 11.0, 18.0, 15.0, 11.0, 8.0, 4.0, 5.0, 5.0, 1.0, 4.0, 0.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-74.47787475585938, -72.0730972290039, -69.66831970214844, -67.26354217529297, -64.8587646484375, -62.45398712158203, -60.04920959472656, -57.644432067871094, -55.239654541015625, -52.834877014160156, -50.43009948730469, -48.02532196044922, -45.62054443359375, -43.21576690673828, -40.81098937988281, -38.406211853027344, -36.001434326171875, -33.596656799316406, -31.191879272460938, -28.78710174560547, -26.38232421875, -23.97754669189453, -21.572769165039062, -19.167991638183594, -16.763214111328125, -14.358436584472656, -11.953659057617188, -9.548881530761719, -7.14410400390625, -4.739326477050781, -2.3345489501953125, 0.07022857666015625, 2.4750137329101562, 4.879791259765625, 7.284568786621094, 9.689346313476562, 12.094123840332031, 14.4989013671875, 16.90367889404297, 19.308456420898438, 21.713233947753906, 24.118011474609375, 26.522789001464844, 28.927566528320312, 31.33234405517578, 33.73712158203125, 36.14189910888672, 38.54667663574219, 40.951454162597656, 43.356231689453125, 45.761009216308594, 48.16578674316406, 50.57056427001953, 52.975341796875, 55.38011932373047, 57.78489685058594, 60.189674377441406, 62.594451904296875, 64.99922943115234, 67.40400695800781, 69.80878448486328, 72.21356201171875, 74.61833953857422, 77.02311706542969, 79.42789459228516]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 6.0, 12.0, 10.0, 13.0, 27.0, 35.0, 53.0, 65.0, 116.0, 161.0, 284.0, 501.0, 869.0, 1795.0, 3793.0, 8460.0, 21523.0, 64528.0, 312642.0, 3450970.0, 239877.0, 54564.0, 18943.0, 7835.0, 3483.0, 1659.0, 866.0, 428.0, 277.0, 171.0, 111.0, 61.0, 47.0, 31.0, 20.0, 20.0, 13.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-33.96875, -33.0849609375, -32.201171875, -31.3173828125, -30.43359375, -29.5498046875, -28.666015625, -27.7822265625, -26.8984375, -26.0146484375, -25.130859375, -24.2470703125, -23.36328125, -22.4794921875, -21.595703125, -20.7119140625, -19.828125, -18.9443359375, -18.060546875, -17.1767578125, -16.29296875, -15.4091796875, -14.525390625, -13.6416015625, -12.7578125, -11.8740234375, -10.990234375, -10.1064453125, -9.22265625, -8.3388671875, -7.455078125, -6.5712890625, -5.6875, -4.8037109375, -3.919921875, -3.0361328125, -2.15234375, -1.2685546875, -0.384765625, 0.4990234375, 1.3828125, 2.2666015625, 3.150390625, 4.0341796875, 4.91796875, 5.8017578125, 6.685546875, 7.5693359375, 8.453125, 9.3369140625, 10.220703125, 11.1044921875, 11.98828125, 12.8720703125, 13.755859375, 14.6396484375, 15.5234375, 16.4072265625, 17.291015625, 18.1748046875, 19.05859375, 19.9423828125, 20.826171875, 21.7099609375, 22.59375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 4.0, 6.0, 8.0, 17.0, 18.0, 20.0, 25.0, 15.0, 22.0, 29.0, 37.0, 39.0, 38.0, 39.0, 48.0, 55.0, 42.0, 59.0, 43.0, 43.0, 33.0, 38.0, 38.0, 31.0, 32.0, 38.0, 23.0, 23.0, 21.0, 21.0, 20.0, 13.0, 14.0, 10.0, 12.0, 6.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.54296875, -4.4156494140625, -4.288330078125, -4.1610107421875, -4.03369140625, -3.9063720703125, -3.779052734375, -3.6517333984375, -3.5244140625, -3.3970947265625, -3.269775390625, -3.1424560546875, -3.01513671875, -2.8878173828125, -2.760498046875, -2.6331787109375, -2.505859375, -2.3785400390625, -2.251220703125, -2.1239013671875, -1.99658203125, -1.8692626953125, -1.741943359375, -1.6146240234375, -1.4873046875, -1.3599853515625, -1.232666015625, -1.1053466796875, -0.97802734375, -0.8507080078125, -0.723388671875, -0.5960693359375, -0.46875, -0.3414306640625, -0.214111328125, -0.0867919921875, 0.04052734375, 0.1678466796875, 0.295166015625, 0.4224853515625, 0.5498046875, 0.6771240234375, 0.804443359375, 0.9317626953125, 1.05908203125, 1.1864013671875, 1.313720703125, 1.4410400390625, 1.568359375, 1.6956787109375, 1.822998046875, 1.9503173828125, 2.07763671875, 2.2049560546875, 2.332275390625, 2.4595947265625, 2.5869140625, 2.7142333984375, 2.841552734375, 2.9688720703125, 3.09619140625, 3.2235107421875, 3.350830078125, 3.4781494140625, 3.60546875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 7.0, 9.0, 7.0, 19.0, 17.0, 30.0, 48.0, 61.0, 91.0, 150.0, 186.0, 295.0, 435.0, 643.0, 912.0, 1473.0, 2350.0, 4248.0, 8230.0, 16518.0, 38378.0, 106181.0, 506481.0, 3095106.0, 278025.0, 75885.0, 29253.0, 13139.0, 6468.0, 3534.0, 2096.0, 1327.0, 857.0, 556.0, 376.0, 284.0, 203.0, 128.0, 86.0, 68.0, 47.0, 24.0, 14.0, 17.0, 8.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.59375, -24.802490234375, -24.01123046875, -23.219970703125, -22.4287109375, -21.637451171875, -20.84619140625, -20.054931640625, -19.263671875, -18.472412109375, -17.68115234375, -16.889892578125, -16.0986328125, -15.307373046875, -14.51611328125, -13.724853515625, -12.93359375, -12.142333984375, -11.35107421875, -10.559814453125, -9.7685546875, -8.977294921875, -8.18603515625, -7.394775390625, -6.603515625, -5.812255859375, -5.02099609375, -4.229736328125, -3.4384765625, -2.647216796875, -1.85595703125, -1.064697265625, -0.2734375, 0.517822265625, 1.30908203125, 2.100341796875, 2.8916015625, 3.682861328125, 4.47412109375, 5.265380859375, 6.056640625, 6.847900390625, 7.63916015625, 8.430419921875, 9.2216796875, 10.012939453125, 10.80419921875, 11.595458984375, 12.38671875, 13.177978515625, 13.96923828125, 14.760498046875, 15.5517578125, 16.343017578125, 17.13427734375, 17.925537109375, 18.716796875, 19.508056640625, 20.29931640625, 21.090576171875, 21.8818359375, 22.673095703125, 23.46435546875, 24.255615234375, 25.046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 9.0, 9.0, 6.0, 7.0, 25.0, 28.0, 40.0, 31.0, 60.0, 99.0, 174.0, 359.0, 1431.0, 974.0, 303.0, 151.0, 90.0, 70.0, 57.0, 31.0, 24.0, 21.0, 18.0, 9.0, 5.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.7117919921875, -10.314208984375, -9.9166259765625, -9.51904296875, -9.1214599609375, -8.723876953125, -8.3262939453125, -7.9287109375, -7.5311279296875, -7.133544921875, -6.7359619140625, -6.33837890625, -5.9407958984375, -5.543212890625, -5.1456298828125, -4.748046875, -4.3504638671875, -3.952880859375, -3.5552978515625, -3.15771484375, -2.7601318359375, -2.362548828125, -1.9649658203125, -1.5673828125, -1.1697998046875, -0.772216796875, -0.3746337890625, 0.02294921875, 0.4205322265625, 0.818115234375, 1.2156982421875, 1.61328125, 2.0108642578125, 2.408447265625, 2.8060302734375, 3.20361328125, 3.6011962890625, 3.998779296875, 4.3963623046875, 4.7939453125, 5.1915283203125, 5.589111328125, 5.9866943359375, 6.38427734375, 6.7818603515625, 7.179443359375, 7.5770263671875, 7.974609375, 8.3721923828125, 8.769775390625, 9.1673583984375, 9.56494140625, 9.9625244140625, 10.360107421875, 10.7576904296875, 11.1552734375, 11.5528564453125, 11.950439453125, 12.3480224609375, 12.74560546875, 13.1431884765625, 13.540771484375, 13.9383544921875, 14.3359375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 7.0, 22.0, 18.0, 40.0, 57.0, 76.0, 107.0, 104.0, 122.0, 122.0, 100.0, 70.0, 58.0, 34.0, 23.0, 8.0, 6.0, 9.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-122.13401794433594, -119.43634033203125, -116.73866271972656, -114.04098510742188, -111.34329986572266, -108.64562225341797, -105.94794464111328, -103.2502670288086, -100.55258178710938, -97.85490417480469, -95.1572265625, -92.45954895019531, -89.7618637084961, -87.0641860961914, -84.36650848388672, -81.66883087158203, -78.97115325927734, -76.27347564697266, -73.57579803466797, -70.87811279296875, -68.18043518066406, -65.48275756835938, -62.78507995605469, -60.08740234375, -57.38972091674805, -54.69204330444336, -51.994361877441406, -49.29668426513672, -46.59900665283203, -43.90132522583008, -41.20364761352539, -38.50596618652344, -35.80829620361328, -33.110618591308594, -30.41293716430664, -27.715259552001953, -25.017580032348633, -22.319900512695312, -19.622222900390625, -16.924543380737305, -14.226863861083984, -11.529184341430664, -8.83150577545166, -6.133827209472656, -3.436147689819336, -0.7384681701660156, 1.9592094421386719, 4.656888961791992, 7.3545684814453125, 10.052248001098633, 12.749926567077637, 15.44760513305664, 18.14528465270996, 20.84296417236328, 23.54064178466797, 26.23832130432129, 28.93600082397461, 31.63368034362793, 34.33135986328125, 37.02903747558594, 39.726715087890625, 42.42439651489258, 45.122074127197266, 47.81975555419922, 50.517433166503906]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 6.0, 8.0, 7.0, 3.0, 22.0, 13.0, 15.0, 15.0, 27.0, 21.0, 25.0, 27.0, 31.0, 46.0, 48.0, 45.0, 48.0, 40.0, 55.0, 53.0, 53.0, 52.0, 46.0, 43.0, 37.0, 39.0, 22.0, 25.0, 23.0, 24.0, 19.0, 12.0, 11.0, 13.0, 3.0, 10.0, 1.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.869972229003906, -46.35736846923828, -44.844764709472656, -43.332157135009766, -41.81955337524414, -40.306949615478516, -38.794342041015625, -37.28173828125, -35.769134521484375, -34.25653076171875, -32.743927001953125, -31.231319427490234, -29.71871566772461, -28.206111907958984, -26.693506240844727, -25.18090057373047, -23.668296813964844, -22.15569305419922, -20.64308738708496, -19.130481719970703, -17.617877960205078, -16.105274200439453, -14.592668533325195, -13.080063819885254, -11.567459106445312, -10.054854393005371, -8.54224967956543, -7.029644966125488, -5.517040252685547, -4.0044355392456055, -2.491830825805664, -0.9792261123657227, 0.5333786010742188, 2.04598331451416, 3.5585880279541016, 5.071192741394043, 6.583797454833984, 8.096402168273926, 9.609006881713867, 11.121611595153809, 12.63421630859375, 14.146821022033691, 15.659425735473633, 17.17203140258789, 18.684635162353516, 20.19723892211914, 21.7098445892334, 23.222450256347656, 24.73505401611328, 26.247657775878906, 27.760263442993164, 29.272869110107422, 30.785472869873047, 32.29807662963867, 33.81068420410156, 35.32328796386719, 36.83589172363281, 38.34849548339844, 39.86109924316406, 41.37370681762695, 42.88631057739258, 44.3989143371582, 45.911521911621094, 47.42412567138672, 48.936729431152344]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 9.0, 20.0, 24.0, 26.0, 46.0, 53.0, 88.0, 158.0, 237.0, 424.0, 723.0, 1386.0, 2582.0, 4870.0, 9728.0, 19623.0, 38670.0, 75235.0, 150515.0, 281812.0, 230081.0, 114242.0, 57816.0, 29652.0, 14899.0, 7483.0, 3739.0, 1948.0, 1043.0, 524.0, 332.0, 186.0, 105.0, 84.0, 46.0, 38.0, 33.0, 24.0, 22.0, 12.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.171875, -17.63427734375, -17.0966796875, -16.55908203125, -16.021484375, -15.48388671875, -14.9462890625, -14.40869140625, -13.87109375, -13.33349609375, -12.7958984375, -12.25830078125, -11.720703125, -11.18310546875, -10.6455078125, -10.10791015625, -9.5703125, -9.03271484375, -8.4951171875, -7.95751953125, -7.419921875, -6.88232421875, -6.3447265625, -5.80712890625, -5.26953125, -4.73193359375, -4.1943359375, -3.65673828125, -3.119140625, -2.58154296875, -2.0439453125, -1.50634765625, -0.96875, -0.43115234375, 0.1064453125, 0.64404296875, 1.181640625, 1.71923828125, 2.2568359375, 2.79443359375, 3.33203125, 3.86962890625, 4.4072265625, 4.94482421875, 5.482421875, 6.02001953125, 6.5576171875, 7.09521484375, 7.6328125, 8.17041015625, 8.7080078125, 9.24560546875, 9.783203125, 10.32080078125, 10.8583984375, 11.39599609375, 11.93359375, 12.47119140625, 13.0087890625, 13.54638671875, 14.083984375, 14.62158203125, 15.1591796875, 15.69677734375, 16.234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 11.0, 7.0, 12.0, 15.0, 12.0, 15.0, 17.0, 13.0, 25.0, 18.0, 36.0, 24.0, 43.0, 27.0, 37.0, 32.0, 47.0, 43.0, 49.0, 46.0, 43.0, 43.0, 31.0, 46.0, 30.0, 39.0, 34.0, 30.0, 32.0, 25.0, 24.0, 22.0, 13.0, 13.0, 12.0, 6.0, 7.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.34765625, -4.20330810546875, -4.0589599609375, -3.91461181640625, -3.770263671875, -3.62591552734375, -3.4815673828125, -3.33721923828125, -3.19287109375, -3.04852294921875, -2.9041748046875, -2.75982666015625, -2.615478515625, -2.47113037109375, -2.3267822265625, -2.18243408203125, -2.0380859375, -1.89373779296875, -1.7493896484375, -1.60504150390625, -1.460693359375, -1.31634521484375, -1.1719970703125, -1.02764892578125, -0.88330078125, -0.73895263671875, -0.5946044921875, -0.45025634765625, -0.305908203125, -0.16156005859375, -0.0172119140625, 0.12713623046875, 0.271484375, 0.41583251953125, 0.5601806640625, 0.70452880859375, 0.848876953125, 0.99322509765625, 1.1375732421875, 1.28192138671875, 1.42626953125, 1.57061767578125, 1.7149658203125, 1.85931396484375, 2.003662109375, 2.14801025390625, 2.2923583984375, 2.43670654296875, 2.5810546875, 2.72540283203125, 2.8697509765625, 3.01409912109375, 3.158447265625, 3.30279541015625, 3.4471435546875, 3.59149169921875, 3.73583984375, 3.88018798828125, 4.0245361328125, 4.16888427734375, 4.313232421875, 4.45758056640625, 4.6019287109375, 4.74627685546875, 4.890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 4.0, 6.0, 11.0, 22.0, 10.0, 34.0, 43.0, 54.0, 92.0, 152.0, 223.0, 286.0, 536.0, 907.0, 1620.0, 3489.0, 8754.0, 23801.0, 66273.0, 194543.0, 469535.0, 179403.0, 61616.0, 21883.0, 7997.0, 3397.0, 1609.0, 838.0, 502.0, 288.0, 182.0, 140.0, 82.0, 49.0, 50.0, 33.0, 24.0, 14.0, 14.0, 10.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.3125, -23.539794921875, -22.76708984375, -21.994384765625, -21.2216796875, -20.448974609375, -19.67626953125, -18.903564453125, -18.130859375, -17.358154296875, -16.58544921875, -15.812744140625, -15.0400390625, -14.267333984375, -13.49462890625, -12.721923828125, -11.94921875, -11.176513671875, -10.40380859375, -9.631103515625, -8.8583984375, -8.085693359375, -7.31298828125, -6.540283203125, -5.767578125, -4.994873046875, -4.22216796875, -3.449462890625, -2.6767578125, -1.904052734375, -1.13134765625, -0.358642578125, 0.4140625, 1.186767578125, 1.95947265625, 2.732177734375, 3.5048828125, 4.277587890625, 5.05029296875, 5.822998046875, 6.595703125, 7.368408203125, 8.14111328125, 8.913818359375, 9.6865234375, 10.459228515625, 11.23193359375, 12.004638671875, 12.77734375, 13.550048828125, 14.32275390625, 15.095458984375, 15.8681640625, 16.640869140625, 17.41357421875, 18.186279296875, 18.958984375, 19.731689453125, 20.50439453125, 21.277099609375, 22.0498046875, 22.822509765625, 23.59521484375, 24.367919921875, 25.140625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 3.0, 7.0, 12.0, 3.0, 11.0, 12.0, 15.0, 11.0, 27.0, 22.0, 22.0, 30.0, 29.0, 48.0, 29.0, 44.0, 52.0, 48.0, 60.0, 56.0, 48.0, 43.0, 36.0, 44.0, 40.0, 48.0, 28.0, 28.0, 21.0, 24.0, 23.0, 19.0, 18.0, 6.0, 8.0, 2.0, 3.0, 6.0, 7.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-28.703125, -27.864990234375, -27.02685546875, -26.188720703125, -25.3505859375, -24.512451171875, -23.67431640625, -22.836181640625, -21.998046875, -21.159912109375, -20.32177734375, -19.483642578125, -18.6455078125, -17.807373046875, -16.96923828125, -16.131103515625, -15.29296875, -14.454833984375, -13.61669921875, -12.778564453125, -11.9404296875, -11.102294921875, -10.26416015625, -9.426025390625, -8.587890625, -7.749755859375, -6.91162109375, -6.073486328125, -5.2353515625, -4.397216796875, -3.55908203125, -2.720947265625, -1.8828125, -1.044677734375, -0.20654296875, 0.631591796875, 1.4697265625, 2.307861328125, 3.14599609375, 3.984130859375, 4.822265625, 5.660400390625, 6.49853515625, 7.336669921875, 8.1748046875, 9.012939453125, 9.85107421875, 10.689208984375, 11.52734375, 12.365478515625, 13.20361328125, 14.041748046875, 14.8798828125, 15.718017578125, 16.55615234375, 17.394287109375, 18.232421875, 19.070556640625, 19.90869140625, 20.746826171875, 21.5849609375, 22.423095703125, 23.26123046875, 24.099365234375, 24.9375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 13.0, 21.0, 30.0, 44.0, 88.0, 142.0, 320.0, 956.0, 3931.0, 40307.0, 921206.0, 74220.0, 5376.0, 1143.0, 374.0, 158.0, 96.0, 47.0, 22.0, 28.0, 8.0, 8.0, 5.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.28125, -47.35498046875, -45.4287109375, -43.50244140625, -41.576171875, -39.64990234375, -37.7236328125, -35.79736328125, -33.87109375, -31.94482421875, -30.0185546875, -28.09228515625, -26.166015625, -24.23974609375, -22.3134765625, -20.38720703125, -18.4609375, -16.53466796875, -14.6083984375, -12.68212890625, -10.755859375, -8.82958984375, -6.9033203125, -4.97705078125, -3.05078125, -1.12451171875, 0.8017578125, 2.72802734375, 4.654296875, 6.58056640625, 8.5068359375, 10.43310546875, 12.359375, 14.28564453125, 16.2119140625, 18.13818359375, 20.064453125, 21.99072265625, 23.9169921875, 25.84326171875, 27.76953125, 29.69580078125, 31.6220703125, 33.54833984375, 35.474609375, 37.40087890625, 39.3271484375, 41.25341796875, 43.1796875, 45.10595703125, 47.0322265625, 48.95849609375, 50.884765625, 52.81103515625, 54.7373046875, 56.66357421875, 58.58984375, 60.51611328125, 62.4423828125, 64.36865234375, 66.294921875, 68.22119140625, 70.1474609375, 72.07373046875, 74.0]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 2.0, 6.0, 10.0, 13.0, 19.0, 31.0, 44.0, 46.0, 61.0, 97.0, 197.0, 183.0, 88.0, 50.0, 44.0, 35.0, 20.0, 17.0, 11.0, 10.0, 5.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003997802734375, -0.0038068294525146484, -0.003615856170654297, -0.0034248828887939453, -0.0032339096069335938, -0.003042936325073242, -0.0028519630432128906, -0.002660989761352539, -0.0024700164794921875, -0.002279043197631836, -0.0020880699157714844, -0.0018970966339111328, -0.0017061233520507812, -0.0015151500701904297, -0.0013241767883300781, -0.0011332035064697266, -0.000942230224609375, -0.0007512569427490234, -0.0005602836608886719, -0.0003693103790283203, -0.00017833709716796875, 1.2636184692382812e-05, 0.00020360946655273438, 0.00039458274841308594, 0.0005855560302734375, 0.0007765293121337891, 0.0009675025939941406, 0.0011584758758544922, 0.0013494491577148438, 0.0015404224395751953, 0.0017313957214355469, 0.0019223690032958984, 0.00211334228515625, 0.0023043155670166016, 0.002495288848876953, 0.0026862621307373047, 0.0028772354125976562, 0.003068208694458008, 0.0032591819763183594, 0.003450155258178711, 0.0036411285400390625, 0.003832101821899414, 0.004023075103759766, 0.004214048385620117, 0.004405021667480469, 0.00459599494934082, 0.004786968231201172, 0.0049779415130615234, 0.005168914794921875, 0.0053598880767822266, 0.005550861358642578, 0.00574183464050293, 0.005932807922363281, 0.006123781204223633, 0.006314754486083984, 0.006505727767944336, 0.0066967010498046875, 0.006887674331665039, 0.007078647613525391, 0.007269620895385742, 0.007460594177246094, 0.007651567459106445, 0.007842540740966797, 0.008033514022827148, 0.0082244873046875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 15.0, 18.0, 24.0, 30.0, 62.0, 129.0, 206.0, 396.0, 778.0, 1827.0, 4757.0, 17368.0, 185646.0, 772879.0, 50182.0, 8794.0, 2962.0, 1222.0, 578.0, 321.0, 136.0, 68.0, 66.0, 30.0, 27.0, 6.0, 7.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-56.40625, -55.00537109375, -53.6044921875, -52.20361328125, -50.802734375, -49.40185546875, -48.0009765625, -46.60009765625, -45.19921875, -43.79833984375, -42.3974609375, -40.99658203125, -39.595703125, -38.19482421875, -36.7939453125, -35.39306640625, -33.9921875, -32.59130859375, -31.1904296875, -29.78955078125, -28.388671875, -26.98779296875, -25.5869140625, -24.18603515625, -22.78515625, -21.38427734375, -19.9833984375, -18.58251953125, -17.181640625, -15.78076171875, -14.3798828125, -12.97900390625, -11.578125, -10.17724609375, -8.7763671875, -7.37548828125, -5.974609375, -4.57373046875, -3.1728515625, -1.77197265625, -0.37109375, 1.02978515625, 2.4306640625, 3.83154296875, 5.232421875, 6.63330078125, 8.0341796875, 9.43505859375, 10.8359375, 12.23681640625, 13.6376953125, 15.03857421875, 16.439453125, 17.84033203125, 19.2412109375, 20.64208984375, 22.04296875, 23.44384765625, 24.8447265625, 26.24560546875, 27.646484375, 29.04736328125, 30.4482421875, 31.84912109375, 33.25]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 2.0, 7.0, 6.0, 11.0, 16.0, 16.0, 23.0, 48.0, 85.0, 116.0, 211.0, 166.0, 88.0, 60.0, 46.0, 20.0, 21.0, 18.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.015625, -27.971923828125, -26.92822265625, -25.884521484375, -24.8408203125, -23.797119140625, -22.75341796875, -21.709716796875, -20.666015625, -19.622314453125, -18.57861328125, -17.534912109375, -16.4912109375, -15.447509765625, -14.40380859375, -13.360107421875, -12.31640625, -11.272705078125, -10.22900390625, -9.185302734375, -8.1416015625, -7.097900390625, -6.05419921875, -5.010498046875, -3.966796875, -2.923095703125, -1.87939453125, -0.835693359375, 0.2080078125, 1.251708984375, 2.29541015625, 3.339111328125, 4.3828125, 5.426513671875, 6.47021484375, 7.513916015625, 8.5576171875, 9.601318359375, 10.64501953125, 11.688720703125, 12.732421875, 13.776123046875, 14.81982421875, 15.863525390625, 16.9072265625, 17.950927734375, 18.99462890625, 20.038330078125, 21.08203125, 22.125732421875, 23.16943359375, 24.213134765625, 25.2568359375, 26.300537109375, 27.34423828125, 28.387939453125, 29.431640625, 30.475341796875, 31.51904296875, 32.562744140625, 33.6064453125, 34.650146484375, 35.69384765625, 36.737548828125, 37.78125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 10.0, 27.0, 43.0, 84.0, 131.0, 171.0, 168.0, 148.0, 95.0, 49.0, 32.0, 19.0, 7.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-459.84710693359375, -447.7350769042969, -435.6230163574219, -423.510986328125, -411.39892578125, -399.2868957519531, -387.17486572265625, -375.06280517578125, -362.9507751464844, -350.8387451171875, -338.7266845703125, -326.6146545410156, -314.50262451171875, -302.39056396484375, -290.2785339355469, -278.16650390625, -266.054443359375, -253.94239807128906, -241.83035278320312, -229.71832275390625, -217.6062774658203, -205.49423217773438, -193.3822021484375, -181.27015686035156, -169.15811157226562, -157.0460662841797, -144.93402099609375, -132.82199096679688, -120.70994567871094, -108.597900390625, -96.4858627319336, -84.37382507324219, -72.26177978515625, -60.14973831176758, -48.037696838378906, -35.925655364990234, -23.813613891601562, -11.70157241821289, 0.41046905517578125, 12.522506713867188, 24.634552001953125, 36.7465934753418, 48.85863494873047, 60.97067642211914, 73.08271789550781, 85.19476318359375, 97.30680084228516, 109.41883850097656, 121.5308837890625, 133.64292907714844, 145.75497436523438, 157.86700439453125, 169.9790496826172, 182.09109497070312, 194.203125, 206.31517028808594, 218.42721557617188, 230.5392608642578, 242.65130615234375, 254.76333618164062, 266.8753662109375, 278.9874267578125, 291.0994567871094, 303.21148681640625, 315.32354736328125]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 6.0, 12.0, 5.0, 15.0, 10.0, 6.0, 15.0, 16.0, 17.0, 19.0, 21.0, 27.0, 20.0, 32.0, 37.0, 43.0, 44.0, 45.0, 40.0, 37.0, 32.0, 38.0, 41.0, 44.0, 32.0, 45.0, 32.0, 28.0, 33.0, 36.0, 21.0, 20.0, 26.0, 17.0, 16.0, 3.0, 11.0, 16.0, 7.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-131.43313598632812, -127.40620422363281, -123.3792724609375, -119.35234069824219, -115.32540130615234, -111.29846954345703, -107.27153778076172, -103.2446060180664, -99.21766662597656, -95.19073486328125, -91.16380310058594, -87.13687133789062, -83.10993194580078, -79.08300018310547, -75.05606842041016, -71.02913665771484, -67.00220489501953, -62.97527313232422, -58.94833755493164, -54.92140579223633, -50.89447021484375, -46.86753845214844, -42.840606689453125, -38.81367492675781, -34.786739349365234, -30.75980567932129, -26.732872009277344, -22.70594024658203, -18.679006576538086, -14.65207290649414, -10.625141143798828, -6.598207473754883, -2.5712814331054688, 1.4556517601013184, 5.4825849533081055, 9.509517669677734, 13.53645133972168, 17.563385009765625, 21.590316772460938, 25.617250442504883, 29.644184112548828, 33.67111587524414, 37.69805145263672, 41.72498321533203, 45.751914978027344, 49.77885055541992, 53.805782318115234, 57.83271789550781, 61.859649658203125, 65.88658142089844, 69.91351318359375, 73.94044494628906, 77.9673843383789, 81.99431610107422, 86.02124786376953, 90.04817962646484, 94.07511901855469, 98.10205078125, 102.12898254394531, 106.15591430664062, 110.18285369873047, 114.20978546142578, 118.2367172241211, 122.2636489868164, 126.29058074951172]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 10.0, 12.0, 8.0, 24.0, 24.0, 36.0, 71.0, 114.0, 166.0, 230.0, 397.0, 615.0, 966.0, 1622.0, 2922.0, 5249.0, 10225.0, 21007.0, 46718.0, 122851.0, 512927.0, 2974841.0, 327674.0, 93263.0, 37099.0, 16846.0, 8238.0, 4315.0, 2360.0, 1331.0, 771.0, 450.0, 304.0, 193.0, 128.0, 89.0, 54.0, 36.0, 31.0, 16.0, 16.0, 7.0, 11.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.265625, -21.555908203125, -20.84619140625, -20.136474609375, -19.4267578125, -18.717041015625, -18.00732421875, -17.297607421875, -16.587890625, -15.878173828125, -15.16845703125, -14.458740234375, -13.7490234375, -13.039306640625, -12.32958984375, -11.619873046875, -10.91015625, -10.200439453125, -9.49072265625, -8.781005859375, -8.0712890625, -7.361572265625, -6.65185546875, -5.942138671875, -5.232421875, -4.522705078125, -3.81298828125, -3.103271484375, -2.3935546875, -1.683837890625, -0.97412109375, -0.264404296875, 0.4453125, 1.155029296875, 1.86474609375, 2.574462890625, 3.2841796875, 3.993896484375, 4.70361328125, 5.413330078125, 6.123046875, 6.832763671875, 7.54248046875, 8.252197265625, 8.9619140625, 9.671630859375, 10.38134765625, 11.091064453125, 11.80078125, 12.510498046875, 13.22021484375, 13.929931640625, 14.6396484375, 15.349365234375, 16.05908203125, 16.768798828125, 17.478515625, 18.188232421875, 18.89794921875, 19.607666015625, 20.3173828125, 21.027099609375, 21.73681640625, 22.446533203125, 23.15625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 8.0, 11.0, 5.0, 14.0, 14.0, 24.0, 28.0, 41.0, 39.0, 45.0, 41.0, 47.0, 51.0, 46.0, 53.0, 54.0, 39.0, 41.0, 64.0, 37.0, 43.0, 40.0, 36.0, 25.0, 30.0, 24.0, 21.0, 15.0, 17.0, 10.0, 7.0, 8.0, 6.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.609375, -5.4144287109375, -5.219482421875, -5.0245361328125, -4.82958984375, -4.6346435546875, -4.439697265625, -4.2447509765625, -4.0498046875, -3.8548583984375, -3.659912109375, -3.4649658203125, -3.27001953125, -3.0750732421875, -2.880126953125, -2.6851806640625, -2.490234375, -2.2952880859375, -2.100341796875, -1.9053955078125, -1.71044921875, -1.5155029296875, -1.320556640625, -1.1256103515625, -0.9306640625, -0.7357177734375, -0.540771484375, -0.3458251953125, -0.15087890625, 0.0440673828125, 0.239013671875, 0.4339599609375, 0.62890625, 0.8238525390625, 1.018798828125, 1.2137451171875, 1.40869140625, 1.6036376953125, 1.798583984375, 1.9935302734375, 2.1884765625, 2.3834228515625, 2.578369140625, 2.7733154296875, 2.96826171875, 3.1632080078125, 3.358154296875, 3.5531005859375, 3.748046875, 3.9429931640625, 4.137939453125, 4.3328857421875, 4.52783203125, 4.7227783203125, 4.917724609375, 5.1126708984375, 5.3076171875, 5.5025634765625, 5.697509765625, 5.8924560546875, 6.08740234375, 6.2823486328125, 6.477294921875, 6.6722412109375, 6.8671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 10.0, 5.0, 11.0, 17.0, 25.0, 48.0, 52.0, 80.0, 117.0, 178.0, 337.0, 516.0, 770.0, 1593.0, 3323.0, 7136.0, 17962.0, 51312.0, 193563.0, 2406181.0, 1282276.0, 156667.0, 43734.0, 15509.0, 6435.0, 2959.0, 1444.0, 757.0, 477.0, 281.0, 176.0, 122.0, 70.0, 42.0, 32.0, 24.0, 18.0, 10.0, 11.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-43.40625, -42.291259765625, -41.17626953125, -40.061279296875, -38.9462890625, -37.831298828125, -36.71630859375, -35.601318359375, -34.486328125, -33.371337890625, -32.25634765625, -31.141357421875, -30.0263671875, -28.911376953125, -27.79638671875, -26.681396484375, -25.56640625, -24.451416015625, -23.33642578125, -22.221435546875, -21.1064453125, -19.991455078125, -18.87646484375, -17.761474609375, -16.646484375, -15.531494140625, -14.41650390625, -13.301513671875, -12.1865234375, -11.071533203125, -9.95654296875, -8.841552734375, -7.7265625, -6.611572265625, -5.49658203125, -4.381591796875, -3.2666015625, -2.151611328125, -1.03662109375, 0.078369140625, 1.193359375, 2.308349609375, 3.42333984375, 4.538330078125, 5.6533203125, 6.768310546875, 7.88330078125, 8.998291015625, 10.11328125, 11.228271484375, 12.34326171875, 13.458251953125, 14.5732421875, 15.688232421875, 16.80322265625, 17.918212890625, 19.033203125, 20.148193359375, 21.26318359375, 22.378173828125, 23.4931640625, 24.608154296875, 25.72314453125, 26.838134765625, 27.953125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 11.0, 12.0, 19.0, 25.0, 33.0, 42.0, 82.0, 103.0, 168.0, 298.0, 718.0, 1365.0, 477.0, 230.0, 158.0, 84.0, 65.0, 48.0, 39.0, 12.0, 20.0, 14.0, 12.0, 9.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.421875, -13.802978515625, -13.18408203125, -12.565185546875, -11.9462890625, -11.327392578125, -10.70849609375, -10.089599609375, -9.470703125, -8.851806640625, -8.23291015625, -7.614013671875, -6.9951171875, -6.376220703125, -5.75732421875, -5.138427734375, -4.51953125, -3.900634765625, -3.28173828125, -2.662841796875, -2.0439453125, -1.425048828125, -0.80615234375, -0.187255859375, 0.431640625, 1.050537109375, 1.66943359375, 2.288330078125, 2.9072265625, 3.526123046875, 4.14501953125, 4.763916015625, 5.3828125, 6.001708984375, 6.62060546875, 7.239501953125, 7.8583984375, 8.477294921875, 9.09619140625, 9.715087890625, 10.333984375, 10.952880859375, 11.57177734375, 12.190673828125, 12.8095703125, 13.428466796875, 14.04736328125, 14.666259765625, 15.28515625, 15.904052734375, 16.52294921875, 17.141845703125, 17.7607421875, 18.379638671875, 18.99853515625, 19.617431640625, 20.236328125, 20.855224609375, 21.47412109375, 22.093017578125, 22.7119140625, 23.330810546875, 23.94970703125, 24.568603515625, 25.1875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 12.0, 38.0, 66.0, 156.0, 218.0, 217.0, 162.0, 73.0, 36.0, 16.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.23800659179688, -110.52970886230469, -101.82141876220703, -93.11312866210938, -84.40483093261719, -75.696533203125, -66.98824310302734, -58.27994918823242, -49.5716552734375, -40.86336135864258, -32.155067443847656, -23.446773529052734, -14.738479614257812, -6.030185699462891, 2.6781082153320312, 11.386402130126953, 20.094696044921875, 28.802989959716797, 37.51128387451172, 46.21957778930664, 54.92787170410156, 63.636165618896484, 72.3444595336914, 81.05274963378906, 89.76104736328125, 98.46934509277344, 107.1776351928711, 115.88592529296875, 124.59422302246094, 133.30252075195312, 142.01080322265625, 150.71910095214844, 159.4273681640625, 168.1356658935547, 176.84396362304688, 185.55224609375, 194.2605438232422, 202.96884155273438, 211.6771240234375, 220.3854217529297, 229.09371948242188, 237.80201721191406, 246.51031494140625, 255.21859741210938, 263.9268798828125, 272.63519287109375, 281.3434753417969, 290.0517883300781, 298.76007080078125, 307.4683532714844, 316.1766662597656, 324.88494873046875, 333.59326171875, 342.3015441894531, 351.00982666015625, 359.7181396484375, 368.4264221191406, 377.13470458984375, 385.843017578125, 394.5513000488281, 403.25958251953125, 411.9678955078125, 420.6761779785156, 429.3844909667969, 438.0927734375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 6.0, 10.0, 13.0, 9.0, 11.0, 26.0, 22.0, 26.0, 25.0, 40.0, 35.0, 31.0, 39.0, 47.0, 51.0, 52.0, 46.0, 45.0, 38.0, 41.0, 34.0, 41.0, 48.0, 32.0, 36.0, 28.0, 29.0, 27.0, 25.0, 16.0, 19.0, 13.0, 7.0, 8.0, 2.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-89.80278778076172, -87.22354888916016, -84.6443099975586, -82.06507110595703, -79.48583984375, -76.90660095214844, -74.32736206054688, -71.74812316894531, -69.16888427734375, -66.58964538574219, -64.01040649414062, -61.43117141723633, -58.851932525634766, -56.2726936340332, -53.693458557128906, -51.114219665527344, -48.53498077392578, -45.95574188232422, -43.376502990722656, -40.79726791381836, -38.2180290222168, -35.638790130615234, -33.05955505371094, -30.480316162109375, -27.901077270507812, -25.32183837890625, -22.74260139465332, -20.16336441040039, -17.584125518798828, -15.004887580871582, -12.425649642944336, -9.846412658691406, -7.2671661376953125, -4.687928199768066, -2.1086902618408203, 0.4705476760864258, 3.049785614013672, 5.629023551940918, 8.208261489868164, 10.787498474121094, 13.366737365722656, 15.945975303649902, 18.52521324157715, 21.104450225830078, 23.68368911743164, 26.262928009033203, 28.842164993286133, 31.421401977539062, 34.000640869140625, 36.57987976074219, 39.15911865234375, 41.73835372924805, 44.31759262084961, 46.89683151245117, 49.47606658935547, 52.05530548095703, 54.634544372558594, 57.213783264160156, 59.79302215576172, 62.372257232666016, 64.95149230957031, 67.53073120117188, 70.10997009277344, 72.689208984375, 75.26844787597656]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 4.0, 5.0, 4.0, 5.0, 5.0, 6.0, 12.0, 20.0, 32.0, 30.0, 62.0, 91.0, 121.0, 183.0, 253.0, 401.0, 651.0, 1005.0, 1633.0, 2838.0, 4549.0, 7708.0, 13768.0, 23998.0, 42344.0, 74248.0, 123280.0, 179085.0, 195176.0, 150900.0, 95199.0, 55479.0, 31641.0, 18349.0, 10297.0, 5958.0, 3493.0, 2139.0, 1311.0, 784.0, 476.0, 320.0, 211.0, 154.0, 93.0, 80.0, 38.0, 41.0, 22.0, 18.0, 13.0, 8.0, 11.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.640625, -14.1719970703125, -13.703369140625, -13.2347412109375, -12.76611328125, -12.2974853515625, -11.828857421875, -11.3602294921875, -10.8916015625, -10.4229736328125, -9.954345703125, -9.4857177734375, -9.01708984375, -8.5484619140625, -8.079833984375, -7.6112060546875, -7.142578125, -6.6739501953125, -6.205322265625, -5.7366943359375, -5.26806640625, -4.7994384765625, -4.330810546875, -3.8621826171875, -3.3935546875, -2.9249267578125, -2.456298828125, -1.9876708984375, -1.51904296875, -1.0504150390625, -0.581787109375, -0.1131591796875, 0.35546875, 0.8240966796875, 1.292724609375, 1.7613525390625, 2.22998046875, 2.6986083984375, 3.167236328125, 3.6358642578125, 4.1044921875, 4.5731201171875, 5.041748046875, 5.5103759765625, 5.97900390625, 6.4476318359375, 6.916259765625, 7.3848876953125, 7.853515625, 8.3221435546875, 8.790771484375, 9.2593994140625, 9.72802734375, 10.1966552734375, 10.665283203125, 11.1339111328125, 11.6025390625, 12.0711669921875, 12.539794921875, 13.0084228515625, 13.47705078125, 13.9456787109375, 14.414306640625, 14.8829345703125, 15.3515625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 9.0, 9.0, 13.0, 10.0, 10.0, 25.0, 18.0, 21.0, 34.0, 29.0, 38.0, 40.0, 44.0, 38.0, 49.0, 41.0, 56.0, 53.0, 49.0, 56.0, 47.0, 43.0, 35.0, 29.0, 35.0, 19.0, 27.0, 14.0, 15.0, 20.0, 14.0, 7.0, 17.0, 4.0, 4.0, 7.0, 3.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.35546875, -7.138916015625, -6.92236328125, -6.705810546875, -6.4892578125, -6.272705078125, -6.05615234375, -5.839599609375, -5.623046875, -5.406494140625, -5.18994140625, -4.973388671875, -4.7568359375, -4.540283203125, -4.32373046875, -4.107177734375, -3.890625, -3.674072265625, -3.45751953125, -3.240966796875, -3.0244140625, -2.807861328125, -2.59130859375, -2.374755859375, -2.158203125, -1.941650390625, -1.72509765625, -1.508544921875, -1.2919921875, -1.075439453125, -0.85888671875, -0.642333984375, -0.42578125, -0.209228515625, 0.00732421875, 0.223876953125, 0.4404296875, 0.656982421875, 0.87353515625, 1.090087890625, 1.306640625, 1.523193359375, 1.73974609375, 1.956298828125, 2.1728515625, 2.389404296875, 2.60595703125, 2.822509765625, 3.0390625, 3.255615234375, 3.47216796875, 3.688720703125, 3.9052734375, 4.121826171875, 4.33837890625, 4.554931640625, 4.771484375, 4.988037109375, 5.20458984375, 5.421142578125, 5.6376953125, 5.854248046875, 6.07080078125, 6.287353515625, 6.50390625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 5.0, 10.0, 6.0, 14.0, 14.0, 18.0, 27.0, 55.0, 70.0, 94.0, 158.0, 260.0, 454.0, 868.0, 2179.0, 6189.0, 23650.0, 108780.0, 420036.0, 367884.0, 88981.0, 19578.0, 5364.0, 1926.0, 832.0, 415.0, 236.0, 153.0, 93.0, 53.0, 40.0, 28.0, 23.0, 12.0, 8.0, 14.0, 3.0, 9.0, 3.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.0625, -35.6865234375, -34.310546875, -32.9345703125, -31.55859375, -30.1826171875, -28.806640625, -27.4306640625, -26.0546875, -24.6787109375, -23.302734375, -21.9267578125, -20.55078125, -19.1748046875, -17.798828125, -16.4228515625, -15.046875, -13.6708984375, -12.294921875, -10.9189453125, -9.54296875, -8.1669921875, -6.791015625, -5.4150390625, -4.0390625, -2.6630859375, -1.287109375, 0.0888671875, 1.46484375, 2.8408203125, 4.216796875, 5.5927734375, 6.96875, 8.3447265625, 9.720703125, 11.0966796875, 12.47265625, 13.8486328125, 15.224609375, 16.6005859375, 17.9765625, 19.3525390625, 20.728515625, 22.1044921875, 23.48046875, 24.8564453125, 26.232421875, 27.6083984375, 28.984375, 30.3603515625, 31.736328125, 33.1123046875, 34.48828125, 35.8642578125, 37.240234375, 38.6162109375, 39.9921875, 41.3681640625, 42.744140625, 44.1201171875, 45.49609375, 46.8720703125, 48.248046875, 49.6240234375, 51.0]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 4.0, 7.0, 11.0, 7.0, 12.0, 13.0, 15.0, 24.0, 26.0, 20.0, 31.0, 27.0, 42.0, 39.0, 36.0, 47.0, 33.0, 54.0, 56.0, 44.0, 51.0, 40.0, 50.0, 51.0, 44.0, 28.0, 29.0, 26.0, 22.0, 17.0, 9.0, 16.0, 12.0, 11.0, 5.0, 11.0, 7.0, 8.0, 10.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.8125, -39.46435546875, -38.1162109375, -36.76806640625, -35.419921875, -34.07177734375, -32.7236328125, -31.37548828125, -30.02734375, -28.67919921875, -27.3310546875, -25.98291015625, -24.634765625, -23.28662109375, -21.9384765625, -20.59033203125, -19.2421875, -17.89404296875, -16.5458984375, -15.19775390625, -13.849609375, -12.50146484375, -11.1533203125, -9.80517578125, -8.45703125, -7.10888671875, -5.7607421875, -4.41259765625, -3.064453125, -1.71630859375, -0.3681640625, 0.97998046875, 2.328125, 3.67626953125, 5.0244140625, 6.37255859375, 7.720703125, 9.06884765625, 10.4169921875, 11.76513671875, 13.11328125, 14.46142578125, 15.8095703125, 17.15771484375, 18.505859375, 19.85400390625, 21.2021484375, 22.55029296875, 23.8984375, 25.24658203125, 26.5947265625, 27.94287109375, 29.291015625, 30.63916015625, 31.9873046875, 33.33544921875, 34.68359375, 36.03173828125, 37.3798828125, 38.72802734375, 40.076171875, 41.42431640625, 42.7724609375, 44.12060546875, 45.46875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 11.0, 6.0, 10.0, 9.0, 14.0, 15.0, 17.0, 33.0, 43.0, 38.0, 74.0, 99.0, 257.0, 483.0, 1120.0, 3443.0, 14784.0, 122010.0, 678991.0, 198182.0, 21793.0, 4493.0, 1397.0, 558.0, 247.0, 123.0, 79.0, 47.0, 34.0, 33.0, 20.0, 19.0, 18.0, 10.0, 3.0, 10.0, 8.0, 7.0, 8.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-37.28125, -36.234130859375, -35.18701171875, -34.139892578125, -33.0927734375, -32.045654296875, -30.99853515625, -29.951416015625, -28.904296875, -27.857177734375, -26.81005859375, -25.762939453125, -24.7158203125, -23.668701171875, -22.62158203125, -21.574462890625, -20.52734375, -19.480224609375, -18.43310546875, -17.385986328125, -16.3388671875, -15.291748046875, -14.24462890625, -13.197509765625, -12.150390625, -11.103271484375, -10.05615234375, -9.009033203125, -7.9619140625, -6.914794921875, -5.86767578125, -4.820556640625, -3.7734375, -2.726318359375, -1.67919921875, -0.632080078125, 0.4150390625, 1.462158203125, 2.50927734375, 3.556396484375, 4.603515625, 5.650634765625, 6.69775390625, 7.744873046875, 8.7919921875, 9.839111328125, 10.88623046875, 11.933349609375, 12.98046875, 14.027587890625, 15.07470703125, 16.121826171875, 17.1689453125, 18.216064453125, 19.26318359375, 20.310302734375, 21.357421875, 22.404541015625, 23.45166015625, 24.498779296875, 25.5458984375, 26.593017578125, 27.64013671875, 28.687255859375, 29.734375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 7.0, 11.0, 13.0, 18.0, 25.0, 44.0, 47.0, 77.0, 102.0, 136.0, 110.0, 126.0, 96.0, 62.0, 38.0, 33.0, 16.0, 23.0, 8.0, 3.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0048675537109375, -0.004666566848754883, -0.004465579986572266, -0.0042645931243896484, -0.004063606262207031, -0.003862619400024414, -0.003661632537841797, -0.0034606456756591797, -0.0032596588134765625, -0.0030586719512939453, -0.002857685089111328, -0.002656698226928711, -0.0024557113647460938, -0.0022547245025634766, -0.0020537376403808594, -0.0018527507781982422, -0.001651763916015625, -0.0014507770538330078, -0.0012497901916503906, -0.0010488033294677734, -0.0008478164672851562, -0.0006468296051025391, -0.0004458427429199219, -0.0002448558807373047, -4.38690185546875e-05, 0.0001571178436279297, 0.0003581047058105469, 0.0005590915679931641, 0.0007600784301757812, 0.0009610652923583984, 0.0011620521545410156, 0.0013630390167236328, 0.00156402587890625, 0.0017650127410888672, 0.0019659996032714844, 0.0021669864654541016, 0.0023679733276367188, 0.002568960189819336, 0.002769947052001953, 0.0029709339141845703, 0.0031719207763671875, 0.0033729076385498047, 0.003573894500732422, 0.003774881362915039, 0.003975868225097656, 0.0041768550872802734, 0.004377841949462891, 0.004578828811645508, 0.004779815673828125, 0.004980802536010742, 0.005181789398193359, 0.0053827762603759766, 0.005583763122558594, 0.005784749984741211, 0.005985736846923828, 0.006186723709106445, 0.0063877105712890625, 0.00658869743347168, 0.006789684295654297, 0.006990671157836914, 0.007191658020019531, 0.0073926448822021484, 0.007593631744384766, 0.007794618606567383, 0.00799560546875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 14.0, 31.0, 28.0, 51.0, 83.0, 166.0, 326.0, 812.0, 2104.0, 7714.0, 46149.0, 425555.0, 496463.0, 56377.0, 8781.0, 2242.0, 855.0, 358.0, 184.0, 107.0, 54.0, 43.0, 24.0, 13.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.6875, -36.670166015625, -35.65283203125, -34.635498046875, -33.6181640625, -32.600830078125, -31.58349609375, -30.566162109375, -29.548828125, -28.531494140625, -27.51416015625, -26.496826171875, -25.4794921875, -24.462158203125, -23.44482421875, -22.427490234375, -21.41015625, -20.392822265625, -19.37548828125, -18.358154296875, -17.3408203125, -16.323486328125, -15.30615234375, -14.288818359375, -13.271484375, -12.254150390625, -11.23681640625, -10.219482421875, -9.2021484375, -8.184814453125, -7.16748046875, -6.150146484375, -5.1328125, -4.115478515625, -3.09814453125, -2.080810546875, -1.0634765625, -0.046142578125, 0.97119140625, 1.988525390625, 3.005859375, 4.023193359375, 5.04052734375, 6.057861328125, 7.0751953125, 8.092529296875, 9.10986328125, 10.127197265625, 11.14453125, 12.161865234375, 13.17919921875, 14.196533203125, 15.2138671875, 16.231201171875, 17.24853515625, 18.265869140625, 19.283203125, 20.300537109375, 21.31787109375, 22.335205078125, 23.3525390625, 24.369873046875, 25.38720703125, 26.404541015625, 27.421875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 6.0, 6.0, 12.0, 20.0, 36.0, 40.0, 51.0, 71.0, 96.0, 129.0, 129.0, 99.0, 85.0, 79.0, 31.0, 34.0, 24.0, 17.0, 12.0, 8.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.71875, -33.808837890625, -32.89892578125, -31.989013671875, -31.0791015625, -30.169189453125, -29.25927734375, -28.349365234375, -27.439453125, -26.529541015625, -25.61962890625, -24.709716796875, -23.7998046875, -22.889892578125, -21.97998046875, -21.070068359375, -20.16015625, -19.250244140625, -18.34033203125, -17.430419921875, -16.5205078125, -15.610595703125, -14.70068359375, -13.790771484375, -12.880859375, -11.970947265625, -11.06103515625, -10.151123046875, -9.2412109375, -8.331298828125, -7.42138671875, -6.511474609375, -5.6015625, -4.691650390625, -3.78173828125, -2.871826171875, -1.9619140625, -1.052001953125, -0.14208984375, 0.767822265625, 1.677734375, 2.587646484375, 3.49755859375, 4.407470703125, 5.3173828125, 6.227294921875, 7.13720703125, 8.047119140625, 8.95703125, 9.866943359375, 10.77685546875, 11.686767578125, 12.5966796875, 13.506591796875, 14.41650390625, 15.326416015625, 16.236328125, 17.146240234375, 18.05615234375, 18.966064453125, 19.8759765625, 20.785888671875, 21.69580078125, 22.605712890625, 23.515625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [3.0, 8.0, 19.0, 60.0, 163.0, 284.0, 243.0, 152.0, 46.0, 26.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.5849609375, -113.4738540649414, -90.36274719238281, -67.25163269042969, -44.140525817871094, -21.0294189453125, 2.081695556640625, 25.192794799804688, 48.30390930175781, 71.4150161743164, 94.526123046875, 117.63723754882812, 140.74835205078125, 163.8594512939453, 186.97056579589844, 210.0816650390625, 233.19277954101562, 256.30389404296875, 279.4150085449219, 302.526123046875, 325.63720703125, 348.7483215332031, 371.85943603515625, 394.97052001953125, 418.0816650390625, 441.1927795410156, 464.30389404296875, 487.41497802734375, 510.5260925292969, 533.63720703125, 556.748291015625, 579.8594360351562, 602.9705200195312, 626.0816040039062, 649.1927490234375, 672.3038330078125, 695.4149780273438, 718.5260620117188, 741.63720703125, 764.748291015625, 787.859375, 810.970458984375, 834.0816040039062, 857.1926879882812, 880.3038330078125, 903.4149169921875, 926.5260009765625, 949.6371459960938, 972.748291015625, 995.859375, 1018.9705200195312, 1042.0816650390625, 1065.1927490234375, 1088.3038330078125, 1111.4149169921875, 1134.5260009765625, 1157.6370849609375, 1180.7481689453125, 1203.8592529296875, 1226.970458984375, 1250.08154296875, 1273.192626953125, 1296.3037109375, 1319.414794921875, 1342.5260009765625]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 8.0, 4.0, 6.0, 9.0, 6.0, 14.0, 13.0, 14.0, 18.0, 18.0, 40.0, 34.0, 37.0, 33.0, 52.0, 39.0, 59.0, 45.0, 51.0, 39.0, 44.0, 32.0, 53.0, 33.0, 47.0, 40.0, 38.0, 37.0, 21.0, 19.0, 20.0, 15.0, 12.0, 10.0, 15.0, 7.0, 8.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.56011962890625, -215.1356658935547, -207.71121215820312, -200.28675842285156, -192.8623046875, -185.43783569335938, -178.01339721679688, -170.58892822265625, -163.1644744873047, -155.74002075195312, -148.31556701660156, -140.89111328125, -133.46665954589844, -126.04219818115234, -118.61774444580078, -111.19328308105469, -103.76883697509766, -96.3443832397461, -88.91992950439453, -81.49546813964844, -74.07101440429688, -66.64656066894531, -59.22210693359375, -51.79764938354492, -44.37319564819336, -36.9487419128418, -29.52428436279297, -22.099830627441406, -14.675374984741211, -7.250919342041016, 0.17353439331054688, 7.597991943359375, 15.022445678710938, 22.446901321411133, 29.871356964111328, 37.29581069946289, 44.72026824951172, 52.14472198486328, 59.569175720214844, 66.99363708496094, 74.4180908203125, 81.84254455566406, 89.26699829101562, 96.69145202636719, 104.11591339111328, 111.54036712646484, 118.9648208618164, 126.3892822265625, 133.813720703125, 141.23817443847656, 148.66262817382812, 156.0870819091797, 163.51153564453125, 170.93600463867188, 178.36044311523438, 185.784912109375, 193.20936584472656, 200.63381958007812, 208.0582733154297, 215.48272705078125, 222.9071807861328, 230.33163452148438, 237.756103515625, 245.18055725097656, 252.60501098632812]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 4.0, 6.0, 12.0, 12.0, 8.0, 14.0, 19.0, 34.0, 33.0, 65.0, 88.0, 127.0, 217.0, 349.0, 714.0, 1310.0, 2532.0, 5962.0, 17358.0, 105010.0, 3996259.0, 44262.0, 11269.0, 4393.0, 1946.0, 952.0, 527.0, 277.0, 188.0, 85.0, 72.0, 58.0, 38.0, 20.0, 7.0, 13.0, 11.0, 8.0, 6.0, 4.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-53.3125, -51.7587890625, -50.205078125, -48.6513671875, -47.09765625, -45.5439453125, -43.990234375, -42.4365234375, -40.8828125, -39.3291015625, -37.775390625, -36.2216796875, -34.66796875, -33.1142578125, -31.560546875, -30.0068359375, -28.453125, -26.8994140625, -25.345703125, -23.7919921875, -22.23828125, -20.6845703125, -19.130859375, -17.5771484375, -16.0234375, -14.4697265625, -12.916015625, -11.3623046875, -9.80859375, -8.2548828125, -6.701171875, -5.1474609375, -3.59375, -2.0400390625, -0.486328125, 1.0673828125, 2.62109375, 4.1748046875, 5.728515625, 7.2822265625, 8.8359375, 10.3896484375, 11.943359375, 13.4970703125, 15.05078125, 16.6044921875, 18.158203125, 19.7119140625, 21.265625, 22.8193359375, 24.373046875, 25.9267578125, 27.48046875, 29.0341796875, 30.587890625, 32.1416015625, 33.6953125, 35.2490234375, 36.802734375, 38.3564453125, 39.91015625, 41.4638671875, 43.017578125, 44.5712890625, 46.125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 12.0, 10.0, 14.0, 12.0, 19.0, 20.0, 30.0, 35.0, 40.0, 45.0, 53.0, 45.0, 43.0, 54.0, 48.0, 70.0, 53.0, 62.0, 48.0, 50.0, 38.0, 33.0, 35.0, 28.0, 29.0, 21.0, 11.0, 9.0, 6.0, 9.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.5546875, -11.232177734375, -10.90966796875, -10.587158203125, -10.2646484375, -9.942138671875, -9.61962890625, -9.297119140625, -8.974609375, -8.652099609375, -8.32958984375, -8.007080078125, -7.6845703125, -7.362060546875, -7.03955078125, -6.717041015625, -6.39453125, -6.072021484375, -5.74951171875, -5.427001953125, -5.1044921875, -4.781982421875, -4.45947265625, -4.136962890625, -3.814453125, -3.491943359375, -3.16943359375, -2.846923828125, -2.5244140625, -2.201904296875, -1.87939453125, -1.556884765625, -1.234375, -0.911865234375, -0.58935546875, -0.266845703125, 0.0556640625, 0.378173828125, 0.70068359375, 1.023193359375, 1.345703125, 1.668212890625, 1.99072265625, 2.313232421875, 2.6357421875, 2.958251953125, 3.28076171875, 3.603271484375, 3.92578125, 4.248291015625, 4.57080078125, 4.893310546875, 5.2158203125, 5.538330078125, 5.86083984375, 6.183349609375, 6.505859375, 6.828369140625, 7.15087890625, 7.473388671875, 7.7958984375, 8.118408203125, 8.44091796875, 8.763427734375, 9.0859375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 4.0, 10.0, 9.0, 15.0, 26.0, 40.0, 45.0, 83.0, 93.0, 154.0, 202.0, 336.0, 487.0, 710.0, 1192.0, 2017.0, 3941.0, 9032.0, 31728.0, 3570056.0, 529627.0, 27318.0, 8241.0, 3641.0, 1993.0, 1126.0, 721.0, 456.0, 293.0, 199.0, 135.0, 99.0, 84.0, 55.0, 37.0, 25.0, 17.0, 12.0, 8.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-65.5625, -63.7392578125, -61.916015625, -60.0927734375, -58.26953125, -56.4462890625, -54.623046875, -52.7998046875, -50.9765625, -49.1533203125, -47.330078125, -45.5068359375, -43.68359375, -41.8603515625, -40.037109375, -38.2138671875, -36.390625, -34.5673828125, -32.744140625, -30.9208984375, -29.09765625, -27.2744140625, -25.451171875, -23.6279296875, -21.8046875, -19.9814453125, -18.158203125, -16.3349609375, -14.51171875, -12.6884765625, -10.865234375, -9.0419921875, -7.21875, -5.3955078125, -3.572265625, -1.7490234375, 0.07421875, 1.8974609375, 3.720703125, 5.5439453125, 7.3671875, 9.1904296875, 11.013671875, 12.8369140625, 14.66015625, 16.4833984375, 18.306640625, 20.1298828125, 21.953125, 23.7763671875, 25.599609375, 27.4228515625, 29.24609375, 31.0693359375, 32.892578125, 34.7158203125, 36.5390625, 38.3623046875, 40.185546875, 42.0087890625, 43.83203125, 45.6552734375, 47.478515625, 49.3017578125, 51.125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 11.0, 8.0, 11.0, 19.0, 48.0, 58.0, 187.0, 3240.0, 303.0, 76.0, 46.0, 16.0, 7.0, 7.0, 9.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9609375, -10.5921630859375, -10.223388671875, -9.8546142578125, -9.48583984375, -9.1170654296875, -8.748291015625, -8.3795166015625, -8.0107421875, -7.6419677734375, -7.273193359375, -6.9044189453125, -6.53564453125, -6.1668701171875, -5.798095703125, -5.4293212890625, -5.060546875, -4.6917724609375, -4.322998046875, -3.9542236328125, -3.58544921875, -3.2166748046875, -2.847900390625, -2.4791259765625, -2.1103515625, -1.7415771484375, -1.372802734375, -1.0040283203125, -0.63525390625, -0.2664794921875, 0.102294921875, 0.4710693359375, 0.83984375, 1.2086181640625, 1.577392578125, 1.9461669921875, 2.31494140625, 2.6837158203125, 3.052490234375, 3.4212646484375, 3.7900390625, 4.1588134765625, 4.527587890625, 4.8963623046875, 5.26513671875, 5.6339111328125, 6.002685546875, 6.3714599609375, 6.740234375, 7.1090087890625, 7.477783203125, 7.8465576171875, 8.21533203125, 8.5841064453125, 8.952880859375, 9.3216552734375, 9.6904296875, 10.0592041015625, 10.427978515625, 10.7967529296875, 11.16552734375, 11.5343017578125, 11.903076171875, 12.2718505859375, 12.640625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 7.0, 12.0, 26.0, 30.0, 51.0, 87.0, 88.0, 117.0, 140.0, 139.0, 99.0, 75.0, 44.0, 37.0, 19.0, 9.0, 4.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.23152160644531, -55.60279083251953, -53.974056243896484, -52.3453254699707, -50.716590881347656, -49.087860107421875, -47.459129333496094, -45.83039855957031, -44.201663970947266, -42.572933197021484, -40.94419860839844, -39.315467834472656, -37.686737060546875, -36.05800247192383, -34.42927169799805, -32.800537109375, -31.17180633544922, -29.543073654174805, -27.91434097290039, -26.28561019897461, -24.656877517700195, -23.02814483642578, -21.3994140625, -19.770681381225586, -18.141948699951172, -16.513216018676758, -14.88448429107666, -13.255752563476562, -11.627019882202148, -9.998287200927734, -8.369555473327637, -6.740823745727539, -5.112087249755859, -3.4833550453186035, -1.8546228408813477, -0.2258906364440918, 1.402841567993164, 3.031574249267578, 4.660305976867676, 6.289037704467773, 7.9177703857421875, 9.546503067016602, 11.1752347946167, 12.803966522216797, 14.432699203491211, 16.061431884765625, 17.690162658691406, 19.31889533996582, 20.947628021240234, 22.57636070251465, 24.205093383789062, 25.833824157714844, 27.462556838989258, 29.091289520263672, 30.720020294189453, 32.3487548828125, 33.97748565673828, 35.60621643066406, 37.23495101928711, 38.86368179321289, 40.49241638183594, 42.12114715576172, 43.7498779296875, 45.37860870361328, 47.00734329223633]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 10.0, 11.0, 9.0, 9.0, 13.0, 20.0, 9.0, 24.0, 22.0, 29.0, 28.0, 39.0, 35.0, 39.0, 37.0, 40.0, 38.0, 38.0, 40.0, 38.0, 44.0, 40.0, 37.0, 31.0, 25.0, 34.0, 37.0, 30.0, 30.0, 25.0, 20.0, 17.0, 19.0, 14.0, 15.0, 8.0, 10.0, 8.0, 5.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.760135650634766, -17.093189239501953, -16.426244735717773, -15.759298324584961, -15.092351913452148, -14.425406455993652, -13.758460998535156, -13.091514587402344, -12.424568176269531, -11.757622718811035, -11.090676307678223, -10.423730850219727, -9.756784439086914, -9.089838981628418, -8.422893524169922, -7.755947113037109, -7.089001655578613, -6.422055721282959, -5.755109786987305, -5.088164329528809, -4.421217918395996, -3.754272222518921, -3.0873265266418457, -2.4203805923461914, -1.753434658050537, -1.0864887237548828, -0.41954290866851807, 0.24740290641784668, 0.914348840713501, 1.5812947750091553, 2.2482404708862305, 2.9151864051818848, 3.582132339477539, 4.249078273773193, 4.916024208068848, 5.582969665527344, 6.249916076660156, 6.916861534118652, 7.583807468414307, 8.250753402709961, 8.917699813842773, 9.58464527130127, 10.251591682434082, 10.918537139892578, 11.58548355102539, 12.252429008483887, 12.919374465942383, 13.586320877075195, 14.253266334533691, 14.920211791992188, 15.587158203125, 16.254104614257812, 16.921049118041992, 17.587995529174805, 18.254941940307617, 18.921886444091797, 19.58883285522461, 20.255779266357422, 20.9227237701416, 21.589670181274414, 22.256616592407227, 22.92356300354004, 23.59050750732422, 24.25745391845703, 24.924400329589844]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 3.0, 7.0, 6.0, 6.0, 11.0, 15.0, 24.0, 37.0, 55.0, 96.0, 142.0, 294.0, 434.0, 733.0, 1357.0, 2429.0, 4463.0, 8506.0, 16945.0, 33613.0, 65998.0, 126819.0, 215370.0, 238573.0, 159333.0, 84604.0, 43082.0, 21886.0, 11042.0, 5780.0, 2983.0, 1646.0, 928.0, 524.0, 311.0, 185.0, 106.0, 64.0, 47.0, 27.0, 27.0, 13.0, 5.0, 11.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.1875, -20.549072265625, -19.91064453125, -19.272216796875, -18.6337890625, -17.995361328125, -17.35693359375, -16.718505859375, -16.080078125, -15.441650390625, -14.80322265625, -14.164794921875, -13.5263671875, -12.887939453125, -12.24951171875, -11.611083984375, -10.97265625, -10.334228515625, -9.69580078125, -9.057373046875, -8.4189453125, -7.780517578125, -7.14208984375, -6.503662109375, -5.865234375, -5.226806640625, -4.58837890625, -3.949951171875, -3.3115234375, -2.673095703125, -2.03466796875, -1.396240234375, -0.7578125, -0.119384765625, 0.51904296875, 1.157470703125, 1.7958984375, 2.434326171875, 3.07275390625, 3.711181640625, 4.349609375, 4.988037109375, 5.62646484375, 6.264892578125, 6.9033203125, 7.541748046875, 8.18017578125, 8.818603515625, 9.45703125, 10.095458984375, 10.73388671875, 11.372314453125, 12.0107421875, 12.649169921875, 13.28759765625, 13.926025390625, 14.564453125, 15.202880859375, 15.84130859375, 16.479736328125, 17.1181640625, 17.756591796875, 18.39501953125, 19.033447265625, 19.671875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 5.0, 7.0, 11.0, 10.0, 20.0, 17.0, 15.0, 26.0, 23.0, 42.0, 40.0, 35.0, 33.0, 47.0, 55.0, 60.0, 66.0, 75.0, 55.0, 53.0, 43.0, 39.0, 35.0, 23.0, 32.0, 30.0, 22.0, 17.0, 18.0, 8.0, 14.0, 7.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.9765625, -10.6494140625, -10.322265625, -9.9951171875, -9.66796875, -9.3408203125, -9.013671875, -8.6865234375, -8.359375, -8.0322265625, -7.705078125, -7.3779296875, -7.05078125, -6.7236328125, -6.396484375, -6.0693359375, -5.7421875, -5.4150390625, -5.087890625, -4.7607421875, -4.43359375, -4.1064453125, -3.779296875, -3.4521484375, -3.125, -2.7978515625, -2.470703125, -2.1435546875, -1.81640625, -1.4892578125, -1.162109375, -0.8349609375, -0.5078125, -0.1806640625, 0.146484375, 0.4736328125, 0.80078125, 1.1279296875, 1.455078125, 1.7822265625, 2.109375, 2.4365234375, 2.763671875, 3.0908203125, 3.41796875, 3.7451171875, 4.072265625, 4.3994140625, 4.7265625, 5.0537109375, 5.380859375, 5.7080078125, 6.03515625, 6.3623046875, 6.689453125, 7.0166015625, 7.34375, 7.6708984375, 7.998046875, 8.3251953125, 8.65234375, 8.9794921875, 9.306640625, 9.6337890625, 9.9609375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 3.0, 8.0, 13.0, 12.0, 24.0, 17.0, 30.0, 41.0, 78.0, 94.0, 161.0, 243.0, 431.0, 986.0, 2761.0, 9771.0, 48528.0, 292871.0, 551306.0, 113073.0, 20141.0, 4776.0, 1630.0, 654.0, 312.0, 179.0, 123.0, 80.0, 47.0, 40.0, 38.0, 16.0, 16.0, 12.0, 7.0, 6.0, 6.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.15625, -49.46435546875, -47.7724609375, -46.08056640625, -44.388671875, -42.69677734375, -41.0048828125, -39.31298828125, -37.62109375, -35.92919921875, -34.2373046875, -32.54541015625, -30.853515625, -29.16162109375, -27.4697265625, -25.77783203125, -24.0859375, -22.39404296875, -20.7021484375, -19.01025390625, -17.318359375, -15.62646484375, -13.9345703125, -12.24267578125, -10.55078125, -8.85888671875, -7.1669921875, -5.47509765625, -3.783203125, -2.09130859375, -0.3994140625, 1.29248046875, 2.984375, 4.67626953125, 6.3681640625, 8.06005859375, 9.751953125, 11.44384765625, 13.1357421875, 14.82763671875, 16.51953125, 18.21142578125, 19.9033203125, 21.59521484375, 23.287109375, 24.97900390625, 26.6708984375, 28.36279296875, 30.0546875, 31.74658203125, 33.4384765625, 35.13037109375, 36.822265625, 38.51416015625, 40.2060546875, 41.89794921875, 43.58984375, 45.28173828125, 46.9736328125, 48.66552734375, 50.357421875, 52.04931640625, 53.7412109375, 55.43310546875, 57.125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 6.0, 10.0, 8.0, 8.0, 11.0, 10.0, 14.0, 25.0, 23.0, 23.0, 32.0, 23.0, 55.0, 50.0, 51.0, 55.0, 56.0, 48.0, 66.0, 64.0, 48.0, 56.0, 38.0, 38.0, 33.0, 27.0, 27.0, 21.0, 18.0, 13.0, 11.0, 7.0, 7.0, 4.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-71.0, -69.0048828125, -67.009765625, -65.0146484375, -63.01953125, -61.0244140625, -59.029296875, -57.0341796875, -55.0390625, -53.0439453125, -51.048828125, -49.0537109375, -47.05859375, -45.0634765625, -43.068359375, -41.0732421875, -39.078125, -37.0830078125, -35.087890625, -33.0927734375, -31.09765625, -29.1025390625, -27.107421875, -25.1123046875, -23.1171875, -21.1220703125, -19.126953125, -17.1318359375, -15.13671875, -13.1416015625, -11.146484375, -9.1513671875, -7.15625, -5.1611328125, -3.166015625, -1.1708984375, 0.82421875, 2.8193359375, 4.814453125, 6.8095703125, 8.8046875, 10.7998046875, 12.794921875, 14.7900390625, 16.78515625, 18.7802734375, 20.775390625, 22.7705078125, 24.765625, 26.7607421875, 28.755859375, 30.7509765625, 32.74609375, 34.7412109375, 36.736328125, 38.7314453125, 40.7265625, 42.7216796875, 44.716796875, 46.7119140625, 48.70703125, 50.7021484375, 52.697265625, 54.6923828125, 56.6875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 7.0, 6.0, 9.0, 19.0, 33.0, 52.0, 71.0, 122.0, 190.0, 307.0, 633.0, 1244.0, 2714.0, 6338.0, 18297.0, 64703.0, 253734.0, 468371.0, 167032.0, 42876.0, 12731.0, 4713.0, 2070.0, 936.0, 577.0, 281.0, 179.0, 107.0, 62.0, 34.0, 24.0, 14.0, 16.0, 12.0, 6.0, 6.0, 2.0, 4.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.8125, -17.2938232421875, -16.775146484375, -16.2564697265625, -15.73779296875, -15.2191162109375, -14.700439453125, -14.1817626953125, -13.6630859375, -13.1444091796875, -12.625732421875, -12.1070556640625, -11.58837890625, -11.0697021484375, -10.551025390625, -10.0323486328125, -9.513671875, -8.9949951171875, -8.476318359375, -7.9576416015625, -7.43896484375, -6.9202880859375, -6.401611328125, -5.8829345703125, -5.3642578125, -4.8455810546875, -4.326904296875, -3.8082275390625, -3.28955078125, -2.7708740234375, -2.252197265625, -1.7335205078125, -1.21484375, -0.6961669921875, -0.177490234375, 0.3411865234375, 0.85986328125, 1.3785400390625, 1.897216796875, 2.4158935546875, 2.9345703125, 3.4532470703125, 3.971923828125, 4.4906005859375, 5.00927734375, 5.5279541015625, 6.046630859375, 6.5653076171875, 7.083984375, 7.6026611328125, 8.121337890625, 8.6400146484375, 9.15869140625, 9.6773681640625, 10.196044921875, 10.7147216796875, 11.2333984375, 11.7520751953125, 12.270751953125, 12.7894287109375, 13.30810546875, 13.8267822265625, 14.345458984375, 14.8641357421875, 15.3828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 2.0, 9.0, 4.0, 8.0, 7.0, 13.0, 17.0, 35.0, 33.0, 37.0, 43.0, 51.0, 73.0, 63.0, 72.0, 85.0, 69.0, 71.0, 61.0, 45.0, 52.0, 27.0, 24.0, 18.0, 20.0, 15.0, 11.0, 7.0, 8.0, 2.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034122467041015625, -0.003303736448287964, -0.0031952261924743652, -0.0030867159366607666, -0.002978205680847168, -0.0028696954250335693, -0.0027611851692199707, -0.002652674913406372, -0.0025441646575927734, -0.002435654401779175, -0.002327144145965576, -0.0022186338901519775, -0.002110123634338379, -0.0020016133785247803, -0.0018931031227111816, -0.001784592866897583, -0.0016760826110839844, -0.0015675723552703857, -0.0014590620994567871, -0.0013505518436431885, -0.0012420415878295898, -0.0011335313320159912, -0.0010250210762023926, -0.0009165108203887939, -0.0008080005645751953, -0.0006994903087615967, -0.000590980052947998, -0.0004824697971343994, -0.0003739595413208008, -0.00026544928550720215, -0.00015693902969360352, -4.842877388000488e-05, 6.008148193359375e-05, 0.00016859173774719238, 0.000277101993560791, 0.00038561224937438965, 0.0004941225051879883, 0.0006026327610015869, 0.0007111430168151855, 0.0008196532726287842, 0.0009281635284423828, 0.0010366737842559814, 0.00114518404006958, 0.0012536942958831787, 0.0013622045516967773, 0.001470714807510376, 0.0015792250633239746, 0.0016877353191375732, 0.0017962455749511719, 0.0019047558307647705, 0.002013266086578369, 0.0021217763423919678, 0.0022302865982055664, 0.002338796854019165, 0.0024473071098327637, 0.0025558173656463623, 0.002664327621459961, 0.0027728378772735596, 0.002881348133087158, 0.002989858388900757, 0.0030983686447143555, 0.003206878900527954, 0.0033153891563415527, 0.0034238994121551514, 0.00353240966796875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 3.0, 18.0, 6.0, 16.0, 21.0, 33.0, 72.0, 82.0, 172.0, 242.0, 418.0, 807.0, 1747.0, 3995.0, 11487.0, 44385.0, 199211.0, 504531.0, 213379.0, 47318.0, 12608.0, 4216.0, 1803.0, 837.0, 465.0, 259.0, 136.0, 104.0, 44.0, 35.0, 30.0, 20.0, 14.0, 8.0, 4.0, 6.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.421875, -17.85546875, -17.2890625, -16.72265625, -16.15625, -15.58984375, -15.0234375, -14.45703125, -13.890625, -13.32421875, -12.7578125, -12.19140625, -11.625, -11.05859375, -10.4921875, -9.92578125, -9.359375, -8.79296875, -8.2265625, -7.66015625, -7.09375, -6.52734375, -5.9609375, -5.39453125, -4.828125, -4.26171875, -3.6953125, -3.12890625, -2.5625, -1.99609375, -1.4296875, -0.86328125, -0.296875, 0.26953125, 0.8359375, 1.40234375, 1.96875, 2.53515625, 3.1015625, 3.66796875, 4.234375, 4.80078125, 5.3671875, 5.93359375, 6.5, 7.06640625, 7.6328125, 8.19921875, 8.765625, 9.33203125, 9.8984375, 10.46484375, 11.03125, 11.59765625, 12.1640625, 12.73046875, 13.296875, 13.86328125, 14.4296875, 14.99609375, 15.5625, 16.12890625, 16.6953125, 17.26171875, 17.828125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 8.0, 11.0, 5.0, 17.0, 27.0, 21.0, 45.0, 49.0, 63.0, 47.0, 60.0, 67.0, 97.0, 77.0, 73.0, 60.0, 65.0, 52.0, 26.0, 25.0, 25.0, 27.0, 8.0, 9.0, 9.0, 7.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.921875, -21.310302734375, -20.69873046875, -20.087158203125, -19.4755859375, -18.864013671875, -18.25244140625, -17.640869140625, -17.029296875, -16.417724609375, -15.80615234375, -15.194580078125, -14.5830078125, -13.971435546875, -13.35986328125, -12.748291015625, -12.13671875, -11.525146484375, -10.91357421875, -10.302001953125, -9.6904296875, -9.078857421875, -8.46728515625, -7.855712890625, -7.244140625, -6.632568359375, -6.02099609375, -5.409423828125, -4.7978515625, -4.186279296875, -3.57470703125, -2.963134765625, -2.3515625, -1.739990234375, -1.12841796875, -0.516845703125, 0.0947265625, 0.706298828125, 1.31787109375, 1.929443359375, 2.541015625, 3.152587890625, 3.76416015625, 4.375732421875, 4.9873046875, 5.598876953125, 6.21044921875, 6.822021484375, 7.43359375, 8.045166015625, 8.65673828125, 9.268310546875, 9.8798828125, 10.491455078125, 11.10302734375, 11.714599609375, 12.326171875, 12.937744140625, 13.54931640625, 14.160888671875, 14.7724609375, 15.384033203125, 15.99560546875, 16.607177734375, 17.21875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 4.0, 9.0, 7.0, 29.0, 45.0, 78.0, 136.0, 173.0, 173.0, 108.0, 112.0, 68.0, 35.0, 12.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-622.3218994140625, -608.274169921875, -594.2264404296875, -580.1787719726562, -566.1310424804688, -552.0833129882812, -538.0355834960938, -523.9878540039062, -509.9401550292969, -495.8924255371094, -481.8447265625, -467.7969970703125, -453.7492980957031, -439.7015686035156, -425.65386962890625, -411.60614013671875, -397.55841064453125, -383.51068115234375, -369.4629821777344, -355.4152526855469, -341.3675537109375, -327.31982421875, -313.2720947265625, -299.2243957519531, -285.17669677734375, -271.12896728515625, -257.0812683105469, -243.03353881835938, -228.98582458496094, -214.9381103515625, -200.89039611816406, -186.84268188476562, -172.79495239257812, -158.7472381591797, -144.69952392578125, -130.65179443359375, -116.60408020019531, -102.55636596679688, -88.50865173339844, -74.46092987060547, -60.41321563720703, -46.36549758911133, -32.317779541015625, -18.270065307617188, -4.222347259521484, 9.825370788574219, 23.873085021972656, 37.920806884765625, 51.96852111816406, 66.0162353515625, 80.06395721435547, 94.1116714477539, 108.15939331054688, 122.20710754394531, 136.25482177734375, 150.30255126953125, 164.35025024414062, 178.39796447753906, 192.4456787109375, 206.493408203125, 220.54112243652344, 234.58883666992188, 248.6365509033203, 262.68426513671875, 276.73199462890625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 6.0, 3.0, 6.0, 10.0, 13.0, 8.0, 14.0, 15.0, 19.0, 17.0, 17.0, 26.0, 26.0, 29.0, 32.0, 31.0, 41.0, 39.0, 43.0, 38.0, 46.0, 36.0, 57.0, 39.0, 45.0, 38.0, 29.0, 27.0, 32.0, 35.0, 31.0, 24.0, 17.0, 16.0, 11.0, 12.0, 12.0, 13.0, 8.0, 6.0, 6.0, 4.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-229.58389282226562, -222.65179443359375, -215.71969604492188, -208.78759765625, -201.85549926757812, -194.92340087890625, -187.9912872314453, -181.05918884277344, -174.12709045410156, -167.1949920654297, -160.2628936767578, -153.33079528808594, -146.398681640625, -139.46658325195312, -132.53448486328125, -125.60238647460938, -118.6702880859375, -111.73818969726562, -104.80609130859375, -97.87398529052734, -90.94188690185547, -84.0097885131836, -77.07768249511719, -70.14558410644531, -63.21348571777344, -56.28138732910156, -49.34928512573242, -42.41718292236328, -35.485084533691406, -28.55298614501953, -21.62088394165039, -14.68878173828125, -7.7566680908203125, -0.8245677947998047, 6.107532501220703, 13.039632797241211, 19.97173309326172, 26.903831481933594, 33.835933685302734, 40.768035888671875, 47.70013427734375, 54.632232666015625, 61.564334869384766, 68.4964370727539, 75.42853546142578, 82.36063385009766, 89.29273986816406, 96.22483825683594, 103.15693664550781, 110.08903503417969, 117.02113342285156, 123.95323944091797, 130.88534545898438, 137.81744384765625, 144.74954223632812, 151.681640625, 158.61373901367188, 165.54583740234375, 172.47793579101562, 179.4100341796875, 186.34213256835938, 193.27423095703125, 200.2063446044922, 207.13844299316406, 214.07054138183594]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 14.0, 15.0, 23.0, 26.0, 21.0, 35.0, 31.0, 62.0, 85.0, 121.0, 157.0, 246.0, 397.0, 681.0, 1306.0, 2544.0, 5885.0, 17354.0, 95306.0, 3991038.0, 55839.0, 13191.0, 4876.0, 2149.0, 1120.0, 594.0, 378.0, 240.0, 145.0, 100.0, 90.0, 48.0, 38.0, 27.0, 25.0, 13.0, 13.0, 8.0, 6.0, 12.0, 8.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-51.21875, -49.72900390625, -48.2392578125, -46.74951171875, -45.259765625, -43.77001953125, -42.2802734375, -40.79052734375, -39.30078125, -37.81103515625, -36.3212890625, -34.83154296875, -33.341796875, -31.85205078125, -30.3623046875, -28.87255859375, -27.3828125, -25.89306640625, -24.4033203125, -22.91357421875, -21.423828125, -19.93408203125, -18.4443359375, -16.95458984375, -15.46484375, -13.97509765625, -12.4853515625, -10.99560546875, -9.505859375, -8.01611328125, -6.5263671875, -5.03662109375, -3.546875, -2.05712890625, -0.5673828125, 0.92236328125, 2.412109375, 3.90185546875, 5.3916015625, 6.88134765625, 8.37109375, 9.86083984375, 11.3505859375, 12.84033203125, 14.330078125, 15.81982421875, 17.3095703125, 18.79931640625, 20.2890625, 21.77880859375, 23.2685546875, 24.75830078125, 26.248046875, 27.73779296875, 29.2275390625, 30.71728515625, 32.20703125, 33.69677734375, 35.1865234375, 36.67626953125, 38.166015625, 39.65576171875, 41.1455078125, 42.63525390625, 44.125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 7.0, 9.0, 13.0, 12.0, 24.0, 21.0, 20.0, 30.0, 37.0, 57.0, 49.0, 66.0, 43.0, 43.0, 53.0, 48.0, 50.0, 65.0, 45.0, 49.0, 40.0, 36.0, 30.0, 30.0, 20.0, 16.0, 20.0, 17.0, 7.0, 7.0, 6.0, 4.0, 2.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.9453125, -9.62451171875, -9.3037109375, -8.98291015625, -8.662109375, -8.34130859375, -8.0205078125, -7.69970703125, -7.37890625, -7.05810546875, -6.7373046875, -6.41650390625, -6.095703125, -5.77490234375, -5.4541015625, -5.13330078125, -4.8125, -4.49169921875, -4.1708984375, -3.85009765625, -3.529296875, -3.20849609375, -2.8876953125, -2.56689453125, -2.24609375, -1.92529296875, -1.6044921875, -1.28369140625, -0.962890625, -0.64208984375, -0.3212890625, -0.00048828125, 0.3203125, 0.64111328125, 0.9619140625, 1.28271484375, 1.603515625, 1.92431640625, 2.2451171875, 2.56591796875, 2.88671875, 3.20751953125, 3.5283203125, 3.84912109375, 4.169921875, 4.49072265625, 4.8115234375, 5.13232421875, 5.453125, 5.77392578125, 6.0947265625, 6.41552734375, 6.736328125, 7.05712890625, 7.3779296875, 7.69873046875, 8.01953125, 8.34033203125, 8.6611328125, 8.98193359375, 9.302734375, 9.62353515625, 9.9443359375, 10.26513671875, 10.5859375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 7.0, 1.0, 3.0, 4.0, 8.0, 8.0, 9.0, 28.0, 18.0, 28.0, 37.0, 55.0, 71.0, 96.0, 122.0, 167.0, 241.0, 314.0, 451.0, 623.0, 826.0, 1313.0, 1838.0, 2982.0, 4717.0, 8598.0, 17651.0, 45961.0, 256101.0, 3702210.0, 92798.0, 27437.0, 11897.0, 6370.0, 3718.0, 2316.0, 1547.0, 1022.0, 726.0, 516.0, 375.0, 294.0, 200.0, 139.0, 116.0, 81.0, 73.0, 32.0, 30.0, 39.0, 27.0, 10.0, 12.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0], "bins": [-30.84375, -29.85693359375, -28.8701171875, -27.88330078125, -26.896484375, -25.90966796875, -24.9228515625, -23.93603515625, -22.94921875, -21.96240234375, -20.9755859375, -19.98876953125, -19.001953125, -18.01513671875, -17.0283203125, -16.04150390625, -15.0546875, -14.06787109375, -13.0810546875, -12.09423828125, -11.107421875, -10.12060546875, -9.1337890625, -8.14697265625, -7.16015625, -6.17333984375, -5.1865234375, -4.19970703125, -3.212890625, -2.22607421875, -1.2392578125, -0.25244140625, 0.734375, 1.72119140625, 2.7080078125, 3.69482421875, 4.681640625, 5.66845703125, 6.6552734375, 7.64208984375, 8.62890625, 9.61572265625, 10.6025390625, 11.58935546875, 12.576171875, 13.56298828125, 14.5498046875, 15.53662109375, 16.5234375, 17.51025390625, 18.4970703125, 19.48388671875, 20.470703125, 21.45751953125, 22.4443359375, 23.43115234375, 24.41796875, 25.40478515625, 26.3916015625, 27.37841796875, 28.365234375, 29.35205078125, 30.3388671875, 31.32568359375, 32.3125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 0.0, 2.0, 5.0, 8.0, 3.0, 10.0, 12.0, 11.0, 22.0, 35.0, 47.0, 143.0, 402.0, 3015.0, 162.0, 60.0, 40.0, 25.0, 24.0, 11.0, 6.0, 8.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5078125, -11.138916015625, -10.77001953125, -10.401123046875, -10.0322265625, -9.663330078125, -9.29443359375, -8.925537109375, -8.556640625, -8.187744140625, -7.81884765625, -7.449951171875, -7.0810546875, -6.712158203125, -6.34326171875, -5.974365234375, -5.60546875, -5.236572265625, -4.86767578125, -4.498779296875, -4.1298828125, -3.760986328125, -3.39208984375, -3.023193359375, -2.654296875, -2.285400390625, -1.91650390625, -1.547607421875, -1.1787109375, -0.809814453125, -0.44091796875, -0.072021484375, 0.296875, 0.665771484375, 1.03466796875, 1.403564453125, 1.7724609375, 2.141357421875, 2.51025390625, 2.879150390625, 3.248046875, 3.616943359375, 3.98583984375, 4.354736328125, 4.7236328125, 5.092529296875, 5.46142578125, 5.830322265625, 6.19921875, 6.568115234375, 6.93701171875, 7.305908203125, 7.6748046875, 8.043701171875, 8.41259765625, 8.781494140625, 9.150390625, 9.519287109375, 9.88818359375, 10.257080078125, 10.6259765625, 10.994873046875, 11.36376953125, 11.732666015625, 12.1015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 5.0, 6.0, 11.0, 19.0, 29.0, 43.0, 62.0, 72.0, 107.0, 110.0, 117.0, 118.0, 95.0, 63.0, 49.0, 32.0, 9.0, 23.0, 5.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.309356689453125, -34.74346923828125, -33.177581787109375, -31.611692428588867, -30.045804977416992, -28.479915618896484, -26.91402816772461, -25.348140716552734, -23.78225326538086, -22.216365814208984, -20.650476455688477, -19.0845890045166, -17.518701553344727, -15.952813148498535, -14.386924743652344, -12.821037292480469, -11.255147933959961, -9.68925952911377, -8.123372077941895, -6.557483673095703, -4.99159574508667, -3.4257078170776367, -1.8598194122314453, -0.2939319610595703, 1.271956443786621, 2.8378443717956543, 4.4037322998046875, 5.969620704650879, 7.535508632659912, 9.101396560668945, 10.667284965515137, 12.233172416687012, 13.799060821533203, 15.364949226379395, 16.930837631225586, 18.49672508239746, 20.062612533569336, 21.628501892089844, 23.19438934326172, 24.760276794433594, 26.32616424560547, 27.892051696777344, 29.45794105529785, 31.023828506469727, 32.589717864990234, 34.15560531616211, 35.721492767333984, 37.28738021850586, 38.853271484375, 40.419158935546875, 41.98504638671875, 43.550933837890625, 45.116825103759766, 46.68271255493164, 48.248600006103516, 49.81448745727539, 51.380374908447266, 52.94626235961914, 54.512149810791016, 56.078041076660156, 57.64392852783203, 59.209815979003906, 60.77570343017578, 62.341590881347656, 63.90747833251953]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 3.0, 5.0, 7.0, 9.0, 7.0, 12.0, 11.0, 14.0, 12.0, 21.0, 19.0, 17.0, 27.0, 32.0, 34.0, 34.0, 44.0, 44.0, 32.0, 27.0, 44.0, 35.0, 49.0, 41.0, 48.0, 35.0, 39.0, 28.0, 39.0, 30.0, 30.0, 29.0, 18.0, 19.0, 20.0, 8.0, 13.0, 8.0, 11.0, 11.0, 5.0, 5.0, 4.0, 10.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.32943344116211, -23.56981086730957, -22.81018829345703, -22.050565719604492, -21.290943145751953, -20.531320571899414, -19.771697998046875, -19.012075424194336, -18.252452850341797, -17.492830276489258, -16.73320770263672, -15.97358512878418, -15.21396255493164, -14.454339981079102, -13.694717407226562, -12.935094833374023, -12.175472259521484, -11.415849685668945, -10.656227111816406, -9.896604537963867, -9.136981964111328, -8.377359390258789, -7.61773681640625, -6.858114242553711, -6.098491668701172, -5.338869094848633, -4.579246520996094, -3.8196239471435547, -3.0600013732910156, -2.3003787994384766, -1.5407562255859375, -0.7811336517333984, -0.021511077880859375, 0.7381114959716797, 1.4977340698242188, 2.257356643676758, 3.016979217529297, 3.776601791381836, 4.536224365234375, 5.295846939086914, 6.055469512939453, 6.815092086791992, 7.574714660644531, 8.33433723449707, 9.09395980834961, 9.853582382202148, 10.613204956054688, 11.372827529907227, 12.132450103759766, 12.892072677612305, 13.651695251464844, 14.411317825317383, 15.170940399169922, 15.930562973022461, 16.690185546875, 17.44980812072754, 18.209430694580078, 18.969053268432617, 19.728675842285156, 20.488298416137695, 21.247920989990234, 22.007543563842773, 22.767166137695312, 23.52678871154785, 24.28641128540039]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 5.0, 6.0, 12.0, 12.0, 14.0, 29.0, 47.0, 68.0, 122.0, 232.0, 317.0, 557.0, 945.0, 1656.0, 3059.0, 5459.0, 10270.0, 19096.0, 35877.0, 67991.0, 124539.0, 199140.0, 223959.0, 160088.0, 90668.0, 48488.0, 25755.0, 13597.0, 7350.0, 3949.0, 2257.0, 1230.0, 684.0, 434.0, 243.0, 144.0, 77.0, 64.0, 42.0, 25.0, 18.0, 13.0, 8.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.171875, -16.63916015625, -16.1064453125, -15.57373046875, -15.041015625, -14.50830078125, -13.9755859375, -13.44287109375, -12.91015625, -12.37744140625, -11.8447265625, -11.31201171875, -10.779296875, -10.24658203125, -9.7138671875, -9.18115234375, -8.6484375, -8.11572265625, -7.5830078125, -7.05029296875, -6.517578125, -5.98486328125, -5.4521484375, -4.91943359375, -4.38671875, -3.85400390625, -3.3212890625, -2.78857421875, -2.255859375, -1.72314453125, -1.1904296875, -0.65771484375, -0.125, 0.40771484375, 0.9404296875, 1.47314453125, 2.005859375, 2.53857421875, 3.0712890625, 3.60400390625, 4.13671875, 4.66943359375, 5.2021484375, 5.73486328125, 6.267578125, 6.80029296875, 7.3330078125, 7.86572265625, 8.3984375, 8.93115234375, 9.4638671875, 9.99658203125, 10.529296875, 11.06201171875, 11.5947265625, 12.12744140625, 12.66015625, 13.19287109375, 13.7255859375, 14.25830078125, 14.791015625, 15.32373046875, 15.8564453125, 16.38916015625, 16.921875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 5.0, 7.0, 6.0, 5.0, 8.0, 15.0, 10.0, 14.0, 14.0, 16.0, 25.0, 25.0, 23.0, 36.0, 31.0, 38.0, 44.0, 52.0, 41.0, 40.0, 56.0, 47.0, 42.0, 49.0, 46.0, 40.0, 25.0, 34.0, 35.0, 24.0, 27.0, 20.0, 20.0, 9.0, 11.0, 12.0, 10.0, 7.0, 7.0, 4.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.0, -8.714599609375, -8.42919921875, -8.143798828125, -7.8583984375, -7.572998046875, -7.28759765625, -7.002197265625, -6.716796875, -6.431396484375, -6.14599609375, -5.860595703125, -5.5751953125, -5.289794921875, -5.00439453125, -4.718994140625, -4.43359375, -4.148193359375, -3.86279296875, -3.577392578125, -3.2919921875, -3.006591796875, -2.72119140625, -2.435791015625, -2.150390625, -1.864990234375, -1.57958984375, -1.294189453125, -1.0087890625, -0.723388671875, -0.43798828125, -0.152587890625, 0.1328125, 0.418212890625, 0.70361328125, 0.989013671875, 1.2744140625, 1.559814453125, 1.84521484375, 2.130615234375, 2.416015625, 2.701416015625, 2.98681640625, 3.272216796875, 3.5576171875, 3.843017578125, 4.12841796875, 4.413818359375, 4.69921875, 4.984619140625, 5.27001953125, 5.555419921875, 5.8408203125, 6.126220703125, 6.41162109375, 6.697021484375, 6.982421875, 7.267822265625, 7.55322265625, 7.838623046875, 8.1240234375, 8.409423828125, 8.69482421875, 8.980224609375, 9.265625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 1.0, 5.0, 5.0, 8.0, 9.0, 20.0, 22.0, 41.0, 62.0, 82.0, 159.0, 323.0, 764.0, 2208.0, 10501.0, 105367.0, 748967.0, 161335.0, 14342.0, 2622.0, 869.0, 382.0, 185.0, 85.0, 56.0, 45.0, 27.0, 18.0, 13.0, 8.0, 11.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.4375, -70.2802734375, -68.123046875, -65.9658203125, -63.80859375, -61.6513671875, -59.494140625, -57.3369140625, -55.1796875, -53.0224609375, -50.865234375, -48.7080078125, -46.55078125, -44.3935546875, -42.236328125, -40.0791015625, -37.921875, -35.7646484375, -33.607421875, -31.4501953125, -29.29296875, -27.1357421875, -24.978515625, -22.8212890625, -20.6640625, -18.5068359375, -16.349609375, -14.1923828125, -12.03515625, -9.8779296875, -7.720703125, -5.5634765625, -3.40625, -1.2490234375, 0.908203125, 3.0654296875, 5.22265625, 7.3798828125, 9.537109375, 11.6943359375, 13.8515625, 16.0087890625, 18.166015625, 20.3232421875, 22.48046875, 24.6376953125, 26.794921875, 28.9521484375, 31.109375, 33.2666015625, 35.423828125, 37.5810546875, 39.73828125, 41.8955078125, 44.052734375, 46.2099609375, 48.3671875, 50.5244140625, 52.681640625, 54.8388671875, 56.99609375, 59.1533203125, 61.310546875, 63.4677734375, 65.625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 6.0, 4.0, 3.0, 2.0, 9.0, 7.0, 11.0, 12.0, 8.0, 17.0, 31.0, 31.0, 24.0, 40.0, 35.0, 36.0, 35.0, 44.0, 59.0, 48.0, 69.0, 45.0, 57.0, 51.0, 46.0, 38.0, 31.0, 32.0, 30.0, 25.0, 24.0, 16.0, 14.0, 14.0, 11.0, 9.0, 7.0, 8.0, 2.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-65.0, -63.27294921875, -61.5458984375, -59.81884765625, -58.091796875, -56.36474609375, -54.6376953125, -52.91064453125, -51.18359375, -49.45654296875, -47.7294921875, -46.00244140625, -44.275390625, -42.54833984375, -40.8212890625, -39.09423828125, -37.3671875, -35.64013671875, -33.9130859375, -32.18603515625, -30.458984375, -28.73193359375, -27.0048828125, -25.27783203125, -23.55078125, -21.82373046875, -20.0966796875, -18.36962890625, -16.642578125, -14.91552734375, -13.1884765625, -11.46142578125, -9.734375, -8.00732421875, -6.2802734375, -4.55322265625, -2.826171875, -1.09912109375, 0.6279296875, 2.35498046875, 4.08203125, 5.80908203125, 7.5361328125, 9.26318359375, 10.990234375, 12.71728515625, 14.4443359375, 16.17138671875, 17.8984375, 19.62548828125, 21.3525390625, 23.07958984375, 24.806640625, 26.53369140625, 28.2607421875, 29.98779296875, 31.71484375, 33.44189453125, 35.1689453125, 36.89599609375, 38.623046875, 40.35009765625, 42.0771484375, 43.80419921875, 45.53125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 7.0, 5.0, 5.0, 6.0, 9.0, 13.0, 13.0, 35.0, 44.0, 65.0, 105.0, 182.0, 397.0, 748.0, 1967.0, 6927.0, 34491.0, 321655.0, 596530.0, 69359.0, 11004.0, 2861.0, 1018.0, 499.0, 261.0, 136.0, 87.0, 45.0, 34.0, 16.0, 9.0, 11.0, 6.0, 7.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.75, -25.91845703125, -25.0869140625, -24.25537109375, -23.423828125, -22.59228515625, -21.7607421875, -20.92919921875, -20.09765625, -19.26611328125, -18.4345703125, -17.60302734375, -16.771484375, -15.93994140625, -15.1083984375, -14.27685546875, -13.4453125, -12.61376953125, -11.7822265625, -10.95068359375, -10.119140625, -9.28759765625, -8.4560546875, -7.62451171875, -6.79296875, -5.96142578125, -5.1298828125, -4.29833984375, -3.466796875, -2.63525390625, -1.8037109375, -0.97216796875, -0.140625, 0.69091796875, 1.5224609375, 2.35400390625, 3.185546875, 4.01708984375, 4.8486328125, 5.68017578125, 6.51171875, 7.34326171875, 8.1748046875, 9.00634765625, 9.837890625, 10.66943359375, 11.5009765625, 12.33251953125, 13.1640625, 13.99560546875, 14.8271484375, 15.65869140625, 16.490234375, 17.32177734375, 18.1533203125, 18.98486328125, 19.81640625, 20.64794921875, 21.4794921875, 22.31103515625, 23.142578125, 23.97412109375, 24.8056640625, 25.63720703125, 26.46875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 12.0, 14.0, 23.0, 21.0, 31.0, 52.0, 64.0, 67.0, 112.0, 129.0, 109.0, 89.0, 72.0, 56.0, 45.0, 25.0, 18.0, 22.0, 12.0, 12.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00499725341796875, -0.004824697971343994, -0.004652142524719238, -0.004479587078094482, -0.0043070316314697266, -0.004134476184844971, -0.003961920738220215, -0.003789365291595459, -0.003616809844970703, -0.0034442543983459473, -0.0032716989517211914, -0.0030991435050964355, -0.0029265880584716797, -0.002754032611846924, -0.002581477165222168, -0.002408921718597412, -0.0022363662719726562, -0.0020638108253479004, -0.0018912553787231445, -0.0017186999320983887, -0.0015461444854736328, -0.001373589038848877, -0.001201033592224121, -0.0010284781455993652, -0.0008559226989746094, -0.0006833672523498535, -0.0005108118057250977, -0.0003382563591003418, -0.00016570091247558594, 6.854534149169922e-06, 0.00017940998077392578, 0.00035196542739868164, 0.0005245208740234375, 0.0006970763206481934, 0.0008696317672729492, 0.001042187213897705, 0.001214742660522461, 0.0013872981071472168, 0.0015598535537719727, 0.0017324090003967285, 0.0019049644470214844, 0.0020775198936462402, 0.002250075340270996, 0.002422630786895752, 0.002595186233520508, 0.0027677416801452637, 0.0029402971267700195, 0.0031128525733947754, 0.0032854080200195312, 0.003457963466644287, 0.003630518913269043, 0.003803074359893799, 0.003975629806518555, 0.0041481852531433105, 0.004320740699768066, 0.004493296146392822, 0.004665851593017578, 0.004838407039642334, 0.00501096248626709, 0.005183517932891846, 0.0053560733795166016, 0.005528628826141357, 0.005701184272766113, 0.005873739719390869, 0.006046295166015625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 14.0, 9.0, 11.0, 29.0, 38.0, 79.0, 125.0, 188.0, 383.0, 862.0, 2285.0, 7655.0, 42870.0, 432204.0, 499263.0, 49716.0, 8476.0, 2448.0, 917.0, 424.0, 243.0, 124.0, 66.0, 36.0, 37.0, 17.0, 13.0, 6.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.484375, -30.63427734375, -29.7841796875, -28.93408203125, -28.083984375, -27.23388671875, -26.3837890625, -25.53369140625, -24.68359375, -23.83349609375, -22.9833984375, -22.13330078125, -21.283203125, -20.43310546875, -19.5830078125, -18.73291015625, -17.8828125, -17.03271484375, -16.1826171875, -15.33251953125, -14.482421875, -13.63232421875, -12.7822265625, -11.93212890625, -11.08203125, -10.23193359375, -9.3818359375, -8.53173828125, -7.681640625, -6.83154296875, -5.9814453125, -5.13134765625, -4.28125, -3.43115234375, -2.5810546875, -1.73095703125, -0.880859375, -0.03076171875, 0.8193359375, 1.66943359375, 2.51953125, 3.36962890625, 4.2197265625, 5.06982421875, 5.919921875, 6.77001953125, 7.6201171875, 8.47021484375, 9.3203125, 10.17041015625, 11.0205078125, 11.87060546875, 12.720703125, 13.57080078125, 14.4208984375, 15.27099609375, 16.12109375, 16.97119140625, 17.8212890625, 18.67138671875, 19.521484375, 20.37158203125, 21.2216796875, 22.07177734375, 22.921875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 15.0, 19.0, 28.0, 55.0, 108.0, 115.0, 157.0, 137.0, 127.0, 85.0, 78.0, 34.0, 19.0, 11.0, 2.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.5625, -55.279052734375, -53.99560546875, -52.712158203125, -51.4287109375, -50.145263671875, -48.86181640625, -47.578369140625, -46.294921875, -45.011474609375, -43.72802734375, -42.444580078125, -41.1611328125, -39.877685546875, -38.59423828125, -37.310791015625, -36.02734375, -34.743896484375, -33.46044921875, -32.177001953125, -30.8935546875, -29.610107421875, -28.32666015625, -27.043212890625, -25.759765625, -24.476318359375, -23.19287109375, -21.909423828125, -20.6259765625, -19.342529296875, -18.05908203125, -16.775634765625, -15.4921875, -14.208740234375, -12.92529296875, -11.641845703125, -10.3583984375, -9.074951171875, -7.79150390625, -6.508056640625, -5.224609375, -3.941162109375, -2.65771484375, -1.374267578125, -0.0908203125, 1.192626953125, 2.47607421875, 3.759521484375, 5.04296875, 6.326416015625, 7.60986328125, 8.893310546875, 10.1767578125, 11.460205078125, 12.74365234375, 14.027099609375, 15.310546875, 16.593994140625, 17.87744140625, 19.160888671875, 20.4443359375, 21.727783203125, 23.01123046875, 24.294677734375, 25.578125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 8.0, 9.0, 18.0, 33.0, 48.0, 72.0, 151.0, 145.0, 144.0, 140.0, 107.0, 53.0, 33.0, 19.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.70428466796875, -259.2803955078125, -245.8564910888672, -232.43260192871094, -219.00869750976562, -205.58480834960938, -192.16091918945312, -178.73703002929688, -165.31312561035156, -151.8892364501953, -138.46533203125, -125.04144287109375, -111.61754608154297, -98.19364929199219, -84.76976013183594, -71.34586334228516, -57.921966552734375, -44.498069763183594, -31.074176788330078, -17.650283813476562, -4.226387023925781, 9.197509765625, 22.62139892578125, 36.04529571533203, 49.46919250488281, 62.893089294433594, 76.31698608398438, 89.74087524414062, 103.1647720336914, 116.58866882324219, 130.01255798339844, 143.43646240234375, 156.8603515625, 170.28424072265625, 183.70814514160156, 197.1320343017578, 210.55593872070312, 223.97982788085938, 237.40371704101562, 250.82760620117188, 264.25152587890625, 277.6754150390625, 291.09930419921875, 304.523193359375, 317.9471130371094, 331.3710021972656, 344.7948913574219, 358.2187805175781, 371.6426696777344, 385.0665588378906, 398.4904479980469, 411.91436767578125, 425.3382568359375, 438.76214599609375, 452.18603515625, 465.60992431640625, 479.0338134765625, 492.45770263671875, 505.881591796875, 519.3054809570312, 532.7293701171875, 546.1533203125, 559.5771484375, 573.0010986328125, 586.4249877929688]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 8.0, 4.0, 10.0, 13.0, 10.0, 20.0, 12.0, 26.0, 27.0, 30.0, 30.0, 40.0, 52.0, 32.0, 40.0, 43.0, 53.0, 51.0, 50.0, 59.0, 36.0, 51.0, 53.0, 35.0, 39.0, 29.0, 13.0, 23.0, 17.0, 19.0, 9.0, 12.0, 13.0, 9.0, 3.0, 8.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-251.95574951171875, -244.38369750976562, -236.81163024902344, -229.2395782470703, -221.66751098632812, -214.095458984375, -206.5233917236328, -198.9513397216797, -191.3792724609375, -183.80722045898438, -176.2351531982422, -168.66310119628906, -161.09103393554688, -153.51898193359375, -145.94691467285156, -138.37486267089844, -130.80279541015625, -123.2307357788086, -115.65867614746094, -108.08661651611328, -100.51455688476562, -92.9425048828125, -85.37043762207031, -77.79838562011719, -70.22633361816406, -62.654273986816406, -55.08221435546875, -47.510154724121094, -39.93809509277344, -32.36603927612305, -24.79397964477539, -17.221920013427734, -9.649856567382812, -2.0777974128723145, 5.494261741638184, 13.066320419311523, 20.63838005065918, 28.210437774658203, 35.78249740600586, 43.354557037353516, 50.92661666870117, 58.49867630004883, 66.07073211669922, 73.64279174804688, 81.21485137939453, 88.78691101074219, 96.35897064208984, 103.9310302734375, 111.50308990478516, 119.07514953613281, 126.64720916748047, 134.21926879882812, 141.79132080078125, 149.36338806152344, 156.93544006347656, 164.50750732421875, 172.07955932617188, 179.651611328125, 187.2236785888672, 194.7957305908203, 202.3677978515625, 209.93984985351562, 217.5119171142578, 225.08396911621094, 232.65603637695312]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 6.0, 6.0, 11.0, 17.0, 24.0, 26.0, 41.0, 50.0, 77.0, 123.0, 192.0, 301.0, 581.0, 1064.0, 2219.0, 5477.0, 17363.0, 3944348.0, 198028.0, 14802.0, 5003.0, 2121.0, 1012.0, 471.0, 344.0, 197.0, 114.0, 85.0, 53.0, 38.0, 28.0, 14.0, 10.0, 9.0, 15.0, 7.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-76.25, -74.2919921875, -72.333984375, -70.3759765625, -68.41796875, -66.4599609375, -64.501953125, -62.5439453125, -60.5859375, -58.6279296875, -56.669921875, -54.7119140625, -52.75390625, -50.7958984375, -48.837890625, -46.8798828125, -44.921875, -42.9638671875, -41.005859375, -39.0478515625, -37.08984375, -35.1318359375, -33.173828125, -31.2158203125, -29.2578125, -27.2998046875, -25.341796875, -23.3837890625, -21.42578125, -19.4677734375, -17.509765625, -15.5517578125, -13.59375, -11.6357421875, -9.677734375, -7.7197265625, -5.76171875, -3.8037109375, -1.845703125, 0.1123046875, 2.0703125, 4.0283203125, 5.986328125, 7.9443359375, 9.90234375, 11.8603515625, 13.818359375, 15.7763671875, 17.734375, 19.6923828125, 21.650390625, 23.6083984375, 25.56640625, 27.5244140625, 29.482421875, 31.4404296875, 33.3984375, 35.3564453125, 37.314453125, 39.2724609375, 41.23046875, 43.1884765625, 45.146484375, 47.1044921875, 49.0625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 7.0, 5.0, 14.0, 20.0, 18.0, 21.0, 29.0, 38.0, 59.0, 59.0, 73.0, 71.0, 68.0, 82.0, 60.0, 66.0, 68.0, 48.0, 42.0, 38.0, 34.0, 15.0, 15.0, 14.0, 10.0, 1.0, 9.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-20.359375, -19.863525390625, -19.36767578125, -18.871826171875, -18.3759765625, -17.880126953125, -17.38427734375, -16.888427734375, -16.392578125, -15.896728515625, -15.40087890625, -14.905029296875, -14.4091796875, -13.913330078125, -13.41748046875, -12.921630859375, -12.42578125, -11.929931640625, -11.43408203125, -10.938232421875, -10.4423828125, -9.946533203125, -9.45068359375, -8.954833984375, -8.458984375, -7.963134765625, -7.46728515625, -6.971435546875, -6.4755859375, -5.979736328125, -5.48388671875, -4.988037109375, -4.4921875, -3.996337890625, -3.50048828125, -3.004638671875, -2.5087890625, -2.012939453125, -1.51708984375, -1.021240234375, -0.525390625, -0.029541015625, 0.46630859375, 0.962158203125, 1.4580078125, 1.953857421875, 2.44970703125, 2.945556640625, 3.44140625, 3.937255859375, 4.43310546875, 4.928955078125, 5.4248046875, 5.920654296875, 6.41650390625, 6.912353515625, 7.408203125, 7.904052734375, 8.39990234375, 8.895751953125, 9.3916015625, 9.887451171875, 10.38330078125, 10.879150390625, 11.375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 8.0, 10.0, 15.0, 23.0, 31.0, 30.0, 51.0, 56.0, 69.0, 120.0, 147.0, 187.0, 304.0, 456.0, 652.0, 1108.0, 1901.0, 3977.0, 11190.0, 54705.0, 4022416.0, 73891.0, 12820.0, 4437.0, 2146.0, 1231.0, 721.0, 436.0, 308.0, 238.0, 168.0, 120.0, 83.0, 66.0, 43.0, 29.0, 29.0, 21.0, 8.0, 14.0, 4.0, 1.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.03125, -48.3388671875, -46.646484375, -44.9541015625, -43.26171875, -41.5693359375, -39.876953125, -38.1845703125, -36.4921875, -34.7998046875, -33.107421875, -31.4150390625, -29.72265625, -28.0302734375, -26.337890625, -24.6455078125, -22.953125, -21.2607421875, -19.568359375, -17.8759765625, -16.18359375, -14.4912109375, -12.798828125, -11.1064453125, -9.4140625, -7.7216796875, -6.029296875, -4.3369140625, -2.64453125, -0.9521484375, 0.740234375, 2.4326171875, 4.125, 5.8173828125, 7.509765625, 9.2021484375, 10.89453125, 12.5869140625, 14.279296875, 15.9716796875, 17.6640625, 19.3564453125, 21.048828125, 22.7412109375, 24.43359375, 26.1259765625, 27.818359375, 29.5107421875, 31.203125, 32.8955078125, 34.587890625, 36.2802734375, 37.97265625, 39.6650390625, 41.357421875, 43.0498046875, 44.7421875, 46.4345703125, 48.126953125, 49.8193359375, 51.51171875, 53.2041015625, 54.896484375, 56.5888671875, 58.28125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 13.0, 15.0, 41.0, 66.0, 554.0, 3218.0, 80.0, 37.0, 15.0, 9.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.734375, -16.2119140625, -15.689453125, -15.1669921875, -14.64453125, -14.1220703125, -13.599609375, -13.0771484375, -12.5546875, -12.0322265625, -11.509765625, -10.9873046875, -10.46484375, -9.9423828125, -9.419921875, -8.8974609375, -8.375, -7.8525390625, -7.330078125, -6.8076171875, -6.28515625, -5.7626953125, -5.240234375, -4.7177734375, -4.1953125, -3.6728515625, -3.150390625, -2.6279296875, -2.10546875, -1.5830078125, -1.060546875, -0.5380859375, -0.015625, 0.5068359375, 1.029296875, 1.5517578125, 2.07421875, 2.5966796875, 3.119140625, 3.6416015625, 4.1640625, 4.6865234375, 5.208984375, 5.7314453125, 6.25390625, 6.7763671875, 7.298828125, 7.8212890625, 8.34375, 8.8662109375, 9.388671875, 9.9111328125, 10.43359375, 10.9560546875, 11.478515625, 12.0009765625, 12.5234375, 13.0458984375, 13.568359375, 14.0908203125, 14.61328125, 15.1357421875, 15.658203125, 16.1806640625, 16.703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 5.0, 10.0, 15.0, 15.0, 13.0, 26.0, 38.0, 32.0, 55.0, 68.0, 84.0, 93.0, 84.0, 72.0, 89.0, 52.0, 58.0, 28.0, 34.0, 31.0, 19.0, 17.0, 16.0, 9.0, 10.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-32.59568786621094, -31.655426025390625, -30.715166091918945, -29.774904251098633, -28.834644317626953, -27.89438247680664, -26.954120635986328, -26.01386070251465, -25.07360076904297, -24.133338928222656, -23.193078994750977, -22.252817153930664, -21.312557220458984, -20.372295379638672, -19.43203353881836, -18.49177360534668, -17.551511764526367, -16.611249923706055, -15.670989990234375, -14.730728149414062, -13.790468215942383, -12.85020637512207, -11.909945487976074, -10.969684600830078, -10.029423713684082, -9.089162826538086, -8.14890193939209, -7.2086405754089355, -6.2683796882629395, -5.328118801116943, -4.387857437133789, -3.447596549987793, -2.5073375701904297, -1.567076563835144, -0.6268155574798584, 0.3134455680847168, 1.253706455230713, 2.193967342376709, 3.1342287063598633, 4.074489593505859, 5.0147504806518555, 5.955011367797852, 6.895272254943848, 7.835533618927002, 8.775794982910156, 9.716054916381836, 10.656316757202148, 11.596577644348145, 12.53683853149414, 13.477099418640137, 14.417360305786133, 15.357622146606445, 16.297882080078125, 17.238143920898438, 18.17840576171875, 19.11866569519043, 20.05892562866211, 20.999187469482422, 21.9394474029541, 22.879709243774414, 23.819969177246094, 24.760231018066406, 25.70049285888672, 26.6407527923584, 27.58101463317871]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 5.0, 18.0, 5.0, 11.0, 10.0, 16.0, 14.0, 19.0, 25.0, 24.0, 30.0, 26.0, 27.0, 32.0, 29.0, 33.0, 41.0, 46.0, 46.0, 34.0, 44.0, 38.0, 47.0, 33.0, 48.0, 32.0, 42.0, 33.0, 34.0, 26.0, 15.0, 13.0, 15.0, 10.0, 16.0, 7.0, 11.0, 10.0, 8.0, 4.0, 7.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-22.058170318603516, -21.379589080810547, -20.70100975036621, -20.022430419921875, -19.343849182128906, -18.665267944335938, -17.9866886138916, -17.308109283447266, -16.629528045654297, -15.950947761535645, -15.272367477416992, -14.59378719329834, -13.915206909179688, -13.236626625061035, -12.558046340942383, -11.87946605682373, -11.200885772705078, -10.522305488586426, -9.843725204467773, -9.165144920349121, -8.486564636230469, -7.807984352111816, -7.129404067993164, -6.450823783874512, -5.772243499755859, -5.093663215637207, -4.415082931518555, -3.7365026473999023, -3.05792236328125, -2.3793420791625977, -1.7007617950439453, -1.022181510925293, -0.3436012268066406, 0.3349790573120117, 1.013559341430664, 1.6921396255493164, 2.3707199096679688, 3.049300193786621, 3.7278804779052734, 4.406460762023926, 5.085041046142578, 5.7636213302612305, 6.442201614379883, 7.120781898498535, 7.7993621826171875, 8.47794246673584, 9.156522750854492, 9.835103034973145, 10.513683319091797, 11.19226360321045, 11.870843887329102, 12.549424171447754, 13.228004455566406, 13.906584739685059, 14.585165023803711, 15.263745307922363, 15.942325592041016, 16.620906829833984, 17.29948616027832, 17.978065490722656, 18.656646728515625, 19.335227966308594, 20.01380729675293, 20.692386627197266, 21.370967864990234]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 15.0, 39.0, 67.0, 127.0, 226.0, 411.0, 965.0, 2225.0, 6468.0, 19107.0, 65871.0, 230055.0, 443187.0, 197632.0, 56225.0, 16695.0, 5529.0, 2042.0, 834.0, 385.0, 198.0, 106.0, 51.0, 32.0, 17.0, 11.0, 9.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.765625, -25.753173828125, -24.74072265625, -23.728271484375, -22.7158203125, -21.703369140625, -20.69091796875, -19.678466796875, -18.666015625, -17.653564453125, -16.64111328125, -15.628662109375, -14.6162109375, -13.603759765625, -12.59130859375, -11.578857421875, -10.56640625, -9.553955078125, -8.54150390625, -7.529052734375, -6.5166015625, -5.504150390625, -4.49169921875, -3.479248046875, -2.466796875, -1.454345703125, -0.44189453125, 0.570556640625, 1.5830078125, 2.595458984375, 3.60791015625, 4.620361328125, 5.6328125, 6.645263671875, 7.65771484375, 8.670166015625, 9.6826171875, 10.695068359375, 11.70751953125, 12.719970703125, 13.732421875, 14.744873046875, 15.75732421875, 16.769775390625, 17.7822265625, 18.794677734375, 19.80712890625, 20.819580078125, 21.83203125, 22.844482421875, 23.85693359375, 24.869384765625, 25.8818359375, 26.894287109375, 27.90673828125, 28.919189453125, 29.931640625, 30.944091796875, 31.95654296875, 32.968994140625, 33.9814453125, 34.993896484375, 36.00634765625, 37.018798828125, 38.03125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 3.0, 6.0, 3.0, 14.0, 15.0, 13.0, 25.0, 32.0, 24.0, 38.0, 54.0, 41.0, 53.0, 47.0, 62.0, 65.0, 57.0, 47.0, 66.0, 55.0, 48.0, 38.0, 31.0, 28.0, 29.0, 24.0, 22.0, 9.0, 10.0, 9.0, 5.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-15.640625, -15.204345703125, -14.76806640625, -14.331787109375, -13.8955078125, -13.459228515625, -13.02294921875, -12.586669921875, -12.150390625, -11.714111328125, -11.27783203125, -10.841552734375, -10.4052734375, -9.968994140625, -9.53271484375, -9.096435546875, -8.66015625, -8.223876953125, -7.78759765625, -7.351318359375, -6.9150390625, -6.478759765625, -6.04248046875, -5.606201171875, -5.169921875, -4.733642578125, -4.29736328125, -3.861083984375, -3.4248046875, -2.988525390625, -2.55224609375, -2.115966796875, -1.6796875, -1.243408203125, -0.80712890625, -0.370849609375, 0.0654296875, 0.501708984375, 0.93798828125, 1.374267578125, 1.810546875, 2.246826171875, 2.68310546875, 3.119384765625, 3.5556640625, 3.991943359375, 4.42822265625, 4.864501953125, 5.30078125, 5.737060546875, 6.17333984375, 6.609619140625, 7.0458984375, 7.482177734375, 7.91845703125, 8.354736328125, 8.791015625, 9.227294921875, 9.66357421875, 10.099853515625, 10.5361328125, 10.972412109375, 11.40869140625, 11.844970703125, 12.28125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 17.0, 20.0, 30.0, 28.0, 45.0, 84.0, 125.0, 167.0, 287.0, 557.0, 1094.0, 2404.0, 8373.0, 55530.0, 602467.0, 337339.0, 30509.0, 5526.0, 1869.0, 805.0, 476.0, 264.0, 150.0, 101.0, 83.0, 46.0, 33.0, 31.0, 21.0, 15.0, 8.0, 8.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-74.875, -72.84375, -70.8125, -68.78125, -66.75, -64.71875, -62.6875, -60.65625, -58.625, -56.59375, -54.5625, -52.53125, -50.5, -48.46875, -46.4375, -44.40625, -42.375, -40.34375, -38.3125, -36.28125, -34.25, -32.21875, -30.1875, -28.15625, -26.125, -24.09375, -22.0625, -20.03125, -18.0, -15.96875, -13.9375, -11.90625, -9.875, -7.84375, -5.8125, -3.78125, -1.75, 0.28125, 2.3125, 4.34375, 6.375, 8.40625, 10.4375, 12.46875, 14.5, 16.53125, 18.5625, 20.59375, 22.625, 24.65625, 26.6875, 28.71875, 30.75, 32.78125, 34.8125, 36.84375, 38.875, 40.90625, 42.9375, 44.96875, 47.0, 49.03125, 51.0625, 53.09375, 55.125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 8.0, 4.0, 10.0, 13.0, 21.0, 21.0, 23.0, 30.0, 38.0, 46.0, 53.0, 65.0, 62.0, 79.0, 78.0, 73.0, 70.0, 54.0, 49.0, 39.0, 29.0, 30.0, 27.0, 18.0, 15.0, 8.0, 6.0, 12.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-112.9375, -109.9365234375, -106.935546875, -103.9345703125, -100.93359375, -97.9326171875, -94.931640625, -91.9306640625, -88.9296875, -85.9287109375, -82.927734375, -79.9267578125, -76.92578125, -73.9248046875, -70.923828125, -67.9228515625, -64.921875, -61.9208984375, -58.919921875, -55.9189453125, -52.91796875, -49.9169921875, -46.916015625, -43.9150390625, -40.9140625, -37.9130859375, -34.912109375, -31.9111328125, -28.91015625, -25.9091796875, -22.908203125, -19.9072265625, -16.90625, -13.9052734375, -10.904296875, -7.9033203125, -4.90234375, -1.9013671875, 1.099609375, 4.1005859375, 7.1015625, 10.1025390625, 13.103515625, 16.1044921875, 19.10546875, 22.1064453125, 25.107421875, 28.1083984375, 31.109375, 34.1103515625, 37.111328125, 40.1123046875, 43.11328125, 46.1142578125, 49.115234375, 52.1162109375, 55.1171875, 58.1181640625, 61.119140625, 64.1201171875, 67.12109375, 70.1220703125, 73.123046875, 76.1240234375, 79.125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 5.0, 6.0, 8.0, 13.0, 14.0, 36.0, 32.0, 49.0, 56.0, 90.0, 129.0, 213.0, 350.0, 847.0, 2912.0, 20865.0, 721503.0, 286630.0, 11194.0, 2005.0, 689.0, 287.0, 185.0, 119.0, 74.0, 53.0, 46.0, 28.0, 16.0, 30.0, 20.0, 8.0, 15.0, 9.0, 3.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.78125, -59.0869140625, -57.392578125, -55.6982421875, -54.00390625, -52.3095703125, -50.615234375, -48.9208984375, -47.2265625, -45.5322265625, -43.837890625, -42.1435546875, -40.44921875, -38.7548828125, -37.060546875, -35.3662109375, -33.671875, -31.9775390625, -30.283203125, -28.5888671875, -26.89453125, -25.2001953125, -23.505859375, -21.8115234375, -20.1171875, -18.4228515625, -16.728515625, -15.0341796875, -13.33984375, -11.6455078125, -9.951171875, -8.2568359375, -6.5625, -4.8681640625, -3.173828125, -1.4794921875, 0.21484375, 1.9091796875, 3.603515625, 5.2978515625, 6.9921875, 8.6865234375, 10.380859375, 12.0751953125, 13.76953125, 15.4638671875, 17.158203125, 18.8525390625, 20.546875, 22.2412109375, 23.935546875, 25.6298828125, 27.32421875, 29.0185546875, 30.712890625, 32.4072265625, 34.1015625, 35.7958984375, 37.490234375, 39.1845703125, 40.87890625, 42.5732421875, 44.267578125, 45.9619140625, 47.65625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 7.0, 7.0, 5.0, 8.0, 6.0, 11.0, 11.0, 13.0, 20.0, 24.0, 50.0, 50.0, 74.0, 93.0, 97.0, 108.0, 77.0, 84.0, 66.0, 38.0, 26.0, 29.0, 18.0, 22.0, 11.0, 10.0, 7.0, 10.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.005313873291015625, -0.005152761936187744, -0.004991650581359863, -0.004830539226531982, -0.0046694278717041016, -0.004508316516876221, -0.00434720516204834, -0.004186093807220459, -0.004024982452392578, -0.0038638710975646973, -0.0037027597427368164, -0.0035416483879089355, -0.0033805370330810547, -0.003219425678253174, -0.003058314323425293, -0.002897202968597412, -0.0027360916137695312, -0.0025749802589416504, -0.0024138689041137695, -0.0022527575492858887, -0.002091646194458008, -0.001930534839630127, -0.001769423484802246, -0.0016083121299743652, -0.0014472007751464844, -0.0012860894203186035, -0.0011249780654907227, -0.0009638667106628418, -0.0008027553558349609, -0.0006416440010070801, -0.0004805326461791992, -0.00031942129135131836, -0.0001583099365234375, 2.8014183044433594e-06, 0.00016391277313232422, 0.0003250241279602051, 0.00048613548278808594, 0.0006472468376159668, 0.0008083581924438477, 0.0009694695472717285, 0.0011305809020996094, 0.0012916922569274902, 0.001452803611755371, 0.001613914966583252, 0.0017750263214111328, 0.0019361376762390137, 0.0020972490310668945, 0.0022583603858947754, 0.0024194717407226562, 0.002580583095550537, 0.002741694450378418, 0.002902805805206299, 0.0030639171600341797, 0.0032250285148620605, 0.0033861398696899414, 0.0035472512245178223, 0.003708362579345703, 0.003869473934173584, 0.004030585289001465, 0.004191696643829346, 0.0043528079986572266, 0.004513919353485107, 0.004675030708312988, 0.004836142063140869, 0.00499725341796875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 7.0, 9.0, 10.0, 11.0, 20.0, 23.0, 20.0, 27.0, 39.0, 41.0, 57.0, 80.0, 96.0, 176.0, 243.0, 484.0, 878.0, 2207.0, 6549.0, 30474.0, 356646.0, 590710.0, 46062.0, 8574.0, 2670.0, 1045.0, 514.0, 243.0, 161.0, 112.0, 83.0, 68.0, 46.0, 31.0, 29.0, 19.0, 15.0, 20.0, 9.0, 10.0, 6.0, 10.0, 5.0, 2.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-34.96875, -33.87939453125, -32.7900390625, -31.70068359375, -30.611328125, -29.52197265625, -28.4326171875, -27.34326171875, -26.25390625, -25.16455078125, -24.0751953125, -22.98583984375, -21.896484375, -20.80712890625, -19.7177734375, -18.62841796875, -17.5390625, -16.44970703125, -15.3603515625, -14.27099609375, -13.181640625, -12.09228515625, -11.0029296875, -9.91357421875, -8.82421875, -7.73486328125, -6.6455078125, -5.55615234375, -4.466796875, -3.37744140625, -2.2880859375, -1.19873046875, -0.109375, 0.97998046875, 2.0693359375, 3.15869140625, 4.248046875, 5.33740234375, 6.4267578125, 7.51611328125, 8.60546875, 9.69482421875, 10.7841796875, 11.87353515625, 12.962890625, 14.05224609375, 15.1416015625, 16.23095703125, 17.3203125, 18.40966796875, 19.4990234375, 20.58837890625, 21.677734375, 22.76708984375, 23.8564453125, 24.94580078125, 26.03515625, 27.12451171875, 28.2138671875, 29.30322265625, 30.392578125, 31.48193359375, 32.5712890625, 33.66064453125, 34.75]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 5.0, 4.0, 4.0, 4.0, 9.0, 10.0, 14.0, 13.0, 20.0, 27.0, 57.0, 71.0, 110.0, 136.0, 123.0, 110.0, 73.0, 58.0, 41.0, 32.0, 14.0, 14.0, 4.0, 10.0, 6.0, 5.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.375, -37.1044921875, -35.833984375, -34.5634765625, -33.29296875, -32.0224609375, -30.751953125, -29.4814453125, -28.2109375, -26.9404296875, -25.669921875, -24.3994140625, -23.12890625, -21.8583984375, -20.587890625, -19.3173828125, -18.046875, -16.7763671875, -15.505859375, -14.2353515625, -12.96484375, -11.6943359375, -10.423828125, -9.1533203125, -7.8828125, -6.6123046875, -5.341796875, -4.0712890625, -2.80078125, -1.5302734375, -0.259765625, 1.0107421875, 2.28125, 3.5517578125, 4.822265625, 6.0927734375, 7.36328125, 8.6337890625, 9.904296875, 11.1748046875, 12.4453125, 13.7158203125, 14.986328125, 16.2568359375, 17.52734375, 18.7978515625, 20.068359375, 21.3388671875, 22.609375, 23.8798828125, 25.150390625, 26.4208984375, 27.69140625, 28.9619140625, 30.232421875, 31.5029296875, 32.7734375, 34.0439453125, 35.314453125, 36.5849609375, 37.85546875, 39.1259765625, 40.396484375, 41.6669921875, 42.9375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 26.0, 85.0, 239.0, 338.0, 191.0, 79.0, 22.0, 7.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1312.932373046875, -1284.653076171875, -1256.3736572265625, -1228.0943603515625, -1199.8150634765625, -1171.53564453125, -1143.25634765625, -1114.97705078125, -1086.69775390625, -1058.41845703125, -1030.1390380859375, -1001.8597412109375, -973.5804443359375, -945.3010864257812, -917.021728515625, -888.742431640625, -860.4630126953125, -832.1836547851562, -803.9043579101562, -775.625, -747.345703125, -719.0663452148438, -690.7869873046875, -662.5076904296875, -634.2283325195312, -605.948974609375, -577.669677734375, -549.3903198242188, -521.1109619140625, -492.8316650390625, -464.55230712890625, -436.2729797363281, -407.9936828613281, -379.71435546875, -351.43499755859375, -323.1556701660156, -294.8763427734375, -266.5970153808594, -238.3176727294922, -210.038330078125, -181.75900268554688, -153.47967529296875, -125.20033264160156, -96.9209976196289, -68.64166259765625, -40.362335205078125, -12.082992553710938, 16.19635009765625, 44.475677490234375, 72.75501251220703, 101.03434753417969, 129.31369018554688, 157.593017578125, 185.87234497070312, 214.1516876220703, 242.4310302734375, 270.7103576660156, 298.98968505859375, 327.26904296875, 355.5483703613281, 383.82769775390625, 412.1070251464844, 440.3863525390625, 468.66571044921875, 496.9450378417969]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 7.0, 6.0, 10.0, 17.0, 18.0, 14.0, 15.0, 23.0, 30.0, 24.0, 29.0, 33.0, 38.0, 54.0, 54.0, 42.0, 56.0, 43.0, 43.0, 42.0, 41.0, 51.0, 34.0, 32.0, 27.0, 32.0, 28.0, 24.0, 21.0, 16.0, 17.0, 14.0, 8.0, 8.0, 9.0, 7.0, 4.0, 2.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-265.7063903808594, -257.3807373046875, -249.05506896972656, -240.72940063476562, -232.40374755859375, -224.07809448242188, -215.75242614746094, -207.4267578125, -199.10110473632812, -190.77545166015625, -182.4497833251953, -174.12411499023438, -165.7984619140625, -157.47280883789062, -149.1471405029297, -140.82147216796875, -132.49581909179688, -124.17015838623047, -115.84449768066406, -107.51883697509766, -99.19317626953125, -90.86751556396484, -82.54185485839844, -74.21619415283203, -65.89053344726562, -57.56487274169922, -49.23921203613281, -40.913551330566406, -32.587890625, -24.262229919433594, -15.936569213867188, -7.610908508300781, 0.7147216796875, 9.040382385253906, 17.366043090820312, 25.69170379638672, 34.017364501953125, 42.34302520751953, 50.66868591308594, 58.994346618652344, 67.32000732421875, 75.64566802978516, 83.97132873535156, 92.29698944091797, 100.62265014648438, 108.94831085205078, 117.27397155761719, 125.5996322631836, 133.92529296875, 142.25094604492188, 150.5766143798828, 158.90228271484375, 167.22793579101562, 175.5535888671875, 183.87925720214844, 192.20492553710938, 200.53057861328125, 208.85623168945312, 217.18190002441406, 225.507568359375, 233.83322143554688, 242.15887451171875, 250.4845428466797, 258.8102111816406, 267.1358642578125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 8.0, 6.0, 9.0, 10.0, 12.0, 15.0, 42.0, 65.0, 95.0, 195.0, 484.0, 1739.0, 17797.0, 4120615.0, 48862.0, 3085.0, 669.0, 256.0, 131.0, 74.0, 38.0, 35.0, 22.0, 9.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-150.0, -146.5634765625, -143.126953125, -139.6904296875, -136.25390625, -132.8173828125, -129.380859375, -125.9443359375, -122.5078125, -119.0712890625, -115.634765625, -112.1982421875, -108.76171875, -105.3251953125, -101.888671875, -98.4521484375, -95.015625, -91.5791015625, -88.142578125, -84.7060546875, -81.26953125, -77.8330078125, -74.396484375, -70.9599609375, -67.5234375, -64.0869140625, -60.650390625, -57.2138671875, -53.77734375, -50.3408203125, -46.904296875, -43.4677734375, -40.03125, -36.5947265625, -33.158203125, -29.7216796875, -26.28515625, -22.8486328125, -19.412109375, -15.9755859375, -12.5390625, -9.1025390625, -5.666015625, -2.2294921875, 1.20703125, 4.6435546875, 8.080078125, 11.5166015625, 14.953125, 18.3896484375, 21.826171875, 25.2626953125, 28.69921875, 32.1357421875, 35.572265625, 39.0087890625, 42.4453125, 45.8818359375, 49.318359375, 52.7548828125, 56.19140625, 59.6279296875, 63.064453125, 66.5009765625, 69.9375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 12.0, 10.0, 11.0, 9.0, 20.0, 23.0, 28.0, 34.0, 44.0, 41.0, 63.0, 66.0, 59.0, 55.0, 66.0, 57.0, 63.0, 57.0, 41.0, 43.0, 36.0, 32.0, 32.0, 12.0, 24.0, 7.0, 16.0, 6.0, 7.0, 3.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.5234375, -11.0843505859375, -10.645263671875, -10.2061767578125, -9.76708984375, -9.3280029296875, -8.888916015625, -8.4498291015625, -8.0107421875, -7.5716552734375, -7.132568359375, -6.6934814453125, -6.25439453125, -5.8153076171875, -5.376220703125, -4.9371337890625, -4.498046875, -4.0589599609375, -3.619873046875, -3.1807861328125, -2.74169921875, -2.3026123046875, -1.863525390625, -1.4244384765625, -0.9853515625, -0.5462646484375, -0.107177734375, 0.3319091796875, 0.77099609375, 1.2100830078125, 1.649169921875, 2.0882568359375, 2.52734375, 2.9664306640625, 3.405517578125, 3.8446044921875, 4.28369140625, 4.7227783203125, 5.161865234375, 5.6009521484375, 6.0400390625, 6.4791259765625, 6.918212890625, 7.3572998046875, 7.79638671875, 8.2354736328125, 8.674560546875, 9.1136474609375, 9.552734375, 9.9918212890625, 10.430908203125, 10.8699951171875, 11.30908203125, 11.7481689453125, 12.187255859375, 12.6263427734375, 13.0654296875, 13.5045166015625, 13.943603515625, 14.3826904296875, 14.82177734375, 15.2608642578125, 15.699951171875, 16.1390380859375, 16.578125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 9.0, 2.0, 3.0, 8.0, 15.0, 9.0, 14.0, 21.0, 30.0, 41.0, 61.0, 82.0, 113.0, 217.0, 278.0, 443.0, 645.0, 1084.0, 1814.0, 4142.0, 10422.0, 36338.0, 436843.0, 3625341.0, 52674.0, 13229.0, 4936.0, 2182.0, 1213.0, 665.0, 417.0, 305.0, 212.0, 131.0, 78.0, 79.0, 52.0, 40.0, 24.0, 23.0, 13.0, 8.0, 9.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0], "bins": [-49.125, -47.7646484375, -46.404296875, -45.0439453125, -43.68359375, -42.3232421875, -40.962890625, -39.6025390625, -38.2421875, -36.8818359375, -35.521484375, -34.1611328125, -32.80078125, -31.4404296875, -30.080078125, -28.7197265625, -27.359375, -25.9990234375, -24.638671875, -23.2783203125, -21.91796875, -20.5576171875, -19.197265625, -17.8369140625, -16.4765625, -15.1162109375, -13.755859375, -12.3955078125, -11.03515625, -9.6748046875, -8.314453125, -6.9541015625, -5.59375, -4.2333984375, -2.873046875, -1.5126953125, -0.15234375, 1.2080078125, 2.568359375, 3.9287109375, 5.2890625, 6.6494140625, 8.009765625, 9.3701171875, 10.73046875, 12.0908203125, 13.451171875, 14.8115234375, 16.171875, 17.5322265625, 18.892578125, 20.2529296875, 21.61328125, 22.9736328125, 24.333984375, 25.6943359375, 27.0546875, 28.4150390625, 29.775390625, 31.1357421875, 32.49609375, 33.8564453125, 35.216796875, 36.5771484375, 37.9375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 5.0, 4.0, 4.0, 11.0, 9.0, 27.0, 41.0, 67.0, 144.0, 2443.0, 975.0, 148.0, 77.0, 30.0, 26.0, 18.0, 10.0, 7.0, 4.0, 10.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.625, -25.95849609375, -25.2919921875, -24.62548828125, -23.958984375, -23.29248046875, -22.6259765625, -21.95947265625, -21.29296875, -20.62646484375, -19.9599609375, -19.29345703125, -18.626953125, -17.96044921875, -17.2939453125, -16.62744140625, -15.9609375, -15.29443359375, -14.6279296875, -13.96142578125, -13.294921875, -12.62841796875, -11.9619140625, -11.29541015625, -10.62890625, -9.96240234375, -9.2958984375, -8.62939453125, -7.962890625, -7.29638671875, -6.6298828125, -5.96337890625, -5.296875, -4.63037109375, -3.9638671875, -3.29736328125, -2.630859375, -1.96435546875, -1.2978515625, -0.63134765625, 0.03515625, 0.70166015625, 1.3681640625, 2.03466796875, 2.701171875, 3.36767578125, 4.0341796875, 4.70068359375, 5.3671875, 6.03369140625, 6.7001953125, 7.36669921875, 8.033203125, 8.69970703125, 9.3662109375, 10.03271484375, 10.69921875, 11.36572265625, 12.0322265625, 12.69873046875, 13.365234375, 14.03173828125, 14.6982421875, 15.36474609375, 16.03125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 7.0, 7.0, 13.0, 11.0, 18.0, 32.0, 35.0, 53.0, 76.0, 84.0, 130.0, 130.0, 123.0, 79.0, 59.0, 52.0, 32.0, 22.0, 14.0, 2.0, 9.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-100.0392837524414, -97.57948303222656, -95.11967468261719, -92.65987396240234, -90.2000732421875, -87.74026489257812, -85.28046417236328, -82.82066345214844, -80.36085510253906, -77.90105438232422, -75.44124603271484, -72.9814453125, -70.52163696289062, -68.06183624267578, -65.60203552246094, -63.14223098754883, -60.68242645263672, -58.22262191772461, -55.7628173828125, -53.303016662597656, -50.84321212768555, -48.38340759277344, -45.923606872558594, -43.463802337646484, -41.003997802734375, -38.544193267822266, -36.084388732910156, -33.62458801269531, -31.164783477783203, -28.704978942871094, -26.245176315307617, -23.78537368774414, -21.32556915283203, -18.865764617919922, -16.405961990356445, -13.946158409118652, -11.48635482788086, -9.026551246643066, -6.566747665405273, -4.106945037841797, -1.6471405029296875, 0.8126630783081055, 3.2724666595458984, 5.732270240783691, 8.192073822021484, 10.651877403259277, 13.11168098449707, 15.571483612060547, 18.031288146972656, 20.491092681884766, 22.950895309448242, 25.41069793701172, 27.870502471923828, 30.330307006835938, 32.79010772705078, 35.24991226196289, 37.709716796875, 40.16952133178711, 42.62932586669922, 45.08912658691406, 47.54893112182617, 50.00873565673828, 52.468536376953125, 54.928340911865234, 57.388145446777344]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 13.0, 18.0, 10.0, 11.0, 18.0, 11.0, 20.0, 23.0, 22.0, 25.0, 42.0, 35.0, 44.0, 46.0, 35.0, 57.0, 41.0, 42.0, 55.0, 46.0, 41.0, 33.0, 42.0, 37.0, 28.0, 29.0, 28.0, 25.0, 17.0, 16.0, 22.0, 11.0, 10.0, 10.0, 7.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.80430603027344, -43.32239532470703, -41.84048843383789, -40.358577728271484, -38.87666702270508, -37.39475631713867, -35.91284942626953, -34.430938720703125, -32.94902801513672, -31.467119216918945, -29.98520851135254, -28.503299713134766, -27.02138900756836, -25.539480209350586, -24.057571411132812, -22.575660705566406, -21.093751907348633, -19.61184310913086, -18.129932403564453, -16.64802360534668, -15.166112899780273, -13.6842041015625, -12.20229434967041, -10.72038459777832, -9.23847484588623, -7.756565093994141, -6.274655342102051, -4.792746067047119, -3.3108363151550293, -1.8289265632629395, -0.3470172882080078, 1.134892463684082, 2.616802215576172, 4.098711967468262, 5.580621719360352, 7.062530994415283, 8.544441223144531, 10.026350021362305, 11.508259773254395, 12.990169525146484, 14.472079277038574, 15.953989028930664, 17.435897827148438, 18.917808532714844, 20.399717330932617, 21.881628036499023, 23.363536834716797, 24.845447540283203, 26.327356338500977, 27.80926513671875, 29.291175842285156, 30.77308464050293, 32.2549934387207, 33.73690414428711, 35.218814849853516, 36.700721740722656, 38.18263244628906, 39.66454315185547, 41.14645004272461, 42.628360748291016, 44.11027145385742, 45.59218215942383, 47.07408905029297, 48.555999755859375, 50.03791046142578]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 10.0, 10.0, 15.0, 18.0, 37.0, 66.0, 94.0, 228.0, 530.0, 1512.0, 4490.0, 16565.0, 68036.0, 278272.0, 486094.0, 144262.0, 35300.0, 8895.0, 2565.0, 861.0, 344.0, 161.0, 91.0, 38.0, 21.0, 10.0, 11.0, 6.0, 5.0, 9.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.34375, -43.9384765625, -42.533203125, -41.1279296875, -39.72265625, -38.3173828125, -36.912109375, -35.5068359375, -34.1015625, -32.6962890625, -31.291015625, -29.8857421875, -28.48046875, -27.0751953125, -25.669921875, -24.2646484375, -22.859375, -21.4541015625, -20.048828125, -18.6435546875, -17.23828125, -15.8330078125, -14.427734375, -13.0224609375, -11.6171875, -10.2119140625, -8.806640625, -7.4013671875, -5.99609375, -4.5908203125, -3.185546875, -1.7802734375, -0.375, 1.0302734375, 2.435546875, 3.8408203125, 5.24609375, 6.6513671875, 8.056640625, 9.4619140625, 10.8671875, 12.2724609375, 13.677734375, 15.0830078125, 16.48828125, 17.8935546875, 19.298828125, 20.7041015625, 22.109375, 23.5146484375, 24.919921875, 26.3251953125, 27.73046875, 29.1357421875, 30.541015625, 31.9462890625, 33.3515625, 34.7568359375, 36.162109375, 37.5673828125, 38.97265625, 40.3779296875, 41.783203125, 43.1884765625, 44.59375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 5.0, 3.0, 8.0, 12.0, 11.0, 17.0, 16.0, 33.0, 38.0, 36.0, 42.0, 40.0, 47.0, 56.0, 66.0, 61.0, 72.0, 62.0, 50.0, 46.0, 42.0, 47.0, 41.0, 20.0, 26.0, 26.0, 18.0, 15.0, 11.0, 7.0, 7.0, 4.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.21875, -11.75341796875, -11.2880859375, -10.82275390625, -10.357421875, -9.89208984375, -9.4267578125, -8.96142578125, -8.49609375, -8.03076171875, -7.5654296875, -7.10009765625, -6.634765625, -6.16943359375, -5.7041015625, -5.23876953125, -4.7734375, -4.30810546875, -3.8427734375, -3.37744140625, -2.912109375, -2.44677734375, -1.9814453125, -1.51611328125, -1.05078125, -0.58544921875, -0.1201171875, 0.34521484375, 0.810546875, 1.27587890625, 1.7412109375, 2.20654296875, 2.671875, 3.13720703125, 3.6025390625, 4.06787109375, 4.533203125, 4.99853515625, 5.4638671875, 5.92919921875, 6.39453125, 6.85986328125, 7.3251953125, 7.79052734375, 8.255859375, 8.72119140625, 9.1865234375, 9.65185546875, 10.1171875, 10.58251953125, 11.0478515625, 11.51318359375, 11.978515625, 12.44384765625, 12.9091796875, 13.37451171875, 13.83984375, 14.30517578125, 14.7705078125, 15.23583984375, 15.701171875, 16.16650390625, 16.6318359375, 17.09716796875, 17.5625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 10.0, 5.0, 11.0, 14.0, 22.0, 30.0, 22.0, 38.0, 67.0, 101.0, 172.0, 267.0, 421.0, 821.0, 1788.0, 4884.0, 23710.0, 295515.0, 657395.0, 50644.0, 7748.0, 2474.0, 1003.0, 567.0, 290.0, 193.0, 109.0, 55.0, 50.0, 28.0, 23.0, 27.0, 24.0, 7.0, 9.0, 9.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.1875, -73.8193359375, -71.451171875, -69.0830078125, -66.71484375, -64.3466796875, -61.978515625, -59.6103515625, -57.2421875, -54.8740234375, -52.505859375, -50.1376953125, -47.76953125, -45.4013671875, -43.033203125, -40.6650390625, -38.296875, -35.9287109375, -33.560546875, -31.1923828125, -28.82421875, -26.4560546875, -24.087890625, -21.7197265625, -19.3515625, -16.9833984375, -14.615234375, -12.2470703125, -9.87890625, -7.5107421875, -5.142578125, -2.7744140625, -0.40625, 1.9619140625, 4.330078125, 6.6982421875, 9.06640625, 11.4345703125, 13.802734375, 16.1708984375, 18.5390625, 20.9072265625, 23.275390625, 25.6435546875, 28.01171875, 30.3798828125, 32.748046875, 35.1162109375, 37.484375, 39.8525390625, 42.220703125, 44.5888671875, 46.95703125, 49.3251953125, 51.693359375, 54.0615234375, 56.4296875, 58.7978515625, 61.166015625, 63.5341796875, 65.90234375, 68.2705078125, 70.638671875, 73.0068359375, 75.375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 12.0, 5.0, 13.0, 14.0, 25.0, 25.0, 24.0, 29.0, 29.0, 41.0, 52.0, 51.0, 57.0, 59.0, 63.0, 59.0, 57.0, 40.0, 52.0, 61.0, 32.0, 27.0, 19.0, 29.0, 29.0, 19.0, 11.0, 15.0, 9.0, 8.0, 9.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0], "bins": [-78.0, -75.94775390625, -73.8955078125, -71.84326171875, -69.791015625, -67.73876953125, -65.6865234375, -63.63427734375, -61.58203125, -59.52978515625, -57.4775390625, -55.42529296875, -53.373046875, -51.32080078125, -49.2685546875, -47.21630859375, -45.1640625, -43.11181640625, -41.0595703125, -39.00732421875, -36.955078125, -34.90283203125, -32.8505859375, -30.79833984375, -28.74609375, -26.69384765625, -24.6416015625, -22.58935546875, -20.537109375, -18.48486328125, -16.4326171875, -14.38037109375, -12.328125, -10.27587890625, -8.2236328125, -6.17138671875, -4.119140625, -2.06689453125, -0.0146484375, 2.03759765625, 4.08984375, 6.14208984375, 8.1943359375, 10.24658203125, 12.298828125, 14.35107421875, 16.4033203125, 18.45556640625, 20.5078125, 22.56005859375, 24.6123046875, 26.66455078125, 28.716796875, 30.76904296875, 32.8212890625, 34.87353515625, 36.92578125, 38.97802734375, 41.0302734375, 43.08251953125, 45.134765625, 47.18701171875, 49.2392578125, 51.29150390625, 53.34375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 4.0, 6.0, 11.0, 15.0, 15.0, 17.0, 35.0, 32.0, 38.0, 60.0, 58.0, 115.0, 189.0, 292.0, 397.0, 646.0, 1033.0, 1867.0, 3555.0, 9017.0, 38219.0, 290303.0, 597948.0, 78763.0, 14932.0, 5103.0, 2271.0, 1305.0, 762.0, 513.0, 333.0, 206.0, 129.0, 96.0, 87.0, 57.0, 40.0, 23.0, 18.0, 10.0, 10.0, 3.0, 5.0, 5.0, 0.0, 4.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-21.5, -20.810791015625, -20.12158203125, -19.432373046875, -18.7431640625, -18.053955078125, -17.36474609375, -16.675537109375, -15.986328125, -15.297119140625, -14.60791015625, -13.918701171875, -13.2294921875, -12.540283203125, -11.85107421875, -11.161865234375, -10.47265625, -9.783447265625, -9.09423828125, -8.405029296875, -7.7158203125, -7.026611328125, -6.33740234375, -5.648193359375, -4.958984375, -4.269775390625, -3.58056640625, -2.891357421875, -2.2021484375, -1.512939453125, -0.82373046875, -0.134521484375, 0.5546875, 1.243896484375, 1.93310546875, 2.622314453125, 3.3115234375, 4.000732421875, 4.68994140625, 5.379150390625, 6.068359375, 6.757568359375, 7.44677734375, 8.135986328125, 8.8251953125, 9.514404296875, 10.20361328125, 10.892822265625, 11.58203125, 12.271240234375, 12.96044921875, 13.649658203125, 14.3388671875, 15.028076171875, 15.71728515625, 16.406494140625, 17.095703125, 17.784912109375, 18.47412109375, 19.163330078125, 19.8525390625, 20.541748046875, 21.23095703125, 21.920166015625, 22.609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 13.0, 24.0, 37.0, 59.0, 94.0, 196.0, 238.0, 134.0, 81.0, 50.0, 23.0, 22.0, 10.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.01397705078125, -0.013590455055236816, -0.013203859329223633, -0.01281726360321045, -0.012430667877197266, -0.012044072151184082, -0.011657476425170898, -0.011270880699157715, -0.010884284973144531, -0.010497689247131348, -0.010111093521118164, -0.00972449779510498, -0.009337902069091797, -0.008951306343078613, -0.00856471061706543, -0.008178114891052246, -0.0077915191650390625, -0.007404923439025879, -0.007018327713012695, -0.006631731986999512, -0.006245136260986328, -0.0058585405349731445, -0.005471944808959961, -0.005085349082946777, -0.004698753356933594, -0.00431215763092041, -0.0039255619049072266, -0.003538966178894043, -0.0031523704528808594, -0.0027657747268676758, -0.002379179000854492, -0.0019925832748413086, -0.001605987548828125, -0.0012193918228149414, -0.0008327960968017578, -0.0004462003707885742, -5.9604644775390625e-05, 0.00032699108123779297, 0.0007135868072509766, 0.0011001825332641602, 0.0014867782592773438, 0.0018733739852905273, 0.002259969711303711, 0.0026465654373168945, 0.003033161163330078, 0.0034197568893432617, 0.0038063526153564453, 0.004192948341369629, 0.0045795440673828125, 0.004966139793395996, 0.00535273551940918, 0.005739331245422363, 0.006125926971435547, 0.0065125226974487305, 0.006899118423461914, 0.007285714149475098, 0.007672309875488281, 0.008058905601501465, 0.008445501327514648, 0.008832097053527832, 0.009218692779541016, 0.0096052885055542, 0.009991884231567383, 0.010378479957580566, 0.01076507568359375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 5.0, 6.0, 3.0, 9.0, 10.0, 11.0, 14.0, 13.0, 25.0, 32.0, 62.0, 71.0, 84.0, 168.0, 264.0, 431.0, 919.0, 2041.0, 5364.0, 22726.0, 233137.0, 695807.0, 70249.0, 10937.0, 3255.0, 1310.0, 646.0, 307.0, 206.0, 120.0, 90.0, 48.0, 39.0, 22.0, 27.0, 18.0, 15.0, 12.0, 10.0, 11.0, 8.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.4375, -24.6240234375, -23.810546875, -22.9970703125, -22.18359375, -21.3701171875, -20.556640625, -19.7431640625, -18.9296875, -18.1162109375, -17.302734375, -16.4892578125, -15.67578125, -14.8623046875, -14.048828125, -13.2353515625, -12.421875, -11.6083984375, -10.794921875, -9.9814453125, -9.16796875, -8.3544921875, -7.541015625, -6.7275390625, -5.9140625, -5.1005859375, -4.287109375, -3.4736328125, -2.66015625, -1.8466796875, -1.033203125, -0.2197265625, 0.59375, 1.4072265625, 2.220703125, 3.0341796875, 3.84765625, 4.6611328125, 5.474609375, 6.2880859375, 7.1015625, 7.9150390625, 8.728515625, 9.5419921875, 10.35546875, 11.1689453125, 11.982421875, 12.7958984375, 13.609375, 14.4228515625, 15.236328125, 16.0498046875, 16.86328125, 17.6767578125, 18.490234375, 19.3037109375, 20.1171875, 20.9306640625, 21.744140625, 22.5576171875, 23.37109375, 24.1845703125, 24.998046875, 25.8115234375, 26.625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 7.0, 17.0, 15.0, 22.0, 22.0, 41.0, 50.0, 77.0, 113.0, 101.0, 116.0, 93.0, 68.0, 73.0, 45.0, 30.0, 21.0, 19.0, 10.0, 12.0, 8.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.921875, -23.131103515625, -22.34033203125, -21.549560546875, -20.7587890625, -19.968017578125, -19.17724609375, -18.386474609375, -17.595703125, -16.804931640625, -16.01416015625, -15.223388671875, -14.4326171875, -13.641845703125, -12.85107421875, -12.060302734375, -11.26953125, -10.478759765625, -9.68798828125, -8.897216796875, -8.1064453125, -7.315673828125, -6.52490234375, -5.734130859375, -4.943359375, -4.152587890625, -3.36181640625, -2.571044921875, -1.7802734375, -0.989501953125, -0.19873046875, 0.592041015625, 1.3828125, 2.173583984375, 2.96435546875, 3.755126953125, 4.5458984375, 5.336669921875, 6.12744140625, 6.918212890625, 7.708984375, 8.499755859375, 9.29052734375, 10.081298828125, 10.8720703125, 11.662841796875, 12.45361328125, 13.244384765625, 14.03515625, 14.825927734375, 15.61669921875, 16.407470703125, 17.1982421875, 17.989013671875, 18.77978515625, 19.570556640625, 20.361328125, 21.152099609375, 21.94287109375, 22.733642578125, 23.5244140625, 24.315185546875, 25.10595703125, 25.896728515625, 26.6875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 28.0, 51.0, 140.0, 256.0, 241.0, 179.0, 66.0, 17.0, 11.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-515.661376953125, -491.096923828125, -466.5324401855469, -441.9679870605469, -417.40350341796875, -392.83905029296875, -368.27459716796875, -343.71014404296875, -319.1456604003906, -294.5812072753906, -270.0167236328125, -245.4522705078125, -220.88780212402344, -196.32333374023438, -171.75888061523438, -147.1944122314453, -122.62994384765625, -98.06547546386719, -73.50101470947266, -48.936553955078125, -24.372085571289062, 0.1923828125, 24.7568359375, 49.32130432128906, 73.88577270507812, 98.45024108886719, 123.01470184326172, 147.57916259765625, 172.1436309814453, 196.70809936523438, 221.27255249023438, 245.83702087402344, 270.4014892578125, 294.9659423828125, 319.5304260253906, 344.0948791503906, 368.65936279296875, 393.22381591796875, 417.78826904296875, 442.35272216796875, 466.9172058105469, 491.4816589355469, 516.046142578125, 540.610595703125, 565.175048828125, 589.739501953125, 614.303955078125, 638.8684692382812, 663.4329223632812, 687.9973754882812, 712.5618286132812, 737.1263427734375, 761.6907958984375, 786.2552490234375, 810.8197021484375, 835.3841552734375, 859.9486083984375, 884.5130615234375, 909.0775146484375, 933.6419677734375, 958.2064819335938, 982.7709350585938, 1007.3353881835938, 1031.89990234375, 1056.46435546875]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 7.0, 5.0, 5.0, 8.0, 17.0, 20.0, 33.0, 22.0, 21.0, 22.0, 30.0, 50.0, 30.0, 36.0, 48.0, 45.0, 40.0, 40.0, 50.0, 48.0, 45.0, 42.0, 39.0, 34.0, 28.0, 39.0, 31.0, 30.0, 23.0, 18.0, 11.0, 13.0, 10.0, 10.0, 9.0, 11.0, 6.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-221.60385131835938, -213.53805541992188, -205.47225952148438, -197.40646362304688, -189.34066772460938, -181.27487182617188, -173.20907592773438, -165.14328002929688, -157.07748413085938, -149.01168823242188, -140.94589233398438, -132.88009643554688, -124.81430053710938, -116.74850463867188, -108.68270874023438, -100.61691284179688, -92.55111694335938, -84.48532104492188, -76.41952514648438, -68.35372924804688, -60.287933349609375, -52.222137451171875, -44.156341552734375, -36.090545654296875, -28.024749755859375, -19.958953857421875, -11.893157958984375, -3.827362060546875, 4.238433837890625, 12.304229736328125, 20.370025634765625, 28.435821533203125, 36.50164794921875, 44.56744384765625, 52.63323974609375, 60.69903564453125, 68.76483154296875, 76.83062744140625, 84.89642333984375, 92.96221923828125, 101.02801513671875, 109.09381103515625, 117.15960693359375, 125.22540283203125, 133.29119873046875, 141.35699462890625, 149.42279052734375, 157.48858642578125, 165.55438232421875, 173.62017822265625, 181.68597412109375, 189.75177001953125, 197.81756591796875, 205.88336181640625, 213.94915771484375, 222.01495361328125, 230.08074951171875, 238.14654541015625, 246.21234130859375, 254.27813720703125, 262.34393310546875, 270.40972900390625, 278.47552490234375, 286.54132080078125, 294.60711669921875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 1.0, 3.0, 2.0, 6.0, 7.0, 13.0, 28.0, 41.0, 73.0, 130.0, 310.0, 934.0, 3796.0, 22337.0, 391578.0, 3667322.0, 93952.0, 10779.0, 2105.0, 557.0, 180.0, 69.0, 30.0, 17.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-81.4375, -79.715576171875, -77.99365234375, -76.271728515625, -74.5498046875, -72.827880859375, -71.10595703125, -69.384033203125, -67.662109375, -65.940185546875, -64.21826171875, -62.496337890625, -60.7744140625, -59.052490234375, -57.33056640625, -55.608642578125, -53.88671875, -52.164794921875, -50.44287109375, -48.720947265625, -46.9990234375, -45.277099609375, -43.55517578125, -41.833251953125, -40.111328125, -38.389404296875, -36.66748046875, -34.945556640625, -33.2236328125, -31.501708984375, -29.77978515625, -28.057861328125, -26.3359375, -24.614013671875, -22.89208984375, -21.170166015625, -19.4482421875, -17.726318359375, -16.00439453125, -14.282470703125, -12.560546875, -10.838623046875, -9.11669921875, -7.394775390625, -5.6728515625, -3.950927734375, -2.22900390625, -0.507080078125, 1.21484375, 2.936767578125, 4.65869140625, 6.380615234375, 8.1025390625, 9.824462890625, 11.54638671875, 13.268310546875, 14.990234375, 16.712158203125, 18.43408203125, 20.156005859375, 21.8779296875, 23.599853515625, 25.32177734375, 27.043701171875, 28.765625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 7.0, 6.0, 12.0, 14.0, 21.0, 13.0, 19.0, 45.0, 49.0, 43.0, 40.0, 53.0, 73.0, 72.0, 66.0, 73.0, 62.0, 50.0, 57.0, 47.0, 32.0, 36.0, 21.0, 23.0, 19.0, 10.0, 11.0, 9.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.09375, -18.595947265625, -18.09814453125, -17.600341796875, -17.1025390625, -16.604736328125, -16.10693359375, -15.609130859375, -15.111328125, -14.613525390625, -14.11572265625, -13.617919921875, -13.1201171875, -12.622314453125, -12.12451171875, -11.626708984375, -11.12890625, -10.631103515625, -10.13330078125, -9.635498046875, -9.1376953125, -8.639892578125, -8.14208984375, -7.644287109375, -7.146484375, -6.648681640625, -6.15087890625, -5.653076171875, -5.1552734375, -4.657470703125, -4.15966796875, -3.661865234375, -3.1640625, -2.666259765625, -2.16845703125, -1.670654296875, -1.1728515625, -0.675048828125, -0.17724609375, 0.320556640625, 0.818359375, 1.316162109375, 1.81396484375, 2.311767578125, 2.8095703125, 3.307373046875, 3.80517578125, 4.302978515625, 4.80078125, 5.298583984375, 5.79638671875, 6.294189453125, 6.7919921875, 7.289794921875, 7.78759765625, 8.285400390625, 8.783203125, 9.281005859375, 9.77880859375, 10.276611328125, 10.7744140625, 11.272216796875, 11.77001953125, 12.267822265625, 12.765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 2.0, 7.0, 14.0, 17.0, 22.0, 39.0, 67.0, 115.0, 246.0, 725.0, 2549.0, 13152.0, 144688.0, 3818930.0, 193980.0, 15706.0, 2809.0, 711.0, 237.0, 118.0, 63.0, 27.0, 18.0, 13.0, 9.0, 8.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.25, -54.130859375, -52.01171875, -49.892578125, -47.7734375, -45.654296875, -43.53515625, -41.416015625, -39.296875, -37.177734375, -35.05859375, -32.939453125, -30.8203125, -28.701171875, -26.58203125, -24.462890625, -22.34375, -20.224609375, -18.10546875, -15.986328125, -13.8671875, -11.748046875, -9.62890625, -7.509765625, -5.390625, -3.271484375, -1.15234375, 0.966796875, 3.0859375, 5.205078125, 7.32421875, 9.443359375, 11.5625, 13.681640625, 15.80078125, 17.919921875, 20.0390625, 22.158203125, 24.27734375, 26.396484375, 28.515625, 30.634765625, 32.75390625, 34.873046875, 36.9921875, 39.111328125, 41.23046875, 43.349609375, 45.46875, 47.587890625, 49.70703125, 51.826171875, 53.9453125, 56.064453125, 58.18359375, 60.302734375, 62.421875, 64.541015625, 66.66015625, 68.779296875, 70.8984375, 73.017578125, 75.13671875, 77.255859375, 79.375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 6.0, 8.0, 7.0, 6.0, 12.0, 8.0, 23.0, 27.0, 40.0, 47.0, 74.0, 129.0, 261.0, 508.0, 1054.0, 877.0, 401.0, 208.0, 124.0, 72.0, 44.0, 31.0, 22.0, 25.0, 15.0, 16.0, 7.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.0, -47.59619140625, -46.1923828125, -44.78857421875, -43.384765625, -41.98095703125, -40.5771484375, -39.17333984375, -37.76953125, -36.36572265625, -34.9619140625, -33.55810546875, -32.154296875, -30.75048828125, -29.3466796875, -27.94287109375, -26.5390625, -25.13525390625, -23.7314453125, -22.32763671875, -20.923828125, -19.52001953125, -18.1162109375, -16.71240234375, -15.30859375, -13.90478515625, -12.5009765625, -11.09716796875, -9.693359375, -8.28955078125, -6.8857421875, -5.48193359375, -4.078125, -2.67431640625, -1.2705078125, 0.13330078125, 1.537109375, 2.94091796875, 4.3447265625, 5.74853515625, 7.15234375, 8.55615234375, 9.9599609375, 11.36376953125, 12.767578125, 14.17138671875, 15.5751953125, 16.97900390625, 18.3828125, 19.78662109375, 21.1904296875, 22.59423828125, 23.998046875, 25.40185546875, 26.8056640625, 28.20947265625, 29.61328125, 31.01708984375, 32.4208984375, 33.82470703125, 35.228515625, 36.63232421875, 38.0361328125, 39.43994140625, 40.84375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 9.0, 16.0, 42.0, 89.0, 164.0, 234.0, 218.0, 116.0, 58.0, 29.0, 7.0, 10.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-739.2955322265625, -722.4287719726562, -705.56201171875, -688.6952514648438, -671.8284912109375, -654.9617309570312, -638.094970703125, -621.2282104492188, -604.3614501953125, -587.4946899414062, -570.6279296875, -553.7611694335938, -536.8944091796875, -520.0276489257812, -503.160888671875, -486.29412841796875, -469.4273986816406, -452.5606384277344, -435.6938781738281, -418.8271179199219, -401.9603576660156, -385.0935974121094, -368.22686767578125, -351.360107421875, -334.49334716796875, -317.6265869140625, -300.75982666015625, -283.89306640625, -267.02630615234375, -250.1595458984375, -233.2928009033203, -216.42604064941406, -199.55929565429688, -182.69253540039062, -165.82577514648438, -148.95901489257812, -132.09225463867188, -115.22550201416016, -98.35874938964844, -81.49198913574219, -64.62522888183594, -47.75846862792969, -30.891712188720703, -14.024955749511719, 2.8418045043945312, 19.70856475830078, 36.5753173828125, 53.44207763671875, 70.308837890625, 87.17559814453125, 104.0423583984375, 120.90911102294922, 137.77587890625, 154.64263916015625, 171.50938415527344, 188.3761444091797, 205.24290466308594, 222.1096649169922, 238.97642517089844, 255.84317016601562, 272.7099304199219, 289.5766906738281, 306.4434509277344, 323.3102111816406, 340.1769714355469]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 7.0, 6.0, 7.0, 9.0, 20.0, 16.0, 28.0, 22.0, 27.0, 44.0, 35.0, 46.0, 51.0, 63.0, 46.0, 31.0, 47.0, 55.0, 45.0, 49.0, 43.0, 41.0, 42.0, 31.0, 29.0, 24.0, 27.0, 24.0, 13.0, 14.0, 16.0, 10.0, 7.0, 4.0, 4.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-211.08856201171875, -204.92901611328125, -198.7694549560547, -192.6099090576172, -186.4503631591797, -180.29080200195312, -174.13125610351562, -167.97171020507812, -161.81216430664062, -155.65261840820312, -149.49305725097656, -143.33351135253906, -137.17396545410156, -131.014404296875, -124.8548583984375, -118.6953125, -112.53575134277344, -106.3761978149414, -100.2166519165039, -94.05709838867188, -87.89755249023438, -81.73799896240234, -75.57844543457031, -69.41889953613281, -63.25934600830078, -57.099796295166016, -50.94024658203125, -44.78069305419922, -38.62114334106445, -32.46159362792969, -26.302040100097656, -20.14249038696289, -13.982925415039062, -7.8233747482299805, -1.6638240814208984, 4.4957275390625, 10.655277252197266, 16.81482696533203, 22.974380493164062, 29.133930206298828, 35.293479919433594, 41.45302963256836, 47.612579345703125, 53.772132873535156, 59.93168258666992, 66.09123229980469, 72.25078582763672, 78.41033935546875, 84.56988525390625, 90.72943878173828, 96.88898468017578, 103.04853820800781, 109.20808410644531, 115.36763763427734, 121.52719116210938, 127.68673706054688, 133.84628295898438, 140.00582885742188, 146.16539001464844, 152.32493591308594, 158.48448181152344, 164.64404296875, 170.8035888671875, 176.963134765625, 183.12269592285156]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 0.0, 8.0, 11.0, 6.0, 14.0, 34.0, 50.0, 87.0, 139.0, 262.0, 475.0, 899.0, 1792.0, 4089.0, 9252.0, 23853.0, 66415.0, 210059.0, 435495.0, 194954.0, 61986.0, 22037.0, 8944.0, 3975.0, 1705.0, 962.0, 461.0, 265.0, 129.0, 74.0, 50.0, 31.0, 10.0, 17.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.0625, -34.014892578125, -32.96728515625, -31.919677734375, -30.8720703125, -29.824462890625, -28.77685546875, -27.729248046875, -26.681640625, -25.634033203125, -24.58642578125, -23.538818359375, -22.4912109375, -21.443603515625, -20.39599609375, -19.348388671875, -18.30078125, -17.253173828125, -16.20556640625, -15.157958984375, -14.1103515625, -13.062744140625, -12.01513671875, -10.967529296875, -9.919921875, -8.872314453125, -7.82470703125, -6.777099609375, -5.7294921875, -4.681884765625, -3.63427734375, -2.586669921875, -1.5390625, -0.491455078125, 0.55615234375, 1.603759765625, 2.6513671875, 3.698974609375, 4.74658203125, 5.794189453125, 6.841796875, 7.889404296875, 8.93701171875, 9.984619140625, 11.0322265625, 12.079833984375, 13.12744140625, 14.175048828125, 15.22265625, 16.270263671875, 17.31787109375, 18.365478515625, 19.4130859375, 20.460693359375, 21.50830078125, 22.555908203125, 23.603515625, 24.651123046875, 25.69873046875, 26.746337890625, 27.7939453125, 28.841552734375, 29.88916015625, 30.936767578125, 31.984375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 6.0, 5.0, 7.0, 7.0, 8.0, 7.0, 18.0, 13.0, 22.0, 19.0, 22.0, 27.0, 36.0, 36.0, 37.0, 42.0, 40.0, 46.0, 58.0, 46.0, 62.0, 49.0, 37.0, 36.0, 44.0, 35.0, 39.0, 34.0, 22.0, 26.0, 24.0, 16.0, 20.0, 9.0, 10.0, 7.0, 13.0, 5.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.4375, -12.0577392578125, -11.677978515625, -11.2982177734375, -10.91845703125, -10.5386962890625, -10.158935546875, -9.7791748046875, -9.3994140625, -9.0196533203125, -8.639892578125, -8.2601318359375, -7.88037109375, -7.5006103515625, -7.120849609375, -6.7410888671875, -6.361328125, -5.9815673828125, -5.601806640625, -5.2220458984375, -4.84228515625, -4.4625244140625, -4.082763671875, -3.7030029296875, -3.3232421875, -2.9434814453125, -2.563720703125, -2.1839599609375, -1.80419921875, -1.4244384765625, -1.044677734375, -0.6649169921875, -0.28515625, 0.0946044921875, 0.474365234375, 0.8541259765625, 1.23388671875, 1.6136474609375, 1.993408203125, 2.3731689453125, 2.7529296875, 3.1326904296875, 3.512451171875, 3.8922119140625, 4.27197265625, 4.6517333984375, 5.031494140625, 5.4112548828125, 5.791015625, 6.1707763671875, 6.550537109375, 6.9302978515625, 7.31005859375, 7.6898193359375, 8.069580078125, 8.4493408203125, 8.8291015625, 9.2088623046875, 9.588623046875, 9.9683837890625, 10.34814453125, 10.7279052734375, 11.107666015625, 11.4874267578125, 11.8671875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 8.0, 16.0, 20.0, 28.0, 36.0, 59.0, 68.0, 121.0, 164.0, 291.0, 482.0, 909.0, 1703.0, 4428.0, 17443.0, 133714.0, 777264.0, 90996.0, 13398.0, 3782.0, 1653.0, 765.0, 423.0, 268.0, 169.0, 105.0, 66.0, 31.0, 36.0, 29.0, 13.0, 11.0, 15.0, 8.0, 6.0, 6.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.9375, -68.5263671875, -66.115234375, -63.7041015625, -61.29296875, -58.8818359375, -56.470703125, -54.0595703125, -51.6484375, -49.2373046875, -46.826171875, -44.4150390625, -42.00390625, -39.5927734375, -37.181640625, -34.7705078125, -32.359375, -29.9482421875, -27.537109375, -25.1259765625, -22.71484375, -20.3037109375, -17.892578125, -15.4814453125, -13.0703125, -10.6591796875, -8.248046875, -5.8369140625, -3.42578125, -1.0146484375, 1.396484375, 3.8076171875, 6.21875, 8.6298828125, 11.041015625, 13.4521484375, 15.86328125, 18.2744140625, 20.685546875, 23.0966796875, 25.5078125, 27.9189453125, 30.330078125, 32.7412109375, 35.15234375, 37.5634765625, 39.974609375, 42.3857421875, 44.796875, 47.2080078125, 49.619140625, 52.0302734375, 54.44140625, 56.8525390625, 59.263671875, 61.6748046875, 64.0859375, 66.4970703125, 68.908203125, 71.3193359375, 73.73046875, 76.1416015625, 78.552734375, 80.9638671875, 83.375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 6.0, 10.0, 14.0, 11.0, 25.0, 26.0, 38.0, 46.0, 57.0, 52.0, 58.0, 55.0, 76.0, 66.0, 69.0, 65.0, 54.0, 38.0, 50.0, 34.0, 32.0, 26.0, 25.0, 10.0, 8.0, 8.0, 10.0, 6.0, 3.0, 4.0, 0.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.8125, -61.259765625, -58.70703125, -56.154296875, -53.6015625, -51.048828125, -48.49609375, -45.943359375, -43.390625, -40.837890625, -38.28515625, -35.732421875, -33.1796875, -30.626953125, -28.07421875, -25.521484375, -22.96875, -20.416015625, -17.86328125, -15.310546875, -12.7578125, -10.205078125, -7.65234375, -5.099609375, -2.546875, 0.005859375, 2.55859375, 5.111328125, 7.6640625, 10.216796875, 12.76953125, 15.322265625, 17.875, 20.427734375, 22.98046875, 25.533203125, 28.0859375, 30.638671875, 33.19140625, 35.744140625, 38.296875, 40.849609375, 43.40234375, 45.955078125, 48.5078125, 51.060546875, 53.61328125, 56.166015625, 58.71875, 61.271484375, 63.82421875, 66.376953125, 68.9296875, 71.482421875, 74.03515625, 76.587890625, 79.140625, 81.693359375, 84.24609375, 86.798828125, 89.3515625, 91.904296875, 94.45703125, 97.009765625, 99.5625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 11.0, 12.0, 17.0, 21.0, 34.0, 48.0, 49.0, 91.0, 174.0, 302.0, 453.0, 1200.0, 3484.0, 15459.0, 173898.0, 791178.0, 50857.0, 7423.0, 2076.0, 761.0, 364.0, 210.0, 127.0, 87.0, 57.0, 37.0, 29.0, 21.0, 17.0, 13.0, 9.0, 10.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.65625, -37.42041015625, -36.1845703125, -34.94873046875, -33.712890625, -32.47705078125, -31.2412109375, -30.00537109375, -28.76953125, -27.53369140625, -26.2978515625, -25.06201171875, -23.826171875, -22.59033203125, -21.3544921875, -20.11865234375, -18.8828125, -17.64697265625, -16.4111328125, -15.17529296875, -13.939453125, -12.70361328125, -11.4677734375, -10.23193359375, -8.99609375, -7.76025390625, -6.5244140625, -5.28857421875, -4.052734375, -2.81689453125, -1.5810546875, -0.34521484375, 0.890625, 2.12646484375, 3.3623046875, 4.59814453125, 5.833984375, 7.06982421875, 8.3056640625, 9.54150390625, 10.77734375, 12.01318359375, 13.2490234375, 14.48486328125, 15.720703125, 16.95654296875, 18.1923828125, 19.42822265625, 20.6640625, 21.89990234375, 23.1357421875, 24.37158203125, 25.607421875, 26.84326171875, 28.0791015625, 29.31494140625, 30.55078125, 31.78662109375, 33.0224609375, 34.25830078125, 35.494140625, 36.72998046875, 37.9658203125, 39.20166015625, 40.4375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 20.0, 20.0, 21.0, 40.0, 55.0, 84.0, 120.0, 199.0, 133.0, 95.0, 46.0, 46.0, 28.0, 12.0, 17.0, 21.0, 4.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01050567626953125, -0.010217547416687012, -0.009929418563842773, -0.009641289710998535, -0.009353160858154297, -0.009065032005310059, -0.00877690315246582, -0.008488774299621582, -0.008200645446777344, -0.007912516593933105, -0.007624387741088867, -0.007336258888244629, -0.007048130035400391, -0.006760001182556152, -0.006471872329711914, -0.006183743476867676, -0.0058956146240234375, -0.005607485771179199, -0.005319356918334961, -0.005031228065490723, -0.004743099212646484, -0.004454970359802246, -0.004166841506958008, -0.0038787126541137695, -0.0035905838012695312, -0.003302454948425293, -0.0030143260955810547, -0.0027261972427368164, -0.002438068389892578, -0.00214993953704834, -0.0018618106842041016, -0.0015736818313598633, -0.001285552978515625, -0.0009974241256713867, -0.0007092952728271484, -0.00042116641998291016, -0.00013303756713867188, 0.0001550912857055664, 0.0004432201385498047, 0.000731348991394043, 0.0010194778442382812, 0.0013076066970825195, 0.0015957355499267578, 0.001883864402770996, 0.0021719932556152344, 0.0024601221084594727, 0.002748250961303711, 0.0030363798141479492, 0.0033245086669921875, 0.0036126375198364258, 0.003900766372680664, 0.004188895225524902, 0.004477024078369141, 0.004765152931213379, 0.005053281784057617, 0.0053414106369018555, 0.005629539489746094, 0.005917668342590332, 0.00620579719543457, 0.006493926048278809, 0.006782054901123047, 0.007070183753967285, 0.0073583126068115234, 0.007646441459655762, 0.0079345703125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 10.0, 14.0, 11.0, 27.0, 30.0, 31.0, 57.0, 101.0, 131.0, 222.0, 392.0, 781.0, 1822.0, 4895.0, 20933.0, 203279.0, 741770.0, 58644.0, 9768.0, 3029.0, 1201.0, 583.0, 309.0, 178.0, 106.0, 76.0, 45.0, 35.0, 16.0, 19.0, 9.0, 9.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-39.5625, -38.500732421875, -37.43896484375, -36.377197265625, -35.3154296875, -34.253662109375, -33.19189453125, -32.130126953125, -31.068359375, -30.006591796875, -28.94482421875, -27.883056640625, -26.8212890625, -25.759521484375, -24.69775390625, -23.635986328125, -22.57421875, -21.512451171875, -20.45068359375, -19.388916015625, -18.3271484375, -17.265380859375, -16.20361328125, -15.141845703125, -14.080078125, -13.018310546875, -11.95654296875, -10.894775390625, -9.8330078125, -8.771240234375, -7.70947265625, -6.647705078125, -5.5859375, -4.524169921875, -3.46240234375, -2.400634765625, -1.3388671875, -0.277099609375, 0.78466796875, 1.846435546875, 2.908203125, 3.969970703125, 5.03173828125, 6.093505859375, 7.1552734375, 8.217041015625, 9.27880859375, 10.340576171875, 11.40234375, 12.464111328125, 13.52587890625, 14.587646484375, 15.6494140625, 16.711181640625, 17.77294921875, 18.834716796875, 19.896484375, 20.958251953125, 22.02001953125, 23.081787109375, 24.1435546875, 25.205322265625, 26.26708984375, 27.328857421875, 28.390625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 4.0, 6.0, 1.0, 4.0, 4.0, 12.0, 9.0, 9.0, 11.0, 22.0, 36.0, 45.0, 55.0, 56.0, 89.0, 115.0, 108.0, 96.0, 85.0, 58.0, 40.0, 24.0, 32.0, 19.0, 14.0, 14.0, 5.0, 12.0, 5.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.09375, -36.147705078125, -35.20166015625, -34.255615234375, -33.3095703125, -32.363525390625, -31.41748046875, -30.471435546875, -29.525390625, -28.579345703125, -27.63330078125, -26.687255859375, -25.7412109375, -24.795166015625, -23.84912109375, -22.903076171875, -21.95703125, -21.010986328125, -20.06494140625, -19.118896484375, -18.1728515625, -17.226806640625, -16.28076171875, -15.334716796875, -14.388671875, -13.442626953125, -12.49658203125, -11.550537109375, -10.6044921875, -9.658447265625, -8.71240234375, -7.766357421875, -6.8203125, -5.874267578125, -4.92822265625, -3.982177734375, -3.0361328125, -2.090087890625, -1.14404296875, -0.197998046875, 0.748046875, 1.694091796875, 2.64013671875, 3.586181640625, 4.5322265625, 5.478271484375, 6.42431640625, 7.370361328125, 8.31640625, 9.262451171875, 10.20849609375, 11.154541015625, 12.1005859375, 13.046630859375, 13.99267578125, 14.938720703125, 15.884765625, 16.830810546875, 17.77685546875, 18.722900390625, 19.6689453125, 20.614990234375, 21.56103515625, 22.507080078125, 23.453125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 8.0, 17.0, 52.0, 149.0, 211.0, 289.0, 162.0, 50.0, 28.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1084.7186279296875, -1061.2403564453125, -1037.7620849609375, -1014.2838745117188, -990.8056640625, -967.327392578125, -943.84912109375, -920.3709106445312, -896.8926391601562, -873.4143676757812, -849.9361572265625, -826.4578857421875, -802.9796752929688, -779.5014038085938, -756.023193359375, -732.544921875, -709.066650390625, -685.58837890625, -662.1101684570312, -638.6318969726562, -615.1536865234375, -591.6754150390625, -568.1971435546875, -544.7189331054688, -521.24072265625, -497.7624816894531, -474.28424072265625, -450.80596923828125, -427.3277282714844, -403.8494873046875, -380.3712463378906, -356.89300537109375, -333.41473388671875, -309.9364929199219, -286.458251953125, -262.97998046875, -239.50173950195312, -216.02349853515625, -192.54525756835938, -169.06700134277344, -145.58876037597656, -122.11051177978516, -98.63226318359375, -75.15402221679688, -51.67577362060547, -28.197525024414062, -4.7192840576171875, 18.75897216796875, 42.237213134765625, 65.71546173095703, 89.19371032714844, 112.67195129394531, 136.15020751953125, 159.62844848632812, 183.106689453125, 206.58494567871094, 230.0631866455078, 253.5414276123047, 277.0196838378906, 300.4979248046875, 323.9761657714844, 347.45440673828125, 370.93267822265625, 394.4109191894531, 417.88916015625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 0.0, 6.0, 4.0, 6.0, 5.0, 10.0, 8.0, 7.0, 14.0, 18.0, 26.0, 30.0, 23.0, 27.0, 27.0, 31.0, 34.0, 38.0, 34.0, 40.0, 55.0, 38.0, 57.0, 41.0, 38.0, 30.0, 45.0, 35.0, 33.0, 37.0, 28.0, 19.0, 28.0, 23.0, 16.0, 23.0, 18.0, 9.0, 12.0, 8.0, 2.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-212.09805297851562, -205.34762573242188, -198.59719848632812, -191.84677124023438, -185.0963592529297, -178.34593200683594, -171.5955047607422, -164.84507751464844, -158.09466552734375, -151.34423828125, -144.59381103515625, -137.8433837890625, -131.0929718017578, -124.34254455566406, -117.59211730957031, -110.84169006347656, -104.09126281738281, -97.34083557128906, -90.59041595458984, -83.8399887084961, -77.08956909179688, -70.33914184570312, -63.588714599609375, -56.83829116821289, -50.087867736816406, -43.33744430541992, -36.58702087402344, -29.836593627929688, -23.086170196533203, -16.33574676513672, -9.585319519042969, -2.8348960876464844, 3.91552734375, 10.6659517288208, 17.4163761138916, 24.16680145263672, 30.917224884033203, 37.66764831542969, 44.41807556152344, 51.16849899291992, 57.918922424316406, 64.66934967041016, 71.41976928710938, 78.17019653320312, 84.92062377929688, 91.6710433959961, 98.42147064208984, 105.17189025878906, 111.92231750488281, 118.67274475097656, 125.42316436767578, 132.173583984375, 138.92401123046875, 145.6744384765625, 152.42486572265625, 159.17529296875, 165.92572021484375, 172.6761474609375, 179.42657470703125, 186.177001953125, 192.9274139404297, 199.67784118652344, 206.4282684326172, 213.17869567871094, 219.92910766601562]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 8.0, 8.0, 13.0, 16.0, 27.0, 52.0, 108.0, 242.0, 688.0, 3584.0, 65027.0, 4069529.0, 50779.0, 3074.0, 650.0, 240.0, 110.0, 52.0, 24.0, 14.0, 12.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.3125, -100.4794921875, -97.646484375, -94.8134765625, -91.98046875, -89.1474609375, -86.314453125, -83.4814453125, -80.6484375, -77.8154296875, -74.982421875, -72.1494140625, -69.31640625, -66.4833984375, -63.650390625, -60.8173828125, -57.984375, -55.1513671875, -52.318359375, -49.4853515625, -46.65234375, -43.8193359375, -40.986328125, -38.1533203125, -35.3203125, -32.4873046875, -29.654296875, -26.8212890625, -23.98828125, -21.1552734375, -18.322265625, -15.4892578125, -12.65625, -9.8232421875, -6.990234375, -4.1572265625, -1.32421875, 1.5087890625, 4.341796875, 7.1748046875, 10.0078125, 12.8408203125, 15.673828125, 18.5068359375, 21.33984375, 24.1728515625, 27.005859375, 29.8388671875, 32.671875, 35.5048828125, 38.337890625, 41.1708984375, 44.00390625, 46.8369140625, 49.669921875, 52.5029296875, 55.3359375, 58.1689453125, 61.001953125, 63.8349609375, 66.66796875, 69.5009765625, 72.333984375, 75.1669921875, 78.0]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 11.0, 8.0, 10.0, 20.0, 15.0, 15.0, 26.0, 27.0, 45.0, 36.0, 43.0, 52.0, 67.0, 58.0, 58.0, 62.0, 68.0, 58.0, 41.0, 47.0, 37.0, 36.0, 32.0, 22.0, 19.0, 10.0, 19.0, 9.0, 14.0, 3.0, 4.0, 5.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6484375, -13.207763671875, -12.76708984375, -12.326416015625, -11.8857421875, -11.445068359375, -11.00439453125, -10.563720703125, -10.123046875, -9.682373046875, -9.24169921875, -8.801025390625, -8.3603515625, -7.919677734375, -7.47900390625, -7.038330078125, -6.59765625, -6.156982421875, -5.71630859375, -5.275634765625, -4.8349609375, -4.394287109375, -3.95361328125, -3.512939453125, -3.072265625, -2.631591796875, -2.19091796875, -1.750244140625, -1.3095703125, -0.868896484375, -0.42822265625, 0.012451171875, 0.453125, 0.893798828125, 1.33447265625, 1.775146484375, 2.2158203125, 2.656494140625, 3.09716796875, 3.537841796875, 3.978515625, 4.419189453125, 4.85986328125, 5.300537109375, 5.7412109375, 6.181884765625, 6.62255859375, 7.063232421875, 7.50390625, 7.944580078125, 8.38525390625, 8.825927734375, 9.2666015625, 9.707275390625, 10.14794921875, 10.588623046875, 11.029296875, 11.469970703125, 11.91064453125, 12.351318359375, 12.7919921875, 13.232666015625, 13.67333984375, 14.114013671875, 14.5546875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 3.0, 2.0, 5.0, 7.0, 4.0, 11.0, 16.0, 20.0, 36.0, 42.0, 61.0, 112.0, 179.0, 329.0, 720.0, 1634.0, 4038.0, 12703.0, 59044.0, 861178.0, 3086193.0, 135389.0, 22064.0, 6088.0, 2172.0, 1014.0, 516.0, 215.0, 155.0, 105.0, 63.0, 43.0, 32.0, 25.0, 16.0, 12.0, 13.0, 4.0, 5.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.21875, -41.73876953125, -40.2587890625, -38.77880859375, -37.298828125, -35.81884765625, -34.3388671875, -32.85888671875, -31.37890625, -29.89892578125, -28.4189453125, -26.93896484375, -25.458984375, -23.97900390625, -22.4990234375, -21.01904296875, -19.5390625, -18.05908203125, -16.5791015625, -15.09912109375, -13.619140625, -12.13916015625, -10.6591796875, -9.17919921875, -7.69921875, -6.21923828125, -4.7392578125, -3.25927734375, -1.779296875, -0.29931640625, 1.1806640625, 2.66064453125, 4.140625, 5.62060546875, 7.1005859375, 8.58056640625, 10.060546875, 11.54052734375, 13.0205078125, 14.50048828125, 15.98046875, 17.46044921875, 18.9404296875, 20.42041015625, 21.900390625, 23.38037109375, 24.8603515625, 26.34033203125, 27.8203125, 29.30029296875, 30.7802734375, 32.26025390625, 33.740234375, 35.22021484375, 36.7001953125, 38.18017578125, 39.66015625, 41.14013671875, 42.6201171875, 44.10009765625, 45.580078125, 47.06005859375, 48.5400390625, 50.02001953125, 51.5]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 8.0, 8.0, 23.0, 13.0, 19.0, 29.0, 49.0, 46.0, 77.0, 120.0, 212.0, 341.0, 569.0, 792.0, 669.0, 380.0, 238.0, 141.0, 91.0, 66.0, 38.0, 41.0, 12.0, 24.0, 13.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.875, -31.80419921875, -30.7333984375, -29.66259765625, -28.591796875, -27.52099609375, -26.4501953125, -25.37939453125, -24.30859375, -23.23779296875, -22.1669921875, -21.09619140625, -20.025390625, -18.95458984375, -17.8837890625, -16.81298828125, -15.7421875, -14.67138671875, -13.6005859375, -12.52978515625, -11.458984375, -10.38818359375, -9.3173828125, -8.24658203125, -7.17578125, -6.10498046875, -5.0341796875, -3.96337890625, -2.892578125, -1.82177734375, -0.7509765625, 0.31982421875, 1.390625, 2.46142578125, 3.5322265625, 4.60302734375, 5.673828125, 6.74462890625, 7.8154296875, 8.88623046875, 9.95703125, 11.02783203125, 12.0986328125, 13.16943359375, 14.240234375, 15.31103515625, 16.3818359375, 17.45263671875, 18.5234375, 19.59423828125, 20.6650390625, 21.73583984375, 22.806640625, 23.87744140625, 24.9482421875, 26.01904296875, 27.08984375, 28.16064453125, 29.2314453125, 30.30224609375, 31.373046875, 32.44384765625, 33.5146484375, 34.58544921875, 35.65625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 6.0, 6.0, 10.0, 12.0, 23.0, 32.0, 58.0, 98.0, 152.0, 200.0, 156.0, 101.0, 61.0, 34.0, 18.0, 15.0, 3.0, 6.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-529.5617065429688, -512.80517578125, -496.048583984375, -479.29205322265625, -462.5354919433594, -445.7789306640625, -429.02239990234375, -412.2658386230469, -395.50927734375, -378.7527160644531, -361.99615478515625, -345.2396240234375, -328.4830627441406, -311.72650146484375, -294.969970703125, -278.2134094238281, -261.45684814453125, -244.70028686523438, -227.94374084472656, -211.18719482421875, -194.43063354492188, -177.674072265625, -160.9175262451172, -144.16098022460938, -127.4044189453125, -110.64786529541016, -93.89131164550781, -77.13475799560547, -60.378204345703125, -43.62165069580078, -26.865097045898438, -10.108543395996094, 6.64801025390625, 23.404563903808594, 40.16111755371094, 56.91767120361328, 73.67422485351562, 90.43077850341797, 107.18733215332031, 123.94388580322266, 140.700439453125, 157.45700073242188, 174.2135467529297, 190.9700927734375, 207.72665405273438, 224.48321533203125, 241.23976135253906, 257.9963073730469, 274.75286865234375, 291.5094299316406, 308.2659912109375, 325.02252197265625, 341.7790832519531, 358.53564453125, 375.29217529296875, 392.0487365722656, 408.8052978515625, 425.5618591308594, 442.31842041015625, 459.074951171875, 475.8315124511719, 492.58807373046875, 509.3446044921875, 526.1011962890625, 542.8577270507812]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 6.0, 6.0, 6.0, 9.0, 15.0, 13.0, 22.0, 28.0, 23.0, 37.0, 38.0, 55.0, 46.0, 60.0, 70.0, 72.0, 66.0, 64.0, 66.0, 47.0, 47.0, 40.0, 35.0, 27.0, 26.0, 12.0, 15.0, 12.0, 17.0, 6.0, 4.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-308.57196044921875, -299.9285888671875, -291.2852478027344, -282.6418762207031, -273.99853515625, -265.35516357421875, -256.7117919921875, -248.0684356689453, -239.42507934570312, -230.78172302246094, -222.13836669921875, -213.4949951171875, -204.8516387939453, -196.20828247070312, -187.56491088867188, -178.9215545654297, -170.2781982421875, -161.6348419189453, -152.99148559570312, -144.34811401367188, -135.7047576904297, -127.0614013671875, -118.41803741455078, -109.77467346191406, -101.13131713867188, -92.48796081542969, -83.84459686279297, -75.20123291015625, -66.55787658691406, -57.91451644897461, -49.271156311035156, -40.6277961730957, -31.984466552734375, -23.341106414794922, -14.697746276855469, -6.054386138916016, 2.5889739990234375, 11.23233413696289, 19.875694274902344, 28.519054412841797, 37.16241455078125, 45.8057746887207, 54.449134826660156, 63.09249496459961, 71.73585510253906, 80.37921142578125, 89.02257537841797, 97.66593933105469, 106.30929565429688, 114.95265197753906, 123.59601593017578, 132.2393798828125, 140.8827362060547, 149.52609252929688, 158.16946411132812, 166.8128204345703, 175.4561767578125, 184.0995330810547, 192.74288940429688, 201.38626098632812, 210.0296173095703, 218.6729736328125, 227.31634521484375, 235.95970153808594, 244.60305786132812]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 12.0, 17.0, 17.0, 35.0, 35.0, 48.0, 77.0, 121.0, 201.0, 293.0, 501.0, 831.0, 1686.0, 3570.0, 8298.0, 21339.0, 68128.0, 284722.0, 479663.0, 121415.0, 34756.0, 12554.0, 5189.0, 2268.0, 1172.0, 628.0, 332.0, 207.0, 123.0, 78.0, 59.0, 35.0, 42.0, 23.0, 13.0, 9.0, 7.0, 9.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.15625, -45.595703125, -44.03515625, -42.474609375, -40.9140625, -39.353515625, -37.79296875, -36.232421875, -34.671875, -33.111328125, -31.55078125, -29.990234375, -28.4296875, -26.869140625, -25.30859375, -23.748046875, -22.1875, -20.626953125, -19.06640625, -17.505859375, -15.9453125, -14.384765625, -12.82421875, -11.263671875, -9.703125, -8.142578125, -6.58203125, -5.021484375, -3.4609375, -1.900390625, -0.33984375, 1.220703125, 2.78125, 4.341796875, 5.90234375, 7.462890625, 9.0234375, 10.583984375, 12.14453125, 13.705078125, 15.265625, 16.826171875, 18.38671875, 19.947265625, 21.5078125, 23.068359375, 24.62890625, 26.189453125, 27.75, 29.310546875, 30.87109375, 32.431640625, 33.9921875, 35.552734375, 37.11328125, 38.673828125, 40.234375, 41.794921875, 43.35546875, 44.916015625, 46.4765625, 48.037109375, 49.59765625, 51.158203125, 52.71875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 9.0, 8.0, 19.0, 21.0, 35.0, 35.0, 55.0, 63.0, 74.0, 96.0, 96.0, 94.0, 84.0, 79.0, 74.0, 50.0, 28.0, 27.0, 14.0, 13.0, 8.0, 8.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.0625, -28.14892578125, -27.2353515625, -26.32177734375, -25.408203125, -24.49462890625, -23.5810546875, -22.66748046875, -21.75390625, -20.84033203125, -19.9267578125, -19.01318359375, -18.099609375, -17.18603515625, -16.2724609375, -15.35888671875, -14.4453125, -13.53173828125, -12.6181640625, -11.70458984375, -10.791015625, -9.87744140625, -8.9638671875, -8.05029296875, -7.13671875, -6.22314453125, -5.3095703125, -4.39599609375, -3.482421875, -2.56884765625, -1.6552734375, -0.74169921875, 0.171875, 1.08544921875, 1.9990234375, 2.91259765625, 3.826171875, 4.73974609375, 5.6533203125, 6.56689453125, 7.48046875, 8.39404296875, 9.3076171875, 10.22119140625, 11.134765625, 12.04833984375, 12.9619140625, 13.87548828125, 14.7890625, 15.70263671875, 16.6162109375, 17.52978515625, 18.443359375, 19.35693359375, 20.2705078125, 21.18408203125, 22.09765625, 23.01123046875, 23.9248046875, 24.83837890625, 25.751953125, 26.66552734375, 27.5791015625, 28.49267578125, 29.40625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 7.0, 3.0, 1.0, 2.0, 5.0, 14.0, 15.0, 17.0, 32.0, 39.0, 70.0, 88.0, 131.0, 253.0, 506.0, 1054.0, 2637.0, 8953.0, 80743.0, 883190.0, 58753.0, 7669.0, 2268.0, 991.0, 472.0, 227.0, 129.0, 87.0, 61.0, 39.0, 23.0, 14.0, 13.0, 12.0, 8.0, 7.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-164.5, -159.859375, -155.21875, -150.578125, -145.9375, -141.296875, -136.65625, -132.015625, -127.375, -122.734375, -118.09375, -113.453125, -108.8125, -104.171875, -99.53125, -94.890625, -90.25, -85.609375, -80.96875, -76.328125, -71.6875, -67.046875, -62.40625, -57.765625, -53.125, -48.484375, -43.84375, -39.203125, -34.5625, -29.921875, -25.28125, -20.640625, -16.0, -11.359375, -6.71875, -2.078125, 2.5625, 7.203125, 11.84375, 16.484375, 21.125, 25.765625, 30.40625, 35.046875, 39.6875, 44.328125, 48.96875, 53.609375, 58.25, 62.890625, 67.53125, 72.171875, 76.8125, 81.453125, 86.09375, 90.734375, 95.375, 100.015625, 104.65625, 109.296875, 113.9375, 118.578125, 123.21875, 127.859375, 132.5]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 13.0, 8.0, 11.0, 11.0, 14.0, 19.0, 25.0, 40.0, 46.0, 47.0, 62.0, 70.0, 73.0, 75.0, 70.0, 54.0, 57.0, 46.0, 53.0, 44.0, 29.0, 29.0, 17.0, 13.0, 18.0, 9.0, 7.0, 9.0, 5.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-111.4375, -108.3466796875, -105.255859375, -102.1650390625, -99.07421875, -95.9833984375, -92.892578125, -89.8017578125, -86.7109375, -83.6201171875, -80.529296875, -77.4384765625, -74.34765625, -71.2568359375, -68.166015625, -65.0751953125, -61.984375, -58.8935546875, -55.802734375, -52.7119140625, -49.62109375, -46.5302734375, -43.439453125, -40.3486328125, -37.2578125, -34.1669921875, -31.076171875, -27.9853515625, -24.89453125, -21.8037109375, -18.712890625, -15.6220703125, -12.53125, -9.4404296875, -6.349609375, -3.2587890625, -0.16796875, 2.9228515625, 6.013671875, 9.1044921875, 12.1953125, 15.2861328125, 18.376953125, 21.4677734375, 24.55859375, 27.6494140625, 30.740234375, 33.8310546875, 36.921875, 40.0126953125, 43.103515625, 46.1943359375, 49.28515625, 52.3759765625, 55.466796875, 58.5576171875, 61.6484375, 64.7392578125, 67.830078125, 70.9208984375, 74.01171875, 77.1025390625, 80.193359375, 83.2841796875, 86.375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 9.0, 9.0, 13.0, 13.0, 22.0, 36.0, 70.0, 100.0, 158.0, 271.0, 421.0, 884.0, 1814.0, 4470.0, 18727.0, 921483.0, 86983.0, 7560.0, 2758.0, 1254.0, 601.0, 331.0, 186.0, 123.0, 71.0, 59.0, 39.0, 20.0, 17.0, 14.0, 13.0, 8.0, 0.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.0, -100.501953125, -97.00390625, -93.505859375, -90.0078125, -86.509765625, -83.01171875, -79.513671875, -76.015625, -72.517578125, -69.01953125, -65.521484375, -62.0234375, -58.525390625, -55.02734375, -51.529296875, -48.03125, -44.533203125, -41.03515625, -37.537109375, -34.0390625, -30.541015625, -27.04296875, -23.544921875, -20.046875, -16.548828125, -13.05078125, -9.552734375, -6.0546875, -2.556640625, 0.94140625, 4.439453125, 7.9375, 11.435546875, 14.93359375, 18.431640625, 21.9296875, 25.427734375, 28.92578125, 32.423828125, 35.921875, 39.419921875, 42.91796875, 46.416015625, 49.9140625, 53.412109375, 56.91015625, 60.408203125, 63.90625, 67.404296875, 70.90234375, 74.400390625, 77.8984375, 81.396484375, 84.89453125, 88.392578125, 91.890625, 95.388671875, 98.88671875, 102.384765625, 105.8828125, 109.380859375, 112.87890625, 116.376953125, 119.875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 26.0, 84.0, 335.0, 384.0, 87.0, 35.0, 13.0, 10.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039031982421875, -0.03781318664550781, -0.036594390869140625, -0.03537559509277344, -0.03415679931640625, -0.03293800354003906, -0.031719207763671875, -0.030500411987304688, -0.0292816162109375, -0.028062820434570312, -0.026844024658203125, -0.025625228881835938, -0.02440643310546875, -0.023187637329101562, -0.021968841552734375, -0.020750045776367188, -0.01953125, -0.018312454223632812, -0.017093658447265625, -0.015874862670898438, -0.01465606689453125, -0.013437271118164062, -0.012218475341796875, -0.010999679565429688, -0.0097808837890625, -0.008562088012695312, -0.007343292236328125, -0.0061244964599609375, -0.00490570068359375, -0.0036869049072265625, -0.002468109130859375, -0.0012493133544921875, -3.0517578125e-05, 0.0011882781982421875, 0.002407073974609375, 0.0036258697509765625, 0.00484466552734375, 0.0060634613037109375, 0.007282257080078125, 0.008501052856445312, 0.0097198486328125, 0.010938644409179688, 0.012157440185546875, 0.013376235961914062, 0.01459503173828125, 0.015813827514648438, 0.017032623291015625, 0.018251419067382812, 0.01947021484375, 0.020689010620117188, 0.021907806396484375, 0.023126602172851562, 0.02434539794921875, 0.025564193725585938, 0.026782989501953125, 0.028001785278320312, 0.0292205810546875, 0.030439376831054688, 0.031658172607421875, 0.03287696838378906, 0.03409576416015625, 0.03531455993652344, 0.036533355712890625, 0.03775215148925781, 0.038970947265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 9.0, 6.0, 15.0, 20.0, 34.0, 50.0, 75.0, 151.0, 292.0, 625.0, 1588.0, 5565.0, 52461.0, 959017.0, 22672.0, 3768.0, 1163.0, 475.0, 240.0, 128.0, 71.0, 38.0, 22.0, 18.0, 10.0, 7.0, 7.0, 5.0, 3.0, 5.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.5, -95.416015625, -91.33203125, -87.248046875, -83.1640625, -79.080078125, -74.99609375, -70.912109375, -66.828125, -62.744140625, -58.66015625, -54.576171875, -50.4921875, -46.408203125, -42.32421875, -38.240234375, -34.15625, -30.072265625, -25.98828125, -21.904296875, -17.8203125, -13.736328125, -9.65234375, -5.568359375, -1.484375, 2.599609375, 6.68359375, 10.767578125, 14.8515625, 18.935546875, 23.01953125, 27.103515625, 31.1875, 35.271484375, 39.35546875, 43.439453125, 47.5234375, 51.607421875, 55.69140625, 59.775390625, 63.859375, 67.943359375, 72.02734375, 76.111328125, 80.1953125, 84.279296875, 88.36328125, 92.447265625, 96.53125, 100.615234375, 104.69921875, 108.783203125, 112.8671875, 116.951171875, 121.03515625, 125.119140625, 129.203125, 133.287109375, 137.37109375, 141.455078125, 145.5390625, 149.623046875, 153.70703125, 157.791015625, 161.875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 8.0, 5.0, 10.0, 32.0, 32.0, 84.0, 197.0, 284.0, 169.0, 74.0, 39.0, 21.0, 9.0, 5.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.25, -67.59765625, -64.9453125, -62.29296875, -59.640625, -56.98828125, -54.3359375, -51.68359375, -49.03125, -46.37890625, -43.7265625, -41.07421875, -38.421875, -35.76953125, -33.1171875, -30.46484375, -27.8125, -25.16015625, -22.5078125, -19.85546875, -17.203125, -14.55078125, -11.8984375, -9.24609375, -6.59375, -3.94140625, -1.2890625, 1.36328125, 4.015625, 6.66796875, 9.3203125, 11.97265625, 14.625, 17.27734375, 19.9296875, 22.58203125, 25.234375, 27.88671875, 30.5390625, 33.19140625, 35.84375, 38.49609375, 41.1484375, 43.80078125, 46.453125, 49.10546875, 51.7578125, 54.41015625, 57.0625, 59.71484375, 62.3671875, 65.01953125, 67.671875, 70.32421875, 72.9765625, 75.62890625, 78.28125, 80.93359375, 83.5859375, 86.23828125, 88.890625, 91.54296875, 94.1953125, 96.84765625, 99.5]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 11.0, 16.0, 41.0, 193.0, 453.0, 203.0, 56.0, 20.0, 9.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2727.38623046875, -2661.7666015625, -2596.14697265625, -2530.527099609375, -2464.907470703125, -2399.287841796875, -2333.668212890625, -2268.04833984375, -2202.4287109375, -2136.80908203125, -2071.189453125, -2005.5697021484375, -1939.949951171875, -1874.330322265625, -1808.710693359375, -1743.0909423828125, -1677.4713134765625, -1611.8516845703125, -1546.23193359375, -1480.6123046875, -1414.9925537109375, -1349.3729248046875, -1283.753173828125, -1218.133544921875, -1152.513916015625, -1086.894287109375, -1021.2745361328125, -955.6549072265625, -890.03515625, -824.41552734375, -758.7958374023438, -693.1761474609375, -627.5562744140625, -561.9365844726562, -496.31689453125, -430.6972351074219, -365.0775451660156, -299.4578552246094, -233.83819580078125, -168.218505859375, -102.59881591796875, -36.97913360595703, 28.640548706054688, 94.26022338867188, 159.87991333007812, 225.49960327148438, 291.1192626953125, 356.73895263671875, 422.358642578125, 487.97833251953125, 553.5980224609375, 619.2176513671875, 684.83740234375, 750.45703125, 816.0767211914062, 881.6964111328125, 947.3161010742188, 1012.935791015625, 1078.555419921875, 1144.1751708984375, 1209.7947998046875, 1275.41455078125, 1341.0341796875, 1406.65380859375, 1472.2735595703125]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 5.0, 3.0, 11.0, 6.0, 2.0, 7.0, 17.0, 19.0, 23.0, 24.0, 23.0, 34.0, 42.0, 48.0, 32.0, 45.0, 75.0, 94.0, 82.0, 63.0, 47.0, 48.0, 45.0, 37.0, 35.0, 20.0, 28.0, 17.0, 15.0, 20.0, 10.0, 3.0, 8.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-403.5238952636719, -387.91912841796875, -372.3143615722656, -356.7095947265625, -341.1048278808594, -325.50006103515625, -309.895263671875, -294.29052734375, -278.68572998046875, -263.0809631347656, -247.4761962890625, -231.87142944335938, -216.26666259765625, -200.66189575195312, -185.05711364746094, -169.4523468017578, -153.84759521484375, -138.24282836914062, -122.6380615234375, -107.03328704833984, -91.42852020263672, -75.8237533569336, -60.21897888183594, -44.61421203613281, -29.009445190429688, -13.40467643737793, 2.200092315673828, 17.80486297607422, 33.409629821777344, 49.01439666748047, 64.61917114257812, 80.22393798828125, 95.82867431640625, 111.43344116210938, 127.0382080078125, 142.64297485351562, 158.24774169921875, 173.85250854492188, 189.45729064941406, 205.0620574951172, 220.6668243408203, 236.27159118652344, 251.87635803222656, 267.48114013671875, 283.0859069824219, 298.690673828125, 314.2954406738281, 329.90020751953125, 345.5049743652344, 361.1097412109375, 376.7145080566406, 392.31927490234375, 407.9240417480469, 423.52880859375, 439.13360595703125, 454.73834228515625, 470.3431396484375, 485.9479064941406, 501.55267333984375, 517.157470703125, 532.76220703125, 548.3670043945312, 563.9717407226562, 579.5765380859375, 595.1812744140625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 6.0, 10.0, 11.0, 12.0, 25.0, 22.0, 32.0, 40.0, 63.0, 95.0, 146.0, 238.0, 277.0, 514.0, 894.0, 1818.0, 4080.0, 12683.0, 62945.0, 1120385.0, 2825849.0, 131242.0, 21673.0, 6218.0, 2330.0, 1071.0, 588.0, 322.0, 220.0, 121.0, 115.0, 67.0, 48.0, 24.0, 29.0, 12.0, 14.0, 8.0, 5.0, 8.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.09375, -49.4541015625, -47.814453125, -46.1748046875, -44.53515625, -42.8955078125, -41.255859375, -39.6162109375, -37.9765625, -36.3369140625, -34.697265625, -33.0576171875, -31.41796875, -29.7783203125, -28.138671875, -26.4990234375, -24.859375, -23.2197265625, -21.580078125, -19.9404296875, -18.30078125, -16.6611328125, -15.021484375, -13.3818359375, -11.7421875, -10.1025390625, -8.462890625, -6.8232421875, -5.18359375, -3.5439453125, -1.904296875, -0.2646484375, 1.375, 3.0146484375, 4.654296875, 6.2939453125, 7.93359375, 9.5732421875, 11.212890625, 12.8525390625, 14.4921875, 16.1318359375, 17.771484375, 19.4111328125, 21.05078125, 22.6904296875, 24.330078125, 25.9697265625, 27.609375, 29.2490234375, 30.888671875, 32.5283203125, 34.16796875, 35.8076171875, 37.447265625, 39.0869140625, 40.7265625, 42.3662109375, 44.005859375, 45.6455078125, 47.28515625, 48.9248046875, 50.564453125, 52.2041015625, 53.84375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 10.0, 15.0, 20.0, 29.0, 31.0, 37.0, 49.0, 51.0, 58.0, 63.0, 68.0, 73.0, 86.0, 67.0, 72.0, 55.0, 50.0, 33.0, 21.0, 20.0, 21.0, 14.0, 9.0, 9.0, 3.0, 4.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.109375, -23.406005859375, -22.70263671875, -21.999267578125, -21.2958984375, -20.592529296875, -19.88916015625, -19.185791015625, -18.482421875, -17.779052734375, -17.07568359375, -16.372314453125, -15.6689453125, -14.965576171875, -14.26220703125, -13.558837890625, -12.85546875, -12.152099609375, -11.44873046875, -10.745361328125, -10.0419921875, -9.338623046875, -8.63525390625, -7.931884765625, -7.228515625, -6.525146484375, -5.82177734375, -5.118408203125, -4.4150390625, -3.711669921875, -3.00830078125, -2.304931640625, -1.6015625, -0.898193359375, -0.19482421875, 0.508544921875, 1.2119140625, 1.915283203125, 2.61865234375, 3.322021484375, 4.025390625, 4.728759765625, 5.43212890625, 6.135498046875, 6.8388671875, 7.542236328125, 8.24560546875, 8.948974609375, 9.65234375, 10.355712890625, 11.05908203125, 11.762451171875, 12.4658203125, 13.169189453125, 13.87255859375, 14.575927734375, 15.279296875, 15.982666015625, 16.68603515625, 17.389404296875, 18.0927734375, 18.796142578125, 19.49951171875, 20.202880859375, 20.90625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 15.0, 11.0, 30.0, 41.0, 40.0, 104.0, 247.0, 6294.0, 4184951.0, 1994.0, 190.0, 98.0, 86.0, 59.0, 36.0, 36.0, 21.0, 15.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-393.0, -374.625, -356.25, -337.875, -319.5, -301.125, -282.75, -264.375, -246.0, -227.625, -209.25, -190.875, -172.5, -154.125, -135.75, -117.375, -99.0, -80.625, -62.25, -43.875, -25.5, -7.125, 11.25, 29.625, 48.0, 66.375, 84.75, 103.125, 121.5, 139.875, 158.25, 176.625, 195.0, 213.375, 231.75, 250.125, 268.5, 286.875, 305.25, 323.625, 342.0, 360.375, 378.75, 397.125, 415.5, 433.875, 452.25, 470.625, 489.0, 507.375, 525.75, 544.125, 562.5, 580.875, 599.25, 617.625, 636.0, 654.375, 672.75, 691.125, 709.5, 727.875, 746.25, 764.625, 783.0]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 20.0, 105.0, 736.0, 2712.0, 393.0, 79.0, 21.0, 9.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.375, -143.998046875, -134.62109375, -125.244140625, -115.8671875, -106.490234375, -97.11328125, -87.736328125, -78.359375, -68.982421875, -59.60546875, -50.228515625, -40.8515625, -31.474609375, -22.09765625, -12.720703125, -3.34375, 6.033203125, 15.41015625, 24.787109375, 34.1640625, 43.541015625, 52.91796875, 62.294921875, 71.671875, 81.048828125, 90.42578125, 99.802734375, 109.1796875, 118.556640625, 127.93359375, 137.310546875, 146.6875, 156.064453125, 165.44140625, 174.818359375, 184.1953125, 193.572265625, 202.94921875, 212.326171875, 221.703125, 231.080078125, 240.45703125, 249.833984375, 259.2109375, 268.587890625, 277.96484375, 287.341796875, 296.71875, 306.095703125, 315.47265625, 324.849609375, 334.2265625, 343.603515625, 352.98046875, 362.357421875, 371.734375, 381.111328125, 390.48828125, 399.865234375, 409.2421875, 418.619140625, 427.99609375, 437.373046875, 446.75]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 12.0, 15.0, 20.0, 56.0, 92.0, 207.0, 254.0, 158.0, 64.0, 31.0, 26.0, 13.0, 15.0, 12.0, 5.0, 10.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1908.9403076171875, -1856.1849365234375, -1803.429443359375, -1750.674072265625, -1697.9185791015625, -1645.1632080078125, -1592.40771484375, -1539.65234375, -1486.89697265625, -1434.1416015625, -1381.3861083984375, -1328.6307373046875, -1275.875244140625, -1223.119873046875, -1170.364501953125, -1117.6090087890625, -1064.853515625, -1012.0980834960938, -959.3426513671875, -906.5872802734375, -853.831787109375, -801.076416015625, -748.3209838867188, -695.5655517578125, -642.8101196289062, -590.0546875, -537.2992553710938, -484.5438537597656, -431.7884216308594, -379.0329895019531, -326.277587890625, -273.52215576171875, -220.7667236328125, -168.01129150390625, -115.25587463378906, -62.500457763671875, -9.745025634765625, 43.010406494140625, 95.76580810546875, 148.521240234375, 201.27667236328125, 254.0321044921875, 306.78753662109375, 359.5429382324219, 412.2983703613281, 465.0538024902344, 517.8092041015625, 570.5646362304688, 623.320068359375, 676.0755004882812, 728.8309326171875, 781.5863037109375, 834.341796875, 887.09716796875, 939.8526000976562, 992.6080322265625, 1045.363525390625, 1098.118896484375, 1150.8743896484375, 1203.6297607421875, 1256.38525390625, 1309.140625, 1361.89599609375, 1414.6514892578125, 1467.4068603515625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 5.0, 6.0, 13.0, 11.0, 13.0, 17.0, 20.0, 26.0, 27.0, 36.0, 27.0, 33.0, 45.0, 39.0, 46.0, 44.0, 54.0, 50.0, 49.0, 39.0, 54.0, 28.0, 39.0, 37.0, 32.0, 29.0, 20.0, 21.0, 29.0, 13.0, 14.0, 20.0, 9.0, 9.0, 6.0, 9.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-631.1177978515625, -611.6443481445312, -592.1708374023438, -572.6973876953125, -553.223876953125, -533.7504272460938, -514.2769775390625, -494.803466796875, -475.33001708984375, -455.8565368652344, -436.383056640625, -416.90960693359375, -397.4361267089844, -377.962646484375, -358.4891662597656, -339.01568603515625, -319.5422058105469, -300.0687255859375, -280.5952453613281, -261.12176513671875, -241.6483154296875, -222.17483520507812, -202.70135498046875, -183.22789001464844, -163.75440979003906, -144.2809295654297, -124.80746459960938, -105.333984375, -85.86051177978516, -66.38703918457031, -46.91355895996094, -27.440093994140625, -7.96661376953125, 11.506860733032227, 30.980335235595703, 50.45381164550781, 69.92728424072266, 89.4007568359375, 108.87423706054688, 128.3477020263672, 147.82118225097656, 167.29466247558594, 186.76812744140625, 206.24160766601562, 225.715087890625, 245.1885528564453, 264.66204833984375, 284.135498046875, 303.6089782714844, 323.08245849609375, 342.5559387207031, 362.0294189453125, 381.50286865234375, 400.9763488769531, 420.4498291015625, 439.92327880859375, 459.39678955078125, 478.8702697753906, 498.34375, 517.8171997070312, 537.2907104492188, 556.76416015625, 576.2376708984375, 595.7111206054688, 615.1845703125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 6.0, 6.0, 9.0, 14.0, 21.0, 29.0, 35.0, 59.0, 90.0, 123.0, 205.0, 328.0, 550.0, 950.0, 1755.0, 3705.0, 8205.0, 22202.0, 77930.0, 394728.0, 416063.0, 81762.0, 23064.0, 8632.0, 3754.0, 1861.0, 1003.0, 557.0, 329.0, 211.0, 116.0, 87.0, 54.0, 32.0, 23.0, 16.0, 15.0, 9.0, 5.0, 3.0, 7.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.5, -76.4443359375, -73.388671875, -70.3330078125, -67.27734375, -64.2216796875, -61.166015625, -58.1103515625, -55.0546875, -51.9990234375, -48.943359375, -45.8876953125, -42.83203125, -39.7763671875, -36.720703125, -33.6650390625, -30.609375, -27.5537109375, -24.498046875, -21.4423828125, -18.38671875, -15.3310546875, -12.275390625, -9.2197265625, -6.1640625, -3.1083984375, -0.052734375, 3.0029296875, 6.05859375, 9.1142578125, 12.169921875, 15.2255859375, 18.28125, 21.3369140625, 24.392578125, 27.4482421875, 30.50390625, 33.5595703125, 36.615234375, 39.6708984375, 42.7265625, 45.7822265625, 48.837890625, 51.8935546875, 54.94921875, 58.0048828125, 61.060546875, 64.1162109375, 67.171875, 70.2275390625, 73.283203125, 76.3388671875, 79.39453125, 82.4501953125, 85.505859375, 88.5615234375, 91.6171875, 94.6728515625, 97.728515625, 100.7841796875, 103.83984375, 106.8955078125, 109.951171875, 113.0068359375, 116.0625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 3.0, 7.0, 4.0, 6.0, 13.0, 11.0, 9.0, 11.0, 19.0, 21.0, 31.0, 38.0, 33.0, 49.0, 56.0, 44.0, 38.0, 46.0, 62.0, 52.0, 61.0, 62.0, 61.0, 47.0, 34.0, 29.0, 22.0, 21.0, 15.0, 10.0, 18.0, 16.0, 8.0, 9.0, 10.0, 5.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.921875, -26.947998046875, -25.97412109375, -25.000244140625, -24.0263671875, -23.052490234375, -22.07861328125, -21.104736328125, -20.130859375, -19.156982421875, -18.18310546875, -17.209228515625, -16.2353515625, -15.261474609375, -14.28759765625, -13.313720703125, -12.33984375, -11.365966796875, -10.39208984375, -9.418212890625, -8.4443359375, -7.470458984375, -6.49658203125, -5.522705078125, -4.548828125, -3.574951171875, -2.60107421875, -1.627197265625, -0.6533203125, 0.320556640625, 1.29443359375, 2.268310546875, 3.2421875, 4.216064453125, 5.18994140625, 6.163818359375, 7.1376953125, 8.111572265625, 9.08544921875, 10.059326171875, 11.033203125, 12.007080078125, 12.98095703125, 13.954833984375, 14.9287109375, 15.902587890625, 16.87646484375, 17.850341796875, 18.82421875, 19.798095703125, 20.77197265625, 21.745849609375, 22.7197265625, 23.693603515625, 24.66748046875, 25.641357421875, 26.615234375, 27.589111328125, 28.56298828125, 29.536865234375, 30.5107421875, 31.484619140625, 32.45849609375, 33.432373046875, 34.40625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 9.0, 9.0, 16.0, 18.0, 33.0, 44.0, 73.0, 172.0, 364.0, 894.0, 3561.0, 48695.0, 975898.0, 15374.0, 2143.0, 627.0, 264.0, 141.0, 67.0, 41.0, 37.0, 14.0, 12.0, 12.0, 8.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-530.5, -514.09375, -497.6875, -481.28125, -464.875, -448.46875, -432.0625, -415.65625, -399.25, -382.84375, -366.4375, -350.03125, -333.625, -317.21875, -300.8125, -284.40625, -268.0, -251.59375, -235.1875, -218.78125, -202.375, -185.96875, -169.5625, -153.15625, -136.75, -120.34375, -103.9375, -87.53125, -71.125, -54.71875, -38.3125, -21.90625, -5.5, 10.90625, 27.3125, 43.71875, 60.125, 76.53125, 92.9375, 109.34375, 125.75, 142.15625, 158.5625, 174.96875, 191.375, 207.78125, 224.1875, 240.59375, 257.0, 273.40625, 289.8125, 306.21875, 322.625, 339.03125, 355.4375, 371.84375, 388.25, 404.65625, 421.0625, 437.46875, 453.875, 470.28125, 486.6875, 503.09375, 519.5]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 8.0, 0.0, 2.0, 5.0, 5.0, 7.0, 18.0, 15.0, 28.0, 33.0, 41.0, 59.0, 75.0, 68.0, 90.0, 74.0, 86.0, 69.0, 69.0, 54.0, 46.0, 34.0, 30.0, 17.0, 19.0, 13.0, 6.0, 6.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-246.125, -238.81640625, -231.5078125, -224.19921875, -216.890625, -209.58203125, -202.2734375, -194.96484375, -187.65625, -180.34765625, -173.0390625, -165.73046875, -158.421875, -151.11328125, -143.8046875, -136.49609375, -129.1875, -121.87890625, -114.5703125, -107.26171875, -99.953125, -92.64453125, -85.3359375, -78.02734375, -70.71875, -63.41015625, -56.1015625, -48.79296875, -41.484375, -34.17578125, -26.8671875, -19.55859375, -12.25, -4.94140625, 2.3671875, 9.67578125, 16.984375, 24.29296875, 31.6015625, 38.91015625, 46.21875, 53.52734375, 60.8359375, 68.14453125, 75.453125, 82.76171875, 90.0703125, 97.37890625, 104.6875, 111.99609375, 119.3046875, 126.61328125, 133.921875, 141.23046875, 148.5390625, 155.84765625, 163.15625, 170.46484375, 177.7734375, 185.08203125, 192.390625, 199.69921875, 207.0078125, 214.31640625, 221.625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 8.0, 12.0, 7.0, 13.0, 24.0, 30.0, 43.0, 63.0, 69.0, 125.0, 223.0, 388.0, 671.0, 1242.0, 2907.0, 7721.0, 34378.0, 834559.0, 142439.0, 14878.0, 4641.0, 1940.0, 935.0, 493.0, 263.0, 148.0, 76.0, 58.0, 50.0, 36.0, 19.0, 30.0, 11.0, 11.0, 8.0, 7.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-130.125, -126.380859375, -122.63671875, -118.892578125, -115.1484375, -111.404296875, -107.66015625, -103.916015625, -100.171875, -96.427734375, -92.68359375, -88.939453125, -85.1953125, -81.451171875, -77.70703125, -73.962890625, -70.21875, -66.474609375, -62.73046875, -58.986328125, -55.2421875, -51.498046875, -47.75390625, -44.009765625, -40.265625, -36.521484375, -32.77734375, -29.033203125, -25.2890625, -21.544921875, -17.80078125, -14.056640625, -10.3125, -6.568359375, -2.82421875, 0.919921875, 4.6640625, 8.408203125, 12.15234375, 15.896484375, 19.640625, 23.384765625, 27.12890625, 30.873046875, 34.6171875, 38.361328125, 42.10546875, 45.849609375, 49.59375, 53.337890625, 57.08203125, 60.826171875, 64.5703125, 68.314453125, 72.05859375, 75.802734375, 79.546875, 83.291015625, 87.03515625, 90.779296875, 94.5234375, 98.267578125, 102.01171875, 105.755859375, 109.5]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 9.0, 12.0, 19.0, 29.0, 46.0, 106.0, 205.0, 270.0, 130.0, 60.0, 38.0, 23.0, 12.0, 9.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0435791015625, -0.04226350784301758, -0.040947914123535156, -0.039632320404052734, -0.03831672668457031, -0.03700113296508789, -0.03568553924560547, -0.03436994552612305, -0.033054351806640625, -0.0317387580871582, -0.03042316436767578, -0.02910757064819336, -0.027791976928710938, -0.026476383209228516, -0.025160789489746094, -0.023845195770263672, -0.02252960205078125, -0.021214008331298828, -0.019898414611816406, -0.018582820892333984, -0.017267227172851562, -0.01595163345336914, -0.014636039733886719, -0.013320446014404297, -0.012004852294921875, -0.010689258575439453, -0.009373664855957031, -0.00805807113647461, -0.0067424774169921875, -0.005426883697509766, -0.004111289978027344, -0.002795696258544922, -0.0014801025390625, -0.00016450881958007812, 0.0011510848999023438, 0.0024666786193847656, 0.0037822723388671875, 0.005097866058349609, 0.006413459777832031, 0.007729053497314453, 0.009044647216796875, 0.010360240936279297, 0.011675834655761719, 0.01299142837524414, 0.014307022094726562, 0.015622615814208984, 0.016938209533691406, 0.018253803253173828, 0.01956939697265625, 0.020884990692138672, 0.022200584411621094, 0.023516178131103516, 0.024831771850585938, 0.02614736557006836, 0.02746295928955078, 0.028778553009033203, 0.030094146728515625, 0.03140974044799805, 0.03272533416748047, 0.03404092788696289, 0.03535652160644531, 0.036672115325927734, 0.037987709045410156, 0.03930330276489258, 0.040618896484375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 1.0, 6.0, 12.0, 20.0, 19.0, 33.0, 54.0, 72.0, 95.0, 183.0, 314.0, 745.0, 2083.0, 8802.0, 88998.0, 914640.0, 25498.0, 4472.0, 1342.0, 478.0, 244.0, 136.0, 98.0, 57.0, 36.0, 25.0, 20.0, 18.0, 14.0, 14.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-181.375, -176.234375, -171.09375, -165.953125, -160.8125, -155.671875, -150.53125, -145.390625, -140.25, -135.109375, -129.96875, -124.828125, -119.6875, -114.546875, -109.40625, -104.265625, -99.125, -93.984375, -88.84375, -83.703125, -78.5625, -73.421875, -68.28125, -63.140625, -58.0, -52.859375, -47.71875, -42.578125, -37.4375, -32.296875, -27.15625, -22.015625, -16.875, -11.734375, -6.59375, -1.453125, 3.6875, 8.828125, 13.96875, 19.109375, 24.25, 29.390625, 34.53125, 39.671875, 44.8125, 49.953125, 55.09375, 60.234375, 65.375, 70.515625, 75.65625, 80.796875, 85.9375, 91.078125, 96.21875, 101.359375, 106.5, 111.640625, 116.78125, 121.921875, 127.0625, 132.203125, 137.34375, 142.484375, 147.625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 5.0, 6.0, 14.0, 8.0, 18.0, 24.0, 38.0, 46.0, 66.0, 97.0, 108.0, 165.0, 117.0, 86.0, 52.0, 35.0, 19.0, 19.0, 19.0, 13.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.25, -61.8935546875, -59.537109375, -57.1806640625, -54.82421875, -52.4677734375, -50.111328125, -47.7548828125, -45.3984375, -43.0419921875, -40.685546875, -38.3291015625, -35.97265625, -33.6162109375, -31.259765625, -28.9033203125, -26.546875, -24.1904296875, -21.833984375, -19.4775390625, -17.12109375, -14.7646484375, -12.408203125, -10.0517578125, -7.6953125, -5.3388671875, -2.982421875, -0.6259765625, 1.73046875, 4.0869140625, 6.443359375, 8.7998046875, 11.15625, 13.5126953125, 15.869140625, 18.2255859375, 20.58203125, 22.9384765625, 25.294921875, 27.6513671875, 30.0078125, 32.3642578125, 34.720703125, 37.0771484375, 39.43359375, 41.7900390625, 44.146484375, 46.5029296875, 48.859375, 51.2158203125, 53.572265625, 55.9287109375, 58.28515625, 60.6416015625, 62.998046875, 65.3544921875, 67.7109375, 70.0673828125, 72.423828125, 74.7802734375, 77.13671875, 79.4931640625, 81.849609375, 84.2060546875, 86.5625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 12.0, 16.0, 29.0, 70.0, 146.0, 319.0, 181.0, 103.0, 49.0, 26.0, 7.0, 17.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1589.79541015625, -1532.422119140625, -1475.048828125, -1417.6756591796875, -1360.3023681640625, -1302.9290771484375, -1245.5557861328125, -1188.1826171875, -1130.809326171875, -1073.43603515625, -1016.0628051757812, -958.6895141601562, -901.3162841796875, -843.9429931640625, -786.5697021484375, -729.1964721679688, -671.8231811523438, -614.4498901367188, -557.07666015625, -499.703369140625, -442.33013916015625, -384.95684814453125, -327.5835876464844, -270.2103271484375, -212.83706665039062, -155.46380615234375, -98.09053802490234, -40.71726989746094, 16.655990600585938, 74.02926635742188, 131.40252685546875, 188.77578735351562, 246.1490478515625, 303.5223083496094, 360.89556884765625, 418.26885986328125, 475.64208984375, 533.015380859375, 590.388671875, 647.7619018554688, 705.1351318359375, 762.5084228515625, 819.8816528320312, 877.2549438476562, 934.628173828125, 992.00146484375, 1049.374755859375, 1106.748046875, 1164.121337890625, 1221.49462890625, 1278.867919921875, 1336.2410888671875, 1393.6143798828125, 1450.9876708984375, 1508.3609619140625, 1565.734130859375, 1623.107421875, 1680.480712890625, 1737.85400390625, 1795.2271728515625, 1852.6004638671875, 1909.9737548828125, 1967.3470458984375, 2024.72021484375, 2082.093505859375]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 10.0, 18.0, 5.0, 16.0, 21.0, 14.0, 21.0, 25.0, 32.0, 30.0, 33.0, 44.0, 40.0, 56.0, 84.0, 79.0, 67.0, 50.0, 47.0, 42.0, 35.0, 32.0, 31.0, 23.0, 19.0, 15.0, 13.0, 15.0, 10.0, 15.0, 5.0, 9.0, 7.0, 3.0, 7.0, 7.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-904.7769775390625, -875.1094970703125, -845.4420166015625, -815.7745361328125, -786.1071166992188, -756.4396362304688, -726.7721557617188, -697.1046752929688, -667.437255859375, -637.769775390625, -608.102294921875, -578.434814453125, -548.7673950195312, -519.0999145507812, -489.43243408203125, -459.76495361328125, -430.09747314453125, -400.42999267578125, -370.7625427246094, -341.0950622558594, -311.4276123046875, -281.7601318359375, -252.0926513671875, -222.42518615722656, -192.75772094726562, -163.0902557373047, -133.42279052734375, -103.75531005859375, -74.08784484863281, -44.420379638671875, -14.752899169921875, 14.914566040039062, 44.58209228515625, 74.24955749511719, 103.91703033447266, 133.58450317382812, 163.25196838378906, 192.91943359375, 222.5869140625, 252.25437927246094, 281.9218444824219, 311.5893249511719, 341.25677490234375, 370.92425537109375, 400.59173583984375, 430.2591857910156, 459.9266662597656, 489.5941162109375, 519.2615966796875, 548.9290771484375, 578.5965576171875, 608.2640380859375, 637.9314575195312, 667.5989379882812, 697.2664184570312, 726.9338989257812, 756.601318359375, 786.268798828125, 815.936279296875, 845.603759765625, 875.2711791992188, 904.9386596679688, 934.6061401367188, 964.2736206054688, 993.9411010742188]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 6.0, 7.0, 17.0, 24.0, 42.0, 67.0, 104.0, 204.0, 324.0, 696.0, 1449.0, 3857.0, 15467.0, 287532.0, 3770021.0, 99857.0, 9872.0, 2538.0, 1041.0, 485.0, 237.0, 155.0, 84.0, 66.0, 36.0, 26.0, 27.0, 10.0, 9.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.3125, -78.6318359375, -74.951171875, -71.2705078125, -67.58984375, -63.9091796875, -60.228515625, -56.5478515625, -52.8671875, -49.1865234375, -45.505859375, -41.8251953125, -38.14453125, -34.4638671875, -30.783203125, -27.1025390625, -23.421875, -19.7412109375, -16.060546875, -12.3798828125, -8.69921875, -5.0185546875, -1.337890625, 2.3427734375, 6.0234375, 9.7041015625, 13.384765625, 17.0654296875, 20.74609375, 24.4267578125, 28.107421875, 31.7880859375, 35.46875, 39.1494140625, 42.830078125, 46.5107421875, 50.19140625, 53.8720703125, 57.552734375, 61.2333984375, 64.9140625, 68.5947265625, 72.275390625, 75.9560546875, 79.63671875, 83.3173828125, 86.998046875, 90.6787109375, 94.359375, 98.0400390625, 101.720703125, 105.4013671875, 109.08203125, 112.7626953125, 116.443359375, 120.1240234375, 123.8046875, 127.4853515625, 131.166015625, 134.8466796875, 138.52734375, 142.2080078125, 145.888671875, 149.5693359375, 153.25]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 12.0, 14.0, 16.0, 23.0, 35.0, 49.0, 53.0, 67.0, 80.0, 89.0, 96.0, 99.0, 89.0, 52.0, 59.0, 43.0, 33.0, 24.0, 20.0, 9.0, 8.0, 10.0, 9.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.6875, -64.068359375, -62.44921875, -60.830078125, -59.2109375, -57.591796875, -55.97265625, -54.353515625, -52.734375, -51.115234375, -49.49609375, -47.876953125, -46.2578125, -44.638671875, -43.01953125, -41.400390625, -39.78125, -38.162109375, -36.54296875, -34.923828125, -33.3046875, -31.685546875, -30.06640625, -28.447265625, -26.828125, -25.208984375, -23.58984375, -21.970703125, -20.3515625, -18.732421875, -17.11328125, -15.494140625, -13.875, -12.255859375, -10.63671875, -9.017578125, -7.3984375, -5.779296875, -4.16015625, -2.541015625, -0.921875, 0.697265625, 2.31640625, 3.935546875, 5.5546875, 7.173828125, 8.79296875, 10.412109375, 12.03125, 13.650390625, 15.26953125, 16.888671875, 18.5078125, 20.126953125, 21.74609375, 23.365234375, 24.984375, 26.603515625, 28.22265625, 29.841796875, 31.4609375, 33.080078125, 34.69921875, 36.318359375, 37.9375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 8.0, 8.0, 12.0, 28.0, 28.0, 56.0, 72.0, 111.0, 190.0, 250.0, 853.0, 26642.0, 4161580.0, 3585.0, 339.0, 162.0, 113.0, 83.0, 56.0, 37.0, 26.0, 15.0, 11.0, 6.0, 10.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-658.0, -638.2421875, -618.484375, -598.7265625, -578.96875, -559.2109375, -539.453125, -519.6953125, -499.9375, -480.1796875, -460.421875, -440.6640625, -420.90625, -401.1484375, -381.390625, -361.6328125, -341.875, -322.1171875, -302.359375, -282.6015625, -262.84375, -243.0859375, -223.328125, -203.5703125, -183.8125, -164.0546875, -144.296875, -124.5390625, -104.78125, -85.0234375, -65.265625, -45.5078125, -25.75, -5.9921875, 13.765625, 33.5234375, 53.28125, 73.0390625, 92.796875, 112.5546875, 132.3125, 152.0703125, 171.828125, 191.5859375, 211.34375, 231.1015625, 250.859375, 270.6171875, 290.375, 310.1328125, 329.890625, 349.6484375, 369.40625, 389.1640625, 408.921875, 428.6796875, 448.4375, 468.1953125, 487.953125, 507.7109375, 527.46875, 547.2265625, 566.984375, 586.7421875, 606.5]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 11.0, 40.0, 149.0, 1479.0, 2139.0, 192.0, 36.0, 24.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-505.75, -492.8046875, -479.859375, -466.9140625, -453.96875, -441.0234375, -428.078125, -415.1328125, -402.1875, -389.2421875, -376.296875, -363.3515625, -350.40625, -337.4609375, -324.515625, -311.5703125, -298.625, -285.6796875, -272.734375, -259.7890625, -246.84375, -233.8984375, -220.953125, -208.0078125, -195.0625, -182.1171875, -169.171875, -156.2265625, -143.28125, -130.3359375, -117.390625, -104.4453125, -91.5, -78.5546875, -65.609375, -52.6640625, -39.71875, -26.7734375, -13.828125, -0.8828125, 12.0625, 25.0078125, 37.953125, 50.8984375, 63.84375, 76.7890625, 89.734375, 102.6796875, 115.625, 128.5703125, 141.515625, 154.4609375, 167.40625, 180.3515625, 193.296875, 206.2421875, 219.1875, 232.1328125, 245.078125, 258.0234375, 270.96875, 283.9140625, 296.859375, 309.8046875, 322.75]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 5.0, 16.0, 22.0, 48.0, 123.0, 351.0, 265.0, 88.0, 49.0, 13.0, 12.0, 5.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2425.044921875, -2338.379150390625, -2251.713134765625, -2165.04736328125, -2078.38134765625, -1991.715576171875, -1905.0496826171875, -1818.3837890625, -1731.7178955078125, -1645.052001953125, -1558.3861083984375, -1471.72021484375, -1385.054443359375, -1298.388427734375, -1211.72265625, -1125.0567626953125, -1038.390869140625, -951.7249755859375, -865.05908203125, -778.3932495117188, -691.7273559570312, -605.0614624023438, -518.3956298828125, -431.729736328125, -345.0638427734375, -258.39794921875, -171.73208618164062, -85.06622314453125, 1.59967041015625, 88.26556396484375, 174.931396484375, 261.5972900390625, 348.263427734375, 434.9293212890625, 521.59521484375, 608.2610473632812, 694.9269409179688, 781.5928344726562, 868.2586669921875, 954.924560546875, 1041.5904541015625, 1128.25634765625, 1214.9222412109375, 1301.588134765625, 1388.25390625, 1474.919921875, 1561.585693359375, 1648.2515869140625, 1734.91748046875, 1821.5833740234375, 1908.249267578125, 1994.9150390625, 2081.5810546875, 2168.246826171875, 2254.91259765625, 2341.57861328125, 2428.24462890625, 2514.910400390625, 2601.576416015625, 2688.2421875, 2774.908203125, 2861.573974609375, 2948.23974609375, 3034.90576171875, 3121.571533203125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 12.0, 9.0, 14.0, 16.0, 14.0, 18.0, 26.0, 44.0, 43.0, 54.0, 54.0, 70.0, 72.0, 50.0, 59.0, 66.0, 60.0, 55.0, 54.0, 30.0, 52.0, 38.0, 19.0, 16.0, 13.0, 15.0, 9.0, 7.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-505.1383972167969, -485.39404296875, -465.649658203125, -445.9053039550781, -426.16094970703125, -406.41656494140625, -386.6722106933594, -366.9278564453125, -347.1834716796875, -327.4391174316406, -307.6947326660156, -287.95037841796875, -268.20599365234375, -248.46163940429688, -228.71728515625, -208.97291564941406, -189.22854614257812, -169.4841766357422, -149.73980712890625, -129.99545288085938, -110.25108337402344, -90.5067138671875, -70.7623519897461, -51.01799011230469, -31.27362060546875, -11.529254913330078, 8.215110778808594, 27.959476470947266, 47.70384216308594, 67.44821166992188, 87.19257354736328, 106.93693542480469, 126.68133544921875, 146.4257049560547, 166.17007446289062, 185.9144287109375, 205.65879821777344, 225.40316772460938, 245.14752197265625, 264.89190673828125, 284.6362609863281, 304.380615234375, 324.125, 343.8693542480469, 363.61370849609375, 383.35809326171875, 403.1024475097656, 422.8468017578125, 442.5911865234375, 462.3355407714844, 482.0799255371094, 501.82427978515625, 521.5686645507812, 541.31298828125, 561.057373046875, 580.8017578125, 600.546142578125, 620.29052734375, 640.0348510742188, 659.7792358398438, 679.5236206054688, 699.2679443359375, 719.0123291015625, 738.7567138671875, 758.5010375976562]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 9.0, 7.0, 7.0, 15.0, 16.0, 21.0, 41.0, 54.0, 93.0, 126.0, 189.0, 359.0, 650.0, 1167.0, 2321.0, 4949.0, 11900.0, 34633.0, 162593.0, 653819.0, 126264.0, 29901.0, 10456.0, 4378.0, 2077.0, 1017.0, 610.0, 328.0, 170.0, 125.0, 71.0, 51.0, 38.0, 29.0, 18.0, 16.0, 9.0, 10.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-166.25, -161.421875, -156.59375, -151.765625, -146.9375, -142.109375, -137.28125, -132.453125, -127.625, -122.796875, -117.96875, -113.140625, -108.3125, -103.484375, -98.65625, -93.828125, -89.0, -84.171875, -79.34375, -74.515625, -69.6875, -64.859375, -60.03125, -55.203125, -50.375, -45.546875, -40.71875, -35.890625, -31.0625, -26.234375, -21.40625, -16.578125, -11.75, -6.921875, -2.09375, 2.734375, 7.5625, 12.390625, 17.21875, 22.046875, 26.875, 31.703125, 36.53125, 41.359375, 46.1875, 51.015625, 55.84375, 60.671875, 65.5, 70.328125, 75.15625, 79.984375, 84.8125, 89.640625, 94.46875, 99.296875, 104.125, 108.953125, 113.78125, 118.609375, 123.4375, 128.265625, 133.09375, 137.921875, 142.75]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 8.0, 11.0, 13.0, 23.0, 36.0, 30.0, 43.0, 68.0, 67.0, 65.0, 96.0, 93.0, 89.0, 82.0, 49.0, 51.0, 36.0, 29.0, 26.0, 29.0, 14.0, 13.0, 8.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-78.6875, -76.83056640625, -74.9736328125, -73.11669921875, -71.259765625, -69.40283203125, -67.5458984375, -65.68896484375, -63.83203125, -61.97509765625, -60.1181640625, -58.26123046875, -56.404296875, -54.54736328125, -52.6904296875, -50.83349609375, -48.9765625, -47.11962890625, -45.2626953125, -43.40576171875, -41.548828125, -39.69189453125, -37.8349609375, -35.97802734375, -34.12109375, -32.26416015625, -30.4072265625, -28.55029296875, -26.693359375, -24.83642578125, -22.9794921875, -21.12255859375, -19.265625, -17.40869140625, -15.5517578125, -13.69482421875, -11.837890625, -9.98095703125, -8.1240234375, -6.26708984375, -4.41015625, -2.55322265625, -0.6962890625, 1.16064453125, 3.017578125, 4.87451171875, 6.7314453125, 8.58837890625, 10.4453125, 12.30224609375, 14.1591796875, 16.01611328125, 17.873046875, 19.72998046875, 21.5869140625, 23.44384765625, 25.30078125, 27.15771484375, 29.0146484375, 30.87158203125, 32.728515625, 34.58544921875, 36.4423828125, 38.29931640625, 40.15625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 6.0, 7.0, 18.0, 16.0, 21.0, 29.0, 30.0, 37.0, 74.0, 115.0, 174.0, 271.0, 602.0, 1420.0, 4129.0, 20276.0, 648498.0, 349110.0, 17424.0, 3638.0, 1270.0, 562.0, 312.0, 161.0, 110.0, 70.0, 42.0, 25.0, 33.0, 15.0, 17.0, 9.0, 11.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-310.5, -298.5390625, -286.578125, -274.6171875, -262.65625, -250.6953125, -238.734375, -226.7734375, -214.8125, -202.8515625, -190.890625, -178.9296875, -166.96875, -155.0078125, -143.046875, -131.0859375, -119.125, -107.1640625, -95.203125, -83.2421875, -71.28125, -59.3203125, -47.359375, -35.3984375, -23.4375, -11.4765625, 0.484375, 12.4453125, 24.40625, 36.3671875, 48.328125, 60.2890625, 72.25, 84.2109375, 96.171875, 108.1328125, 120.09375, 132.0546875, 144.015625, 155.9765625, 167.9375, 179.8984375, 191.859375, 203.8203125, 215.78125, 227.7421875, 239.703125, 251.6640625, 263.625, 275.5859375, 287.546875, 299.5078125, 311.46875, 323.4296875, 335.390625, 347.3515625, 359.3125, 371.2734375, 383.234375, 395.1953125, 407.15625, 419.1171875, 431.078125, 443.0390625, 455.0]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 3.0, 7.0, 6.0, 8.0, 6.0, 6.0, 10.0, 11.0, 15.0, 19.0, 22.0, 29.0, 33.0, 49.0, 42.0, 47.0, 39.0, 48.0, 44.0, 53.0, 47.0, 41.0, 51.0, 50.0, 54.0, 35.0, 29.0, 36.0, 28.0, 24.0, 18.0, 19.0, 13.0, 11.0, 9.0, 5.0, 7.0, 2.0, 2.0, 5.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-186.0, -180.703125, -175.40625, -170.109375, -164.8125, -159.515625, -154.21875, -148.921875, -143.625, -138.328125, -133.03125, -127.734375, -122.4375, -117.140625, -111.84375, -106.546875, -101.25, -95.953125, -90.65625, -85.359375, -80.0625, -74.765625, -69.46875, -64.171875, -58.875, -53.578125, -48.28125, -42.984375, -37.6875, -32.390625, -27.09375, -21.796875, -16.5, -11.203125, -5.90625, -0.609375, 4.6875, 9.984375, 15.28125, 20.578125, 25.875, 31.171875, 36.46875, 41.765625, 47.0625, 52.359375, 57.65625, 62.953125, 68.25, 73.546875, 78.84375, 84.140625, 89.4375, 94.734375, 100.03125, 105.328125, 110.625, 115.921875, 121.21875, 126.515625, 131.8125, 137.109375, 142.40625, 147.703125, 153.0]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 3.0, 11.0, 13.0, 18.0, 30.0, 29.0, 57.0, 81.0, 108.0, 211.0, 292.0, 508.0, 914.0, 1816.0, 3947.0, 9879.0, 31135.0, 162880.0, 727409.0, 76838.0, 19313.0, 6807.0, 2965.0, 1398.0, 737.0, 463.0, 249.0, 130.0, 92.0, 55.0, 58.0, 32.0, 20.0, 11.0, 9.0, 15.0, 8.0, 8.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.875, -66.1533203125, -63.431640625, -60.7099609375, -57.98828125, -55.2666015625, -52.544921875, -49.8232421875, -47.1015625, -44.3798828125, -41.658203125, -38.9365234375, -36.21484375, -33.4931640625, -30.771484375, -28.0498046875, -25.328125, -22.6064453125, -19.884765625, -17.1630859375, -14.44140625, -11.7197265625, -8.998046875, -6.2763671875, -3.5546875, -0.8330078125, 1.888671875, 4.6103515625, 7.33203125, 10.0537109375, 12.775390625, 15.4970703125, 18.21875, 20.9404296875, 23.662109375, 26.3837890625, 29.10546875, 31.8271484375, 34.548828125, 37.2705078125, 39.9921875, 42.7138671875, 45.435546875, 48.1572265625, 50.87890625, 53.6005859375, 56.322265625, 59.0439453125, 61.765625, 64.4873046875, 67.208984375, 69.9306640625, 72.65234375, 75.3740234375, 78.095703125, 80.8173828125, 83.5390625, 86.2607421875, 88.982421875, 91.7041015625, 94.42578125, 97.1474609375, 99.869140625, 102.5908203125, 105.3125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 1.0, 9.0, 3.0, 7.0, 7.0, 10.0, 15.0, 21.0, 34.0, 41.0, 68.0, 142.0, 236.0, 154.0, 79.0, 46.0, 31.0, 14.0, 23.0, 9.0, 16.0, 4.0, 0.0, 7.0, 7.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02935791015625, -0.028165817260742188, -0.026973724365234375, -0.025781631469726562, -0.02458953857421875, -0.023397445678710938, -0.022205352783203125, -0.021013259887695312, -0.0198211669921875, -0.018629074096679688, -0.017436981201171875, -0.016244888305664062, -0.01505279541015625, -0.013860702514648438, -0.012668609619140625, -0.011476516723632812, -0.010284423828125, -0.009092330932617188, -0.007900238037109375, -0.0067081451416015625, -0.00551605224609375, -0.0043239593505859375, -0.003131866455078125, -0.0019397735595703125, -0.0007476806640625, 0.0004444122314453125, 0.001636505126953125, 0.0028285980224609375, 0.00402069091796875, 0.0052127838134765625, 0.006404876708984375, 0.0075969696044921875, 0.0087890625, 0.009981155395507812, 0.011173248291015625, 0.012365341186523438, 0.01355743408203125, 0.014749526977539062, 0.015941619873046875, 0.017133712768554688, 0.0183258056640625, 0.019517898559570312, 0.020709991455078125, 0.021902084350585938, 0.02309417724609375, 0.024286270141601562, 0.025478363037109375, 0.026670455932617188, 0.027862548828125, 0.029054641723632812, 0.030246734619140625, 0.03143882751464844, 0.03263092041015625, 0.03382301330566406, 0.035015106201171875, 0.03620719909667969, 0.0373992919921875, 0.03859138488769531, 0.039783477783203125, 0.04097557067871094, 0.04216766357421875, 0.04335975646972656, 0.044551849365234375, 0.04574394226074219, 0.04693603515625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 5.0, 7.0, 17.0, 10.0, 28.0, 40.0, 49.0, 69.0, 121.0, 191.0, 367.0, 785.0, 1758.0, 5080.0, 24750.0, 300825.0, 669411.0, 34652.0, 6455.0, 1967.0, 833.0, 421.0, 245.0, 174.0, 93.0, 60.0, 40.0, 26.0, 23.0, 12.0, 10.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-140.625, -136.9326171875, -133.240234375, -129.5478515625, -125.85546875, -122.1630859375, -118.470703125, -114.7783203125, -111.0859375, -107.3935546875, -103.701171875, -100.0087890625, -96.31640625, -92.6240234375, -88.931640625, -85.2392578125, -81.546875, -77.8544921875, -74.162109375, -70.4697265625, -66.77734375, -63.0849609375, -59.392578125, -55.7001953125, -52.0078125, -48.3154296875, -44.623046875, -40.9306640625, -37.23828125, -33.5458984375, -29.853515625, -26.1611328125, -22.46875, -18.7763671875, -15.083984375, -11.3916015625, -7.69921875, -4.0068359375, -0.314453125, 3.3779296875, 7.0703125, 10.7626953125, 14.455078125, 18.1474609375, 21.83984375, 25.5322265625, 29.224609375, 32.9169921875, 36.609375, 40.3017578125, 43.994140625, 47.6865234375, 51.37890625, 55.0712890625, 58.763671875, 62.4560546875, 66.1484375, 69.8408203125, 73.533203125, 77.2255859375, 80.91796875, 84.6103515625, 88.302734375, 91.9951171875, 95.6875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 7.0, 6.0, 7.0, 14.0, 11.0, 8.0, 8.0, 20.0, 30.0, 27.0, 31.0, 39.0, 64.0, 90.0, 93.0, 89.0, 77.0, 65.0, 59.0, 46.0, 38.0, 22.0, 31.0, 19.0, 15.0, 14.0, 15.0, 9.0, 10.0, 6.0, 4.0, 1.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.28125, -48.51123046875, -46.7412109375, -44.97119140625, -43.201171875, -41.43115234375, -39.6611328125, -37.89111328125, -36.12109375, -34.35107421875, -32.5810546875, -30.81103515625, -29.041015625, -27.27099609375, -25.5009765625, -23.73095703125, -21.9609375, -20.19091796875, -18.4208984375, -16.65087890625, -14.880859375, -13.11083984375, -11.3408203125, -9.57080078125, -7.80078125, -6.03076171875, -4.2607421875, -2.49072265625, -0.720703125, 1.04931640625, 2.8193359375, 4.58935546875, 6.359375, 8.12939453125, 9.8994140625, 11.66943359375, 13.439453125, 15.20947265625, 16.9794921875, 18.74951171875, 20.51953125, 22.28955078125, 24.0595703125, 25.82958984375, 27.599609375, 29.36962890625, 31.1396484375, 32.90966796875, 34.6796875, 36.44970703125, 38.2197265625, 39.98974609375, 41.759765625, 43.52978515625, 45.2998046875, 47.06982421875, 48.83984375, 50.60986328125, 52.3798828125, 54.14990234375, 55.919921875, 57.68994140625, 59.4599609375, 61.22998046875, 63.0]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 13.0, 24.0, 74.0, 187.0, 348.0, 192.0, 102.0, 28.0, 11.0, 7.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2627.65576171875, -2544.605712890625, -2461.555908203125, -2378.505859375, -2295.4560546875, -2212.406005859375, -2129.356201171875, -2046.30615234375, -1963.25634765625, -1880.2064208984375, -1797.156494140625, -1714.1065673828125, -1631.056640625, -1548.0067138671875, -1464.956787109375, -1381.90673828125, -1298.8568115234375, -1215.806884765625, -1132.7569580078125, -1049.70703125, -966.6571044921875, -883.607177734375, -800.5571899414062, -717.5072631835938, -634.4573364257812, -551.4074096679688, -468.35748291015625, -385.3075256347656, -302.2575988769531, -219.20767211914062, -136.15771484375, -53.1077880859375, 29.942138671875, 112.99207305908203, 196.04200744628906, 279.0919494628906, 362.1418762207031, 445.1918029785156, 528.2417602539062, 611.2916870117188, 694.3416137695312, 777.3915405273438, 860.4414672851562, 943.491455078125, 1026.5413818359375, 1109.59130859375, 1192.6412353515625, 1275.691162109375, 1358.7410888671875, 1441.791015625, 1524.8409423828125, 1607.890869140625, 1690.9407958984375, 1773.99072265625, 1857.040771484375, 1940.090576171875, 2023.140625, 2106.190673828125, 2189.240478515625, 2272.29052734375, 2355.34033203125, 2438.390380859375, 2521.440185546875, 2604.490234375, 2687.5400390625]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 10.0, 6.0, 10.0, 6.0, 13.0, 12.0, 20.0, 18.0, 22.0, 26.0, 34.0, 33.0, 45.0, 29.0, 60.0, 62.0, 88.0, 69.0, 72.0, 58.0, 41.0, 39.0, 28.0, 39.0, 22.0, 23.0, 20.0, 16.0, 17.0, 17.0, 6.0, 12.0, 8.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-700.0050048828125, -673.2182006835938, -646.431396484375, -619.6445922851562, -592.8577880859375, -566.0709228515625, -539.2841796875, -512.497314453125, -485.71051025390625, -458.9237060546875, -432.13690185546875, -405.35009765625, -378.5632629394531, -351.7764587402344, -324.9896545410156, -298.20281982421875, -271.4160461425781, -244.62924194335938, -217.84242248535156, -191.0556182861328, -164.268798828125, -137.48199462890625, -110.6951904296875, -83.90837097167969, -57.12156677246094, -30.33475685119629, -3.5479469299316406, 23.238861083984375, 50.025672912597656, 76.81248474121094, 103.59928894042969, 130.3861083984375, 157.17291259765625, 183.959716796875, 210.7465362548828, 237.53334045410156, 264.3201599121094, 291.1069641113281, 317.8937683105469, 344.68060302734375, 371.4674072265625, 398.25421142578125, 425.041015625, 451.82781982421875, 478.6146545410156, 505.4014587402344, 532.188232421875, 558.97509765625, 585.7618408203125, 612.5486450195312, 639.33544921875, 666.1222534179688, 692.9090576171875, 719.6959228515625, 746.482666015625, 773.26953125, 800.0563354492188, 826.8431396484375, 853.6299438476562, 880.416748046875, 907.2035522460938, 933.9903564453125, 960.7772216796875, 987.5640258789062, 1014.350830078125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 14.0, 12.0, 12.0, 26.0, 42.0, 76.0, 111.0, 223.0, 308.0, 503.0, 880.0, 1695.0, 3968.0, 12777.0, 90189.0, 3363310.0, 672575.0, 34947.0, 7204.0, 2595.0, 1189.0, 636.0, 358.0, 224.0, 121.0, 88.0, 62.0, 31.0, 35.0, 17.0, 14.0, 9.0, 9.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-114.4375, -110.5947265625, -106.751953125, -102.9091796875, -99.06640625, -95.2236328125, -91.380859375, -87.5380859375, -83.6953125, -79.8525390625, -76.009765625, -72.1669921875, -68.32421875, -64.4814453125, -60.638671875, -56.7958984375, -52.953125, -49.1103515625, -45.267578125, -41.4248046875, -37.58203125, -33.7392578125, -29.896484375, -26.0537109375, -22.2109375, -18.3681640625, -14.525390625, -10.6826171875, -6.83984375, -2.9970703125, 0.845703125, 4.6884765625, 8.53125, 12.3740234375, 16.216796875, 20.0595703125, 23.90234375, 27.7451171875, 31.587890625, 35.4306640625, 39.2734375, 43.1162109375, 46.958984375, 50.8017578125, 54.64453125, 58.4873046875, 62.330078125, 66.1728515625, 70.015625, 73.8583984375, 77.701171875, 81.5439453125, 85.38671875, 89.2294921875, 93.072265625, 96.9150390625, 100.7578125, 104.6005859375, 108.443359375, 112.2861328125, 116.12890625, 119.9716796875, 123.814453125, 127.6572265625, 131.5]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 7.0, 2.0, 5.0, 7.0, 7.0, 9.0, 10.0, 11.0, 15.0, 16.0, 27.0, 37.0, 33.0, 40.0, 37.0, 60.0, 54.0, 64.0, 101.0, 73.0, 72.0, 47.0, 48.0, 40.0, 36.0, 32.0, 24.0, 21.0, 14.0, 12.0, 4.0, 11.0, 10.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-50.21875, -48.76171875, -47.3046875, -45.84765625, -44.390625, -42.93359375, -41.4765625, -40.01953125, -38.5625, -37.10546875, -35.6484375, -34.19140625, -32.734375, -31.27734375, -29.8203125, -28.36328125, -26.90625, -25.44921875, -23.9921875, -22.53515625, -21.078125, -19.62109375, -18.1640625, -16.70703125, -15.25, -13.79296875, -12.3359375, -10.87890625, -9.421875, -7.96484375, -6.5078125, -5.05078125, -3.59375, -2.13671875, -0.6796875, 0.77734375, 2.234375, 3.69140625, 5.1484375, 6.60546875, 8.0625, 9.51953125, 10.9765625, 12.43359375, 13.890625, 15.34765625, 16.8046875, 18.26171875, 19.71875, 21.17578125, 22.6328125, 24.08984375, 25.546875, 27.00390625, 28.4609375, 29.91796875, 31.375, 32.83203125, 34.2890625, 35.74609375, 37.203125, 38.66015625, 40.1171875, 41.57421875, 43.03125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 7.0, 10.0, 10.0, 31.0, 37.0, 86.0, 171.0, 361.0, 775.0, 3883.0, 4171266.0, 15896.0, 922.0, 363.0, 178.0, 106.0, 54.0, 26.0, 36.0, 23.0, 17.0, 6.0, 6.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-894.0, -857.765625, -821.53125, -785.296875, -749.0625, -712.828125, -676.59375, -640.359375, -604.125, -567.890625, -531.65625, -495.421875, -459.1875, -422.953125, -386.71875, -350.484375, -314.25, -278.015625, -241.78125, -205.546875, -169.3125, -133.078125, -96.84375, -60.609375, -24.375, 11.859375, 48.09375, 84.328125, 120.5625, 156.796875, 193.03125, 229.265625, 265.5, 301.734375, 337.96875, 374.203125, 410.4375, 446.671875, 482.90625, 519.140625, 555.375, 591.609375, 627.84375, 664.078125, 700.3125, 736.546875, 772.78125, 809.015625, 845.25, 881.484375, 917.71875, 953.953125, 990.1875, 1026.421875, 1062.65625, 1098.890625, 1135.125, 1171.359375, 1207.59375, 1243.828125, 1280.0625, 1316.296875, 1352.53125, 1388.765625, 1425.0]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 8.0, 21.0, 105.0, 2801.0, 1030.0, 78.0, 17.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-646.0, -622.8125, -599.625, -576.4375, -553.25, -530.0625, -506.875, -483.6875, -460.5, -437.3125, -414.125, -390.9375, -367.75, -344.5625, -321.375, -298.1875, -275.0, -251.8125, -228.625, -205.4375, -182.25, -159.0625, -135.875, -112.6875, -89.5, -66.3125, -43.125, -19.9375, 3.25, 26.4375, 49.625, 72.8125, 96.0, 119.1875, 142.375, 165.5625, 188.75, 211.9375, 235.125, 258.3125, 281.5, 304.6875, 327.875, 351.0625, 374.25, 397.4375, 420.625, 443.8125, 467.0, 490.1875, 513.375, 536.5625, 559.75, 582.9375, 606.125, 629.3125, 652.5, 675.6875, 698.875, 722.0625, 745.25, 768.4375, 791.625, 814.8125, 838.0]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 15.0, 34.0, 119.0, 427.0, 285.0, 76.0, 21.0, 9.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4234.72314453125, -4082.369384765625, -3930.015869140625, -3777.662109375, -3625.30859375, -3472.954833984375, -3320.60107421875, -3168.24755859375, -3015.893798828125, -2863.5400390625, -2711.1865234375, -2558.832763671875, -2406.47900390625, -2254.12548828125, -2101.771728515625, -1949.4180908203125, -1797.064453125, -1644.7108154296875, -1492.357177734375, -1340.00341796875, -1187.6497802734375, -1035.296142578125, -882.9424438476562, -730.5887451171875, -578.235107421875, -425.8814392089844, -273.52777099609375, -121.17410278320312, 31.1795654296875, 183.533203125, 335.88690185546875, 488.2406005859375, 640.59375, 792.9473876953125, 945.3010864257812, 1097.65478515625, 1250.0084228515625, 1402.362060546875, 1554.7158203125, 1707.0694580078125, 1859.423095703125, 2011.7767333984375, 2164.13037109375, 2316.484130859375, 2468.837890625, 2621.19140625, 2773.545166015625, 2925.89892578125, 3078.25244140625, 3230.606201171875, 3382.959716796875, 3535.3134765625, 3687.6669921875, 3840.020751953125, 3992.37451171875, 4144.72802734375, 4297.08203125, 4449.435546875, 4601.78955078125, 4754.14306640625, 4906.49658203125, 5058.8505859375, 5211.2041015625, 5363.5576171875, 5515.9111328125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 14.0, 8.0, 18.0, 22.0, 39.0, 48.0, 39.0, 62.0, 73.0, 95.0, 76.0, 91.0, 84.0, 72.0, 70.0, 50.0, 42.0, 51.0, 17.0, 9.0, 13.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1225.6424560546875, -1176.6087646484375, -1127.5750732421875, -1078.5413818359375, -1029.507568359375, -980.4739379882812, -931.440185546875, -882.406494140625, -833.372802734375, -784.339111328125, -735.305419921875, -686.2716674804688, -637.2379760742188, -588.2042846679688, -539.1705322265625, -490.1368408203125, -441.1031494140625, -392.0694580078125, -343.0357360839844, -294.00201416015625, -244.96832275390625, -195.9346160888672, -146.90090942382812, -97.8671875, -48.83349609375, 0.2002105712890625, 49.233917236328125, 98.26762390136719, 147.30133056640625, 196.3350372314453, 245.36874389648438, 294.4024658203125, 343.43603515625, 392.4697265625, 441.5034484863281, 490.53717041015625, 539.5708618164062, 588.6045532226562, 637.6383056640625, 686.6719970703125, 735.7056884765625, 784.7393798828125, 833.7730712890625, 882.8068237304688, 931.8405151367188, 980.8742065429688, 1029.907958984375, 1078.941650390625, 1127.975341796875, 1177.009033203125, 1226.042724609375, 1275.076416015625, 1324.110107421875, 1373.1439208984375, 1422.1776123046875, 1471.2113037109375, 1520.2449951171875, 1569.2786865234375, 1618.3123779296875, 1667.3460693359375, 1716.3798828125, 1765.41357421875, 1814.447265625, 1863.48095703125, 1912.5146484375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 4.0, 8.0, 13.0, 12.0, 24.0, 45.0, 40.0, 72.0, 96.0, 175.0, 300.0, 485.0, 848.0, 1442.0, 2655.0, 5099.0, 10301.0, 22205.0, 54089.0, 159791.0, 423953.0, 235967.0, 75104.0, 28995.0, 12844.0, 6366.0, 3218.0, 1826.0, 1020.0, 601.0, 341.0, 226.0, 145.0, 78.0, 50.0, 45.0, 24.0, 15.0, 12.0, 7.0, 3.0, 4.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.9375, -68.373046875, -65.80859375, -63.244140625, -60.6796875, -58.115234375, -55.55078125, -52.986328125, -50.421875, -47.857421875, -45.29296875, -42.728515625, -40.1640625, -37.599609375, -35.03515625, -32.470703125, -29.90625, -27.341796875, -24.77734375, -22.212890625, -19.6484375, -17.083984375, -14.51953125, -11.955078125, -9.390625, -6.826171875, -4.26171875, -1.697265625, 0.8671875, 3.431640625, 5.99609375, 8.560546875, 11.125, 13.689453125, 16.25390625, 18.818359375, 21.3828125, 23.947265625, 26.51171875, 29.076171875, 31.640625, 34.205078125, 36.76953125, 39.333984375, 41.8984375, 44.462890625, 47.02734375, 49.591796875, 52.15625, 54.720703125, 57.28515625, 59.849609375, 62.4140625, 64.978515625, 67.54296875, 70.107421875, 72.671875, 75.236328125, 77.80078125, 80.365234375, 82.9296875, 85.494140625, 88.05859375, 90.623046875, 93.1875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 10.0, 14.0, 11.0, 21.0, 21.0, 31.0, 37.0, 32.0, 45.0, 47.0, 58.0, 52.0, 65.0, 54.0, 68.0, 71.0, 57.0, 39.0, 45.0, 46.0, 31.0, 26.0, 22.0, 15.0, 17.0, 14.0, 9.0, 10.0, 8.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.5, -52.28515625, -50.0703125, -47.85546875, -45.640625, -43.42578125, -41.2109375, -38.99609375, -36.78125, -34.56640625, -32.3515625, -30.13671875, -27.921875, -25.70703125, -23.4921875, -21.27734375, -19.0625, -16.84765625, -14.6328125, -12.41796875, -10.203125, -7.98828125, -5.7734375, -3.55859375, -1.34375, 0.87109375, 3.0859375, 5.30078125, 7.515625, 9.73046875, 11.9453125, 14.16015625, 16.375, 18.58984375, 20.8046875, 23.01953125, 25.234375, 27.44921875, 29.6640625, 31.87890625, 34.09375, 36.30859375, 38.5234375, 40.73828125, 42.953125, 45.16796875, 47.3828125, 49.59765625, 51.8125, 54.02734375, 56.2421875, 58.45703125, 60.671875, 62.88671875, 65.1015625, 67.31640625, 69.53125, 71.74609375, 73.9609375, 76.17578125, 78.390625, 80.60546875, 82.8203125, 85.03515625, 87.25]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 5.0, 4.0, 5.0, 14.0, 8.0, 15.0, 23.0, 34.0, 42.0, 75.0, 119.0, 227.0, 452.0, 982.0, 2687.0, 8390.0, 37452.0, 331683.0, 603399.0, 47891.0, 9937.0, 2858.0, 1131.0, 485.0, 235.0, 143.0, 84.0, 51.0, 34.0, 34.0, 12.0, 18.0, 8.0, 4.0, 6.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-222.875, -216.134765625, -209.39453125, -202.654296875, -195.9140625, -189.173828125, -182.43359375, -175.693359375, -168.953125, -162.212890625, -155.47265625, -148.732421875, -141.9921875, -135.251953125, -128.51171875, -121.771484375, -115.03125, -108.291015625, -101.55078125, -94.810546875, -88.0703125, -81.330078125, -74.58984375, -67.849609375, -61.109375, -54.369140625, -47.62890625, -40.888671875, -34.1484375, -27.408203125, -20.66796875, -13.927734375, -7.1875, -0.447265625, 6.29296875, 13.033203125, 19.7734375, 26.513671875, 33.25390625, 39.994140625, 46.734375, 53.474609375, 60.21484375, 66.955078125, 73.6953125, 80.435546875, 87.17578125, 93.916015625, 100.65625, 107.396484375, 114.13671875, 120.876953125, 127.6171875, 134.357421875, 141.09765625, 147.837890625, 154.578125, 161.318359375, 168.05859375, 174.798828125, 181.5390625, 188.279296875, 195.01953125, 201.759765625, 208.5]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 6.0, 6.0, 7.0, 9.0, 8.0, 11.0, 15.0, 20.0, 24.0, 26.0, 28.0, 23.0, 35.0, 39.0, 49.0, 49.0, 39.0, 45.0, 53.0, 47.0, 47.0, 57.0, 45.0, 39.0, 48.0, 37.0, 19.0, 31.0, 29.0, 17.0, 15.0, 16.0, 16.0, 8.0, 8.0, 4.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-280.25, -271.91796875, -263.5859375, -255.25390625, -246.921875, -238.58984375, -230.2578125, -221.92578125, -213.59375, -205.26171875, -196.9296875, -188.59765625, -180.265625, -171.93359375, -163.6015625, -155.26953125, -146.9375, -138.60546875, -130.2734375, -121.94140625, -113.609375, -105.27734375, -96.9453125, -88.61328125, -80.28125, -71.94921875, -63.6171875, -55.28515625, -46.953125, -38.62109375, -30.2890625, -21.95703125, -13.625, -5.29296875, 3.0390625, 11.37109375, 19.703125, 28.03515625, 36.3671875, 44.69921875, 53.03125, 61.36328125, 69.6953125, 78.02734375, 86.359375, 94.69140625, 103.0234375, 111.35546875, 119.6875, 128.01953125, 136.3515625, 144.68359375, 153.015625, 161.34765625, 169.6796875, 178.01171875, 186.34375, 194.67578125, 203.0078125, 211.33984375, 219.671875, 228.00390625, 236.3359375, 244.66796875, 253.0]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 6.0, 6.0, 12.0, 16.0, 20.0, 27.0, 35.0, 58.0, 67.0, 132.0, 207.0, 277.0, 433.0, 731.0, 1372.0, 2771.0, 8268.0, 47118.0, 775685.0, 184103.0, 18104.0, 4553.0, 1863.0, 978.0, 612.0, 353.0, 212.0, 172.0, 104.0, 62.0, 48.0, 43.0, 30.0, 16.0, 12.0, 12.0, 2.0, 8.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-101.3125, -98.2197265625, -95.126953125, -92.0341796875, -88.94140625, -85.8486328125, -82.755859375, -79.6630859375, -76.5703125, -73.4775390625, -70.384765625, -67.2919921875, -64.19921875, -61.1064453125, -58.013671875, -54.9208984375, -51.828125, -48.7353515625, -45.642578125, -42.5498046875, -39.45703125, -36.3642578125, -33.271484375, -30.1787109375, -27.0859375, -23.9931640625, -20.900390625, -17.8076171875, -14.71484375, -11.6220703125, -8.529296875, -5.4365234375, -2.34375, 0.7490234375, 3.841796875, 6.9345703125, 10.02734375, 13.1201171875, 16.212890625, 19.3056640625, 22.3984375, 25.4912109375, 28.583984375, 31.6767578125, 34.76953125, 37.8623046875, 40.955078125, 44.0478515625, 47.140625, 50.2333984375, 53.326171875, 56.4189453125, 59.51171875, 62.6044921875, 65.697265625, 68.7900390625, 71.8828125, 74.9755859375, 78.068359375, 81.1611328125, 84.25390625, 87.3466796875, 90.439453125, 93.5322265625, 96.625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 7.0, 5.0, 4.0, 27.0, 62.0, 228.0, 425.0, 148.0, 57.0, 17.0, 11.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.1083984375, -0.10601091384887695, -0.1036233901977539, -0.10123586654663086, -0.09884834289550781, -0.09646081924438477, -0.09407329559326172, -0.09168577194213867, -0.08929824829101562, -0.08691072463989258, -0.08452320098876953, -0.08213567733764648, -0.07974815368652344, -0.07736063003540039, -0.07497310638427734, -0.0725855827331543, -0.07019805908203125, -0.0678105354309082, -0.06542301177978516, -0.06303548812866211, -0.06064796447753906, -0.058260440826416016, -0.05587291717529297, -0.05348539352416992, -0.051097869873046875, -0.04871034622192383, -0.04632282257080078, -0.043935298919677734, -0.04154777526855469, -0.03916025161743164, -0.036772727966308594, -0.03438520431518555, -0.0319976806640625, -0.029610157012939453, -0.027222633361816406, -0.02483510971069336, -0.022447586059570312, -0.020060062408447266, -0.01767253875732422, -0.015285015106201172, -0.012897491455078125, -0.010509967803955078, -0.008122444152832031, -0.005734920501708984, -0.0033473968505859375, -0.0009598731994628906, 0.0014276504516601562, 0.003815174102783203, 0.00620269775390625, 0.008590221405029297, 0.010977745056152344, 0.01336526870727539, 0.015752792358398438, 0.018140316009521484, 0.02052783966064453, 0.022915363311767578, 0.025302886962890625, 0.027690410614013672, 0.03007793426513672, 0.032465457916259766, 0.03485298156738281, 0.03724050521850586, 0.039628028869628906, 0.04201555252075195, 0.044403076171875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 13.0, 8.0, 14.0, 24.0, 36.0, 60.0, 114.0, 205.0, 394.0, 833.0, 1999.0, 5467.0, 23425.0, 277060.0, 689811.0, 37213.0, 7334.0, 2478.0, 1062.0, 470.0, 246.0, 114.0, 56.0, 44.0, 26.0, 18.0, 9.0, 6.0, 7.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.5625, -111.390625, -108.21875, -105.046875, -101.875, -98.703125, -95.53125, -92.359375, -89.1875, -86.015625, -82.84375, -79.671875, -76.5, -73.328125, -70.15625, -66.984375, -63.8125, -60.640625, -57.46875, -54.296875, -51.125, -47.953125, -44.78125, -41.609375, -38.4375, -35.265625, -32.09375, -28.921875, -25.75, -22.578125, -19.40625, -16.234375, -13.0625, -9.890625, -6.71875, -3.546875, -0.375, 2.796875, 5.96875, 9.140625, 12.3125, 15.484375, 18.65625, 21.828125, 25.0, 28.171875, 31.34375, 34.515625, 37.6875, 40.859375, 44.03125, 47.203125, 50.375, 53.546875, 56.71875, 59.890625, 63.0625, 66.234375, 69.40625, 72.578125, 75.75, 78.921875, 82.09375, 85.265625, 88.4375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 2.0, 13.0, 8.0, 13.0, 17.0, 34.0, 54.0, 74.0, 109.0, 144.0, 148.0, 126.0, 83.0, 55.0, 42.0, 29.0, 17.0, 7.0, 3.0, 2.0, 5.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-115.1875, -112.1796875, -109.171875, -106.1640625, -103.15625, -100.1484375, -97.140625, -94.1328125, -91.125, -88.1171875, -85.109375, -82.1015625, -79.09375, -76.0859375, -73.078125, -70.0703125, -67.0625, -64.0546875, -61.046875, -58.0390625, -55.03125, -52.0234375, -49.015625, -46.0078125, -43.0, -39.9921875, -36.984375, -33.9765625, -30.96875, -27.9609375, -24.953125, -21.9453125, -18.9375, -15.9296875, -12.921875, -9.9140625, -6.90625, -3.8984375, -0.890625, 2.1171875, 5.125, 8.1328125, 11.140625, 14.1484375, 17.15625, 20.1640625, 23.171875, 26.1796875, 29.1875, 32.1953125, 35.203125, 38.2109375, 41.21875, 44.2265625, 47.234375, 50.2421875, 53.25, 56.2578125, 59.265625, 62.2734375, 65.28125, 68.2890625, 71.296875, 74.3046875, 77.3125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 10.0, 17.0, 30.0, 98.0, 228.0, 386.0, 147.0, 45.0, 24.0, 8.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2199.96875, -2113.217041015625, -2026.465087890625, -1939.71337890625, -1852.9615478515625, -1766.209716796875, -1679.4580078125, -1592.7061767578125, -1505.954345703125, -1419.2025146484375, -1332.45068359375, -1245.698974609375, -1158.9471435546875, -1072.1953125, -985.4435424804688, -898.6917724609375, -811.93994140625, -725.1881103515625, -638.4363403320312, -551.6845703125, -464.9327392578125, -378.1809387207031, -291.42913818359375, -204.6773681640625, -117.925537109375, -31.173736572265625, 55.57806396484375, 142.32986450195312, 229.0816650390625, 315.8334655761719, 402.58526611328125, 489.3370361328125, 576.0888671875, 662.8406982421875, 749.5924682617188, 836.34423828125, 923.0960693359375, 1009.847900390625, 1096.599609375, 1183.3514404296875, 1270.103271484375, 1356.8551025390625, 1443.60693359375, 1530.358642578125, 1617.1104736328125, 1703.8623046875, 1790.614013671875, 1877.3658447265625, 1964.11767578125, 2050.869384765625, 2137.621337890625, 2224.373046875, 2311.125, 2397.876708984375, 2484.62841796875, 2571.38037109375, 2658.132080078125, 2744.8837890625, 2831.6357421875, 2918.387451171875, 3005.13916015625, 3091.89111328125, 3178.642822265625, 3265.39453125, 3352.146484375]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 5.0, 6.0, 8.0, 8.0, 12.0, 13.0, 17.0, 18.0, 14.0, 17.0, 24.0, 18.0, 22.0, 28.0, 34.0, 30.0, 44.0, 44.0, 52.0, 61.0, 53.0, 50.0, 52.0, 40.0, 26.0, 28.0, 27.0, 32.0, 17.0, 15.0, 31.0, 22.0, 16.0, 15.0, 14.0, 10.0, 11.0, 5.0, 9.0, 9.0, 6.0, 1.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0], "bins": [-1008.56005859375, -977.6911010742188, -946.8220825195312, -915.953125, -885.0841674804688, -854.2152099609375, -823.34619140625, -792.4772338867188, -761.6082763671875, -730.7393188476562, -699.8703002929688, -669.0013427734375, -638.1323852539062, -607.263427734375, -576.3944091796875, -545.5254516601562, -514.656494140625, -483.7875061035156, -452.9185485839844, -422.049560546875, -391.18060302734375, -360.3116149902344, -329.442626953125, -298.57366943359375, -267.70465087890625, -236.83567810058594, -205.96670532226562, -175.09771728515625, -144.228759765625, -113.35977172851562, -82.49079895019531, -51.621826171875, -20.75286865234375, 10.116106033325195, 40.98508071899414, 71.85405731201172, 102.72303009033203, 133.59201049804688, 164.4609832763672, 195.3299560546875, 226.1989288330078, 257.0679016113281, 287.9368896484375, 318.80584716796875, 349.6748352050781, 380.5438232421875, 411.41278076171875, 442.28173828125, 473.1507263183594, 504.01971435546875, 534.888671875, 565.7576293945312, 596.6266479492188, 627.49560546875, 658.3645629882812, 689.2335205078125, 720.1025390625, 750.9714965820312, 781.8405151367188, 812.70947265625, 843.5784301757812, 874.4473876953125, 905.31640625, 936.1853637695312, 967.0543212890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 7.0, 4.0, 13.0, 17.0, 14.0, 17.0, 34.0, 43.0, 61.0, 94.0, 130.0, 184.0, 302.0, 492.0, 780.0, 1453.0, 3249.0, 8845.0, 42744.0, 409964.0, 3339297.0, 331546.0, 40078.0, 8410.0, 2989.0, 1429.0, 777.0, 430.0, 307.0, 172.0, 120.0, 82.0, 64.0, 31.0, 28.0, 21.0, 14.0, 9.0, 9.0, 8.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-98.5, -95.2666015625, -92.033203125, -88.7998046875, -85.56640625, -82.3330078125, -79.099609375, -75.8662109375, -72.6328125, -69.3994140625, -66.166015625, -62.9326171875, -59.69921875, -56.4658203125, -53.232421875, -49.9990234375, -46.765625, -43.5322265625, -40.298828125, -37.0654296875, -33.83203125, -30.5986328125, -27.365234375, -24.1318359375, -20.8984375, -17.6650390625, -14.431640625, -11.1982421875, -7.96484375, -4.7314453125, -1.498046875, 1.7353515625, 4.96875, 8.2021484375, 11.435546875, 14.6689453125, 17.90234375, 21.1357421875, 24.369140625, 27.6025390625, 30.8359375, 34.0693359375, 37.302734375, 40.5361328125, 43.76953125, 47.0029296875, 50.236328125, 53.4697265625, 56.703125, 59.9365234375, 63.169921875, 66.4033203125, 69.63671875, 72.8701171875, 76.103515625, 79.3369140625, 82.5703125, 85.8037109375, 89.037109375, 92.2705078125, 95.50390625, 98.7373046875, 101.970703125, 105.2041015625, 108.4375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 1.0, 9.0, 5.0, 11.0, 13.0, 24.0, 25.0, 38.0, 28.0, 43.0, 45.0, 40.0, 62.0, 52.0, 71.0, 70.0, 71.0, 63.0, 48.0, 47.0, 41.0, 45.0, 29.0, 21.0, 25.0, 16.0, 12.0, 15.0, 5.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.75, -69.376953125, -67.00390625, -64.630859375, -62.2578125, -59.884765625, -57.51171875, -55.138671875, -52.765625, -50.392578125, -48.01953125, -45.646484375, -43.2734375, -40.900390625, -38.52734375, -36.154296875, -33.78125, -31.408203125, -29.03515625, -26.662109375, -24.2890625, -21.916015625, -19.54296875, -17.169921875, -14.796875, -12.423828125, -10.05078125, -7.677734375, -5.3046875, -2.931640625, -0.55859375, 1.814453125, 4.1875, 6.560546875, 8.93359375, 11.306640625, 13.6796875, 16.052734375, 18.42578125, 20.798828125, 23.171875, 25.544921875, 27.91796875, 30.291015625, 32.6640625, 35.037109375, 37.41015625, 39.783203125, 42.15625, 44.529296875, 46.90234375, 49.275390625, 51.6484375, 54.021484375, 56.39453125, 58.767578125, 61.140625, 63.513671875, 65.88671875, 68.259765625, 70.6328125, 73.005859375, 75.37890625, 77.751953125, 80.125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 19.0, 39.0, 112.0, 267.0, 1405.0, 2400377.0, 1790205.0, 1375.0, 292.0, 111.0, 42.0, 16.0, 11.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1317.0, -1284.875, -1252.75, -1220.625, -1188.5, -1156.375, -1124.25, -1092.125, -1060.0, -1027.875, -995.75, -963.625, -931.5, -899.375, -867.25, -835.125, -803.0, -770.875, -738.75, -706.625, -674.5, -642.375, -610.25, -578.125, -546.0, -513.875, -481.75, -449.625, -417.5, -385.375, -353.25, -321.125, -289.0, -256.875, -224.75, -192.625, -160.5, -128.375, -96.25, -64.125, -32.0, 0.125, 32.25, 64.375, 96.5, 128.625, 160.75, 192.875, 225.0, 257.125, 289.25, 321.375, 353.5, 385.625, 417.75, 449.875, 482.0, 514.125, 546.25, 578.375, 610.5, 642.625, 674.75, 706.875, 739.0]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 3.0, 6.0, 12.0, 27.0, 42.0, 136.0, 740.0, 2208.0, 671.0, 120.0, 48.0, 23.0, 13.0, 10.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.5, -192.1171875, -181.734375, -171.3515625, -160.96875, -150.5859375, -140.203125, -129.8203125, -119.4375, -109.0546875, -98.671875, -88.2890625, -77.90625, -67.5234375, -57.140625, -46.7578125, -36.375, -25.9921875, -15.609375, -5.2265625, 5.15625, 15.5390625, 25.921875, 36.3046875, 46.6875, 57.0703125, 67.453125, 77.8359375, 88.21875, 98.6015625, 108.984375, 119.3671875, 129.75, 140.1328125, 150.515625, 160.8984375, 171.28125, 181.6640625, 192.046875, 202.4296875, 212.8125, 223.1953125, 233.578125, 243.9609375, 254.34375, 264.7265625, 275.109375, 285.4921875, 295.875, 306.2578125, 316.640625, 327.0234375, 337.40625, 347.7890625, 358.171875, 368.5546875, 378.9375, 389.3203125, 399.703125, 410.0859375, 420.46875, 430.8515625, 441.234375, 451.6171875, 462.0]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 13.0, 21.0, 38.0, 54.0, 100.0, 123.0, 163.0, 148.0, 122.0, 95.0, 44.0, 30.0, 13.0, 10.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-743.2432861328125, -709.4435424804688, -675.643798828125, -641.8440551757812, -608.0443115234375, -574.2445678710938, -540.44482421875, -506.64508056640625, -472.8453369140625, -439.04559326171875, -405.245849609375, -371.44610595703125, -337.6463623046875, -303.84661865234375, -270.046875, -236.24713134765625, -202.4473876953125, -168.64764404296875, -134.847900390625, -101.04815673828125, -67.2484130859375, -33.44866943359375, 0.35107421875, 34.15081787109375, 67.9505615234375, 101.75030517578125, 135.550048828125, 169.34979248046875, 203.1495361328125, 236.94927978515625, 270.7490234375, 304.54876708984375, 338.3485107421875, 372.14825439453125, 405.947998046875, 439.74774169921875, 473.5474853515625, 507.34722900390625, 541.14697265625, 574.9467163085938, 608.7464599609375, 642.5462036132812, 676.345947265625, 710.1456909179688, 743.9454345703125, 777.7451782226562, 811.544921875, 845.3446655273438, 879.1444091796875, 912.9441528320312, 946.743896484375, 980.5436401367188, 1014.3433837890625, 1048.14306640625, 1081.94287109375, 1115.74267578125, 1149.5423583984375, 1183.342041015625, 1217.141845703125, 1250.941650390625, 1284.7413330078125, 1318.541015625, 1352.3408203125, 1386.140625, 1419.9403076171875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 7.0, 7.0, 4.0, 9.0, 7.0, 7.0, 10.0, 11.0, 20.0, 20.0, 31.0, 36.0, 37.0, 31.0, 36.0, 42.0, 41.0, 40.0, 53.0, 41.0, 46.0, 41.0, 59.0, 40.0, 39.0, 30.0, 42.0, 25.0, 28.0, 22.0, 22.0, 26.0, 10.0, 21.0, 15.0, 12.0, 15.0, 6.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-597.777099609375, -580.9933471679688, -564.2095336914062, -547.42578125, -530.6420288085938, -513.8582763671875, -497.074462890625, -480.29071044921875, -463.5069274902344, -446.72314453125, -429.93939208984375, -413.1556091308594, -396.371826171875, -379.58807373046875, -362.8042907714844, -346.0205078125, -329.23675537109375, -312.4529724121094, -295.6692199707031, -278.88543701171875, -262.1016845703125, -245.31790161132812, -228.53411865234375, -211.75035095214844, -194.96658325195312, -178.1828155517578, -161.3990478515625, -144.61526489257812, -127.83149719238281, -111.0477294921875, -94.26395416259766, -77.48017883300781, -60.6964111328125, -43.91263961791992, -27.128868103027344, -10.345096588134766, 6.4386749267578125, 23.222442626953125, 40.00621795654297, 56.78999328613281, 73.57376098632812, 90.35752868652344, 107.14130401611328, 123.92507934570312, 140.70884704589844, 157.49261474609375, 174.27639770507812, 191.06016540527344, 207.84393310546875, 224.62770080566406, 241.41146850585938, 258.19525146484375, 274.97900390625, 291.7627868652344, 308.54656982421875, 325.330322265625, 342.1141052246094, 358.89788818359375, 375.681640625, 392.4654235839844, 409.24920654296875, 426.032958984375, 442.8167419433594, 459.60052490234375, 476.38427734375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 7.0, 13.0, 10.0, 14.0, 16.0, 35.0, 28.0, 52.0, 60.0, 131.0, 148.0, 210.0, 327.0, 490.0, 849.0, 1412.0, 2487.0, 4649.0, 9146.0, 19505.0, 48301.0, 147832.0, 441753.0, 245101.0, 72519.0, 27493.0, 12181.0, 5924.0, 3255.0, 1727.0, 1006.0, 649.0, 405.0, 245.0, 175.0, 126.0, 76.0, 61.0, 50.0, 28.0, 19.0, 10.0, 13.0, 3.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-76.5, -73.923828125, -71.34765625, -68.771484375, -66.1953125, -63.619140625, -61.04296875, -58.466796875, -55.890625, -53.314453125, -50.73828125, -48.162109375, -45.5859375, -43.009765625, -40.43359375, -37.857421875, -35.28125, -32.705078125, -30.12890625, -27.552734375, -24.9765625, -22.400390625, -19.82421875, -17.248046875, -14.671875, -12.095703125, -9.51953125, -6.943359375, -4.3671875, -1.791015625, 0.78515625, 3.361328125, 5.9375, 8.513671875, 11.08984375, 13.666015625, 16.2421875, 18.818359375, 21.39453125, 23.970703125, 26.546875, 29.123046875, 31.69921875, 34.275390625, 36.8515625, 39.427734375, 42.00390625, 44.580078125, 47.15625, 49.732421875, 52.30859375, 54.884765625, 57.4609375, 60.037109375, 62.61328125, 65.189453125, 67.765625, 70.341796875, 72.91796875, 75.494140625, 78.0703125, 80.646484375, 83.22265625, 85.798828125, 88.375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 7.0, 1.0, 6.0, 9.0, 15.0, 5.0, 19.0, 25.0, 30.0, 24.0, 47.0, 37.0, 51.0, 46.0, 56.0, 61.0, 71.0, 59.0, 57.0, 61.0, 50.0, 37.0, 41.0, 38.0, 21.0, 25.0, 13.0, 21.0, 19.0, 12.0, 11.0, 7.0, 8.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.3125, -80.0263671875, -77.740234375, -75.4541015625, -73.16796875, -70.8818359375, -68.595703125, -66.3095703125, -64.0234375, -61.7373046875, -59.451171875, -57.1650390625, -54.87890625, -52.5927734375, -50.306640625, -48.0205078125, -45.734375, -43.4482421875, -41.162109375, -38.8759765625, -36.58984375, -34.3037109375, -32.017578125, -29.7314453125, -27.4453125, -25.1591796875, -22.873046875, -20.5869140625, -18.30078125, -16.0146484375, -13.728515625, -11.4423828125, -9.15625, -6.8701171875, -4.583984375, -2.2978515625, -0.01171875, 2.2744140625, 4.560546875, 6.8466796875, 9.1328125, 11.4189453125, 13.705078125, 15.9912109375, 18.27734375, 20.5634765625, 22.849609375, 25.1357421875, 27.421875, 29.7080078125, 31.994140625, 34.2802734375, 36.56640625, 38.8525390625, 41.138671875, 43.4248046875, 45.7109375, 47.9970703125, 50.283203125, 52.5693359375, 54.85546875, 57.1416015625, 59.427734375, 61.7138671875, 64.0]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 5.0, 11.0, 14.0, 18.0, 28.0, 44.0, 87.0, 140.0, 349.0, 1174.0, 5924.0, 80644.0, 921521.0, 33639.0, 3556.0, 798.0, 310.0, 116.0, 52.0, 37.0, 20.0, 18.0, 9.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-339.5, -328.3203125, -317.140625, -305.9609375, -294.78125, -283.6015625, -272.421875, -261.2421875, -250.0625, -238.8828125, -227.703125, -216.5234375, -205.34375, -194.1640625, -182.984375, -171.8046875, -160.625, -149.4453125, -138.265625, -127.0859375, -115.90625, -104.7265625, -93.546875, -82.3671875, -71.1875, -60.0078125, -48.828125, -37.6484375, -26.46875, -15.2890625, -4.109375, 7.0703125, 18.25, 29.4296875, 40.609375, 51.7890625, 62.96875, 74.1484375, 85.328125, 96.5078125, 107.6875, 118.8671875, 130.046875, 141.2265625, 152.40625, 163.5859375, 174.765625, 185.9453125, 197.125, 208.3046875, 219.484375, 230.6640625, 241.84375, 253.0234375, 264.203125, 275.3828125, 286.5625, 297.7421875, 308.921875, 320.1015625, 331.28125, 342.4609375, 353.640625, 364.8203125, 376.0]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 8.0, 5.0, 4.0, 8.0, 13.0, 10.0, 20.0, 17.0, 22.0, 26.0, 33.0, 28.0, 35.0, 42.0, 52.0, 48.0, 70.0, 43.0, 54.0, 60.0, 50.0, 51.0, 56.0, 41.0, 41.0, 28.0, 25.0, 19.0, 19.0, 17.0, 15.0, 12.0, 8.0, 3.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-278.0, -269.3671875, -260.734375, -252.1015625, -243.46875, -234.8359375, -226.203125, -217.5703125, -208.9375, -200.3046875, -191.671875, -183.0390625, -174.40625, -165.7734375, -157.140625, -148.5078125, -139.875, -131.2421875, -122.609375, -113.9765625, -105.34375, -96.7109375, -88.078125, -79.4453125, -70.8125, -62.1796875, -53.546875, -44.9140625, -36.28125, -27.6484375, -19.015625, -10.3828125, -1.75, 6.8828125, 15.515625, 24.1484375, 32.78125, 41.4140625, 50.046875, 58.6796875, 67.3125, 75.9453125, 84.578125, 93.2109375, 101.84375, 110.4765625, 119.109375, 127.7421875, 136.375, 145.0078125, 153.640625, 162.2734375, 170.90625, 179.5390625, 188.171875, 196.8046875, 205.4375, 214.0703125, 222.703125, 231.3359375, 239.96875, 248.6015625, 257.234375, 265.8671875, 274.5]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 12.0, 15.0, 19.0, 33.0, 46.0, 58.0, 95.0, 153.0, 266.0, 577.0, 1336.0, 3641.0, 15277.0, 123745.0, 825730.0, 62832.0, 9900.0, 2664.0, 1060.0, 437.0, 222.0, 126.0, 91.0, 63.0, 45.0, 29.0, 24.0, 12.0, 13.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-78.125, -75.7109375, -73.296875, -70.8828125, -68.46875, -66.0546875, -63.640625, -61.2265625, -58.8125, -56.3984375, -53.984375, -51.5703125, -49.15625, -46.7421875, -44.328125, -41.9140625, -39.5, -37.0859375, -34.671875, -32.2578125, -29.84375, -27.4296875, -25.015625, -22.6015625, -20.1875, -17.7734375, -15.359375, -12.9453125, -10.53125, -8.1171875, -5.703125, -3.2890625, -0.875, 1.5390625, 3.953125, 6.3671875, 8.78125, 11.1953125, 13.609375, 16.0234375, 18.4375, 20.8515625, 23.265625, 25.6796875, 28.09375, 30.5078125, 32.921875, 35.3359375, 37.75, 40.1640625, 42.578125, 44.9921875, 47.40625, 49.8203125, 52.234375, 54.6484375, 57.0625, 59.4765625, 61.890625, 64.3046875, 66.71875, 69.1328125, 71.546875, 73.9609375, 76.375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 5.0, 14.0, 22.0, 36.0, 52.0, 141.0, 249.0, 231.0, 110.0, 61.0, 30.0, 19.0, 15.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045623779296875, -0.04450798034667969, -0.043392181396484375, -0.04227638244628906, -0.04116058349609375, -0.04004478454589844, -0.038928985595703125, -0.03781318664550781, -0.0366973876953125, -0.03558158874511719, -0.034465789794921875, -0.03334999084472656, -0.03223419189453125, -0.031118392944335938, -0.030002593994140625, -0.028886795043945312, -0.02777099609375, -0.026655197143554688, -0.025539398193359375, -0.024423599243164062, -0.02330780029296875, -0.022192001342773438, -0.021076202392578125, -0.019960403442382812, -0.0188446044921875, -0.017728805541992188, -0.016613006591796875, -0.015497207641601562, -0.01438140869140625, -0.013265609741210938, -0.012149810791015625, -0.011034011840820312, -0.009918212890625, -0.008802413940429688, -0.007686614990234375, -0.0065708160400390625, -0.00545501708984375, -0.0043392181396484375, -0.003223419189453125, -0.0021076202392578125, -0.0009918212890625, 0.0001239776611328125, 0.001239776611328125, 0.0023555755615234375, 0.00347137451171875, 0.0045871734619140625, 0.005702972412109375, 0.0068187713623046875, 0.0079345703125, 0.009050369262695312, 0.010166168212890625, 0.011281967163085938, 0.01239776611328125, 0.013513565063476562, 0.014629364013671875, 0.015745162963867188, 0.0168609619140625, 0.017976760864257812, 0.019092559814453125, 0.020208358764648438, 0.02132415771484375, 0.022439956665039062, 0.023555755615234375, 0.024671554565429688, 0.025787353515625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 3.0, 12.0, 8.0, 11.0, 18.0, 27.0, 26.0, 40.0, 54.0, 101.0, 151.0, 257.0, 417.0, 831.0, 1700.0, 4210.0, 12978.0, 67894.0, 799835.0, 129945.0, 19866.0, 5674.0, 2139.0, 1061.0, 507.0, 298.0, 158.0, 104.0, 61.0, 45.0, 30.0, 14.0, 12.0, 19.0, 8.0, 11.0, 4.0, 3.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.125, -72.7509765625, -70.376953125, -68.0029296875, -65.62890625, -63.2548828125, -60.880859375, -58.5068359375, -56.1328125, -53.7587890625, -51.384765625, -49.0107421875, -46.63671875, -44.2626953125, -41.888671875, -39.5146484375, -37.140625, -34.7666015625, -32.392578125, -30.0185546875, -27.64453125, -25.2705078125, -22.896484375, -20.5224609375, -18.1484375, -15.7744140625, -13.400390625, -11.0263671875, -8.65234375, -6.2783203125, -3.904296875, -1.5302734375, 0.84375, 3.2177734375, 5.591796875, 7.9658203125, 10.33984375, 12.7138671875, 15.087890625, 17.4619140625, 19.8359375, 22.2099609375, 24.583984375, 26.9580078125, 29.33203125, 31.7060546875, 34.080078125, 36.4541015625, 38.828125, 41.2021484375, 43.576171875, 45.9501953125, 48.32421875, 50.6982421875, 53.072265625, 55.4462890625, 57.8203125, 60.1943359375, 62.568359375, 64.9423828125, 67.31640625, 69.6904296875, 72.064453125, 74.4384765625, 76.8125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 1.0, 4.0, 1.0, 3.0, 8.0, 4.0, 11.0, 8.0, 6.0, 16.0, 26.0, 25.0, 50.0, 68.0, 68.0, 101.0, 131.0, 136.0, 94.0, 69.0, 39.0, 26.0, 21.0, 19.0, 11.0, 6.0, 8.0, 8.0, 12.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-61.34375, -59.529296875, -57.71484375, -55.900390625, -54.0859375, -52.271484375, -50.45703125, -48.642578125, -46.828125, -45.013671875, -43.19921875, -41.384765625, -39.5703125, -37.755859375, -35.94140625, -34.126953125, -32.3125, -30.498046875, -28.68359375, -26.869140625, -25.0546875, -23.240234375, -21.42578125, -19.611328125, -17.796875, -15.982421875, -14.16796875, -12.353515625, -10.5390625, -8.724609375, -6.91015625, -5.095703125, -3.28125, -1.466796875, 0.34765625, 2.162109375, 3.9765625, 5.791015625, 7.60546875, 9.419921875, 11.234375, 13.048828125, 14.86328125, 16.677734375, 18.4921875, 20.306640625, 22.12109375, 23.935546875, 25.75, 27.564453125, 29.37890625, 31.193359375, 33.0078125, 34.822265625, 36.63671875, 38.451171875, 40.265625, 42.080078125, 43.89453125, 45.708984375, 47.5234375, 49.337890625, 51.15234375, 52.966796875, 54.78125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 9.0, 25.0, 110.0, 533.0, 269.0, 38.0, 15.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-933.4581909179688, -812.8829956054688, -692.3077392578125, -571.7325439453125, -451.1573486328125, -330.5821533203125, -210.00689697265625, -89.43170166015625, 31.14349365234375, 151.7187042236328, 272.2939147949219, 392.869140625, 513.4443359375, 634.01953125, 754.5947875976562, 875.1699829101562, 995.7451782226562, 1116.3204345703125, 1236.8956298828125, 1357.4708251953125, 1478.0460205078125, 1598.6212158203125, 1719.196533203125, 1839.771728515625, 1960.346923828125, 2080.922119140625, 2201.497314453125, 2322.072509765625, 2442.647705078125, 2563.222900390625, 2683.79833984375, 2804.37353515625, 2924.94873046875, 3045.52392578125, 3166.09912109375, 3286.67431640625, 3407.24951171875, 3527.82470703125, 3648.39990234375, 3768.97509765625, 3889.55029296875, 4010.12548828125, 4130.70068359375, 4251.27587890625, 4371.85107421875, 4492.42626953125, 4613.00146484375, 4733.57666015625, 4854.15234375, 4974.7275390625, 5095.302734375, 5215.8779296875, 5336.453125, 5457.0283203125, 5577.603515625, 5698.1787109375, 5818.75390625, 5939.3291015625, 6059.904296875, 6180.4794921875, 6301.0546875, 6421.6298828125, 6542.205078125, 6662.7802734375, 6783.35546875]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 5.0, 1.0, 10.0, 6.0, 10.0, 6.0, 12.0, 13.0, 19.0, 23.0, 12.0, 24.0, 36.0, 34.0, 32.0, 29.0, 53.0, 63.0, 92.0, 104.0, 76.0, 37.0, 39.0, 26.0, 31.0, 19.0, 25.0, 26.0, 21.0, 17.0, 13.0, 13.0, 12.0, 14.0, 10.0, 7.0, 4.0, 1.0, 3.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1055.872802734375, -1024.9217529296875, -993.9706420898438, -963.01953125, -932.0684204101562, -901.1173706054688, -870.166259765625, -839.2152099609375, -808.2640991210938, -777.31298828125, -746.3619384765625, -715.4108276367188, -684.459716796875, -653.5086669921875, -622.5575561523438, -591.6064453125, -560.6553955078125, -529.7042846679688, -498.7532043457031, -467.8021240234375, -436.8510437011719, -405.89996337890625, -374.9488525390625, -343.9977722167969, -313.046630859375, -282.0955505371094, -251.1444549560547, -220.193359375, -189.24227905273438, -158.2911834716797, -127.340087890625, -96.38900756835938, -65.43792724609375, -34.486839294433594, -3.535747528076172, 27.41534423828125, 58.366432189941406, 89.31752014160156, 120.26861572265625, 151.21969604492188, 182.17079162597656, 213.12188720703125, 244.07296752929688, 275.0240478515625, 305.97515869140625, 336.9262390136719, 367.8773193359375, 398.82843017578125, 429.7795104980469, 460.7305908203125, 491.68170166015625, 522.6328125, 553.5838623046875, 584.5349731445312, 615.486083984375, 646.4371337890625, 677.3882446289062, 708.33935546875, 739.2904052734375, 770.2415161132812, 801.192626953125, 832.1436767578125, 863.0947875976562, 894.0458984375, 924.9969482421875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 6.0, 4.0, 5.0, 12.0, 6.0, 9.0, 8.0, 4.0, 12.0, 21.0, 18.0, 32.0, 29.0, 63.0, 90.0, 124.0, 229.0, 509.0, 1177.0, 4040.0, 28972.0, 3040370.0, 1096719.0, 16536.0, 3125.0, 1036.0, 466.0, 233.0, 129.0, 91.0, 53.0, 40.0, 30.0, 18.0, 9.0, 12.0, 13.0, 9.0, 5.0, 6.0, 3.0, 4.0, 10.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-182.625, -175.294921875, -167.96484375, -160.634765625, -153.3046875, -145.974609375, -138.64453125, -131.314453125, -123.984375, -116.654296875, -109.32421875, -101.994140625, -94.6640625, -87.333984375, -80.00390625, -72.673828125, -65.34375, -58.013671875, -50.68359375, -43.353515625, -36.0234375, -28.693359375, -21.36328125, -14.033203125, -6.703125, 0.626953125, 7.95703125, 15.287109375, 22.6171875, 29.947265625, 37.27734375, 44.607421875, 51.9375, 59.267578125, 66.59765625, 73.927734375, 81.2578125, 88.587890625, 95.91796875, 103.248046875, 110.578125, 117.908203125, 125.23828125, 132.568359375, 139.8984375, 147.228515625, 154.55859375, 161.888671875, 169.21875, 176.548828125, 183.87890625, 191.208984375, 198.5390625, 205.869140625, 213.19921875, 220.529296875, 227.859375, 235.189453125, 242.51953125, 249.849609375, 257.1796875, 264.509765625, 271.83984375, 279.169921875, 286.5]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 6.0, 6.0, 5.0, 8.0, 10.0, 9.0, 9.0, 15.0, 19.0, 24.0, 32.0, 42.0, 37.0, 49.0, 32.0, 40.0, 45.0, 41.0, 56.0, 56.0, 50.0, 65.0, 35.0, 48.0, 53.0, 26.0, 38.0, 21.0, 17.0, 13.0, 12.0, 16.0, 10.0, 15.0, 7.0, 15.0, 2.0, 2.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.375, -56.4384765625, -54.501953125, -52.5654296875, -50.62890625, -48.6923828125, -46.755859375, -44.8193359375, -42.8828125, -40.9462890625, -39.009765625, -37.0732421875, -35.13671875, -33.2001953125, -31.263671875, -29.3271484375, -27.390625, -25.4541015625, -23.517578125, -21.5810546875, -19.64453125, -17.7080078125, -15.771484375, -13.8349609375, -11.8984375, -9.9619140625, -8.025390625, -6.0888671875, -4.15234375, -2.2158203125, -0.279296875, 1.6572265625, 3.59375, 5.5302734375, 7.466796875, 9.4033203125, 11.33984375, 13.2763671875, 15.212890625, 17.1494140625, 19.0859375, 21.0224609375, 22.958984375, 24.8955078125, 26.83203125, 28.7685546875, 30.705078125, 32.6416015625, 34.578125, 36.5146484375, 38.451171875, 40.3876953125, 42.32421875, 44.2607421875, 46.197265625, 48.1337890625, 50.0703125, 52.0068359375, 53.943359375, 55.8798828125, 57.81640625, 59.7529296875, 61.689453125, 63.6259765625, 65.5625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 12.0, 11.0, 23.0, 23.0, 55.0, 83.0, 184.0, 468.0, 2894.0, 64541.0, 4115822.0, 8744.0, 970.0, 216.0, 88.0, 59.0, 34.0, 28.0, 10.0, 11.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-869.5, -844.828125, -820.15625, -795.484375, -770.8125, -746.140625, -721.46875, -696.796875, -672.125, -647.453125, -622.78125, -598.109375, -573.4375, -548.765625, -524.09375, -499.421875, -474.75, -450.078125, -425.40625, -400.734375, -376.0625, -351.390625, -326.71875, -302.046875, -277.375, -252.703125, -228.03125, -203.359375, -178.6875, -154.015625, -129.34375, -104.671875, -80.0, -55.328125, -30.65625, -5.984375, 18.6875, 43.359375, 68.03125, 92.703125, 117.375, 142.046875, 166.71875, 191.390625, 216.0625, 240.734375, 265.40625, 290.078125, 314.75, 339.421875, 364.09375, 388.765625, 413.4375, 438.109375, 462.78125, 487.453125, 512.125, 536.796875, 561.46875, 586.140625, 610.8125, 635.484375, 660.15625, 684.828125, 709.5]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 8.0, 5.0, 15.0, 22.0, 48.0, 119.0, 587.0, 2089.0, 840.0, 200.0, 52.0, 29.0, 15.0, 16.0, 7.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-516.0, -504.935546875, -493.87109375, -482.806640625, -471.7421875, -460.677734375, -449.61328125, -438.548828125, -427.484375, -416.419921875, -405.35546875, -394.291015625, -383.2265625, -372.162109375, -361.09765625, -350.033203125, -338.96875, -327.904296875, -316.83984375, -305.775390625, -294.7109375, -283.646484375, -272.58203125, -261.517578125, -250.453125, -239.388671875, -228.32421875, -217.259765625, -206.1953125, -195.130859375, -184.06640625, -173.001953125, -161.9375, -150.873046875, -139.80859375, -128.744140625, -117.6796875, -106.615234375, -95.55078125, -84.486328125, -73.421875, -62.357421875, -51.29296875, -40.228515625, -29.1640625, -18.099609375, -7.03515625, 4.029296875, 15.09375, 26.158203125, 37.22265625, 48.287109375, 59.3515625, 70.416015625, 81.48046875, 92.544921875, 103.609375, 114.673828125, 125.73828125, 136.802734375, 147.8671875, 158.931640625, 169.99609375, 181.060546875, 192.125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 12.0, 16.0, 32.0, 100.0, 240.0, 381.0, 155.0, 41.0, 9.0, 11.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5116.96142578125, -5004.3525390625, -4891.744140625, -4779.13525390625, -4666.5263671875, -4553.91748046875, -4441.30908203125, -4328.7001953125, -4216.09130859375, -4103.482421875, -3990.873779296875, -3878.26513671875, -3765.65625, -3653.047607421875, -3540.43896484375, -3427.830078125, -3315.221435546875, -3202.61279296875, -3090.00390625, -2977.395263671875, -2864.786376953125, -2752.177734375, -2639.56884765625, -2526.960205078125, -2414.3515625, -2301.742919921875, -2189.134033203125, -2076.525390625, -1963.91650390625, -1851.307861328125, -1738.6990966796875, -1626.09033203125, -1513.481201171875, -1400.8724365234375, -1288.263671875, -1175.655029296875, -1063.046142578125, -950.4374389648438, -837.8287353515625, -725.219970703125, -612.6112060546875, -500.00244140625, -387.3937072753906, -274.78497314453125, -162.17620849609375, -49.56744384765625, 63.041259765625, 175.6500244140625, 288.2587890625, 400.8675537109375, 513.476318359375, 626.0850219726562, 738.6937866210938, 851.3025512695312, 963.9112548828125, 1076.52001953125, 1189.1287841796875, 1301.737548828125, 1414.3463134765625, 1526.955078125, 1639.563720703125, 1752.172607421875, 1864.78125, 1977.3900146484375, 2089.998779296875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 9.0, 17.0, 17.0, 18.0, 23.0, 27.0, 31.0, 33.0, 42.0, 45.0, 44.0, 56.0, 63.0, 49.0, 56.0, 63.0, 46.0, 40.0, 41.0, 39.0, 41.0, 28.0, 32.0, 19.0, 30.0, 17.0, 13.0, 10.0, 11.0, 8.0, 3.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-882.3338623046875, -852.0466918945312, -821.7595825195312, -791.472412109375, -761.185302734375, -730.8981323242188, -700.6109619140625, -670.3238525390625, -640.0367431640625, -609.7495727539062, -579.4624633789062, -549.17529296875, -518.88818359375, -488.60101318359375, -458.3138732910156, -428.0267333984375, -397.73956298828125, -367.4524230957031, -337.165283203125, -306.87811279296875, -276.59100341796875, -246.30384826660156, -216.01669311523438, -185.72955322265625, -155.44241333007812, -125.1552734375, -94.86812591552734, -64.58097839355469, -34.29383850097656, -4.0066986083984375, 26.28045654296875, 56.567596435546875, 86.854736328125, 117.14187622070312, 147.42901611328125, 177.71617126464844, 208.00331115722656, 238.2904510498047, 268.5776062011719, 298.86474609375, 329.1518859863281, 359.43902587890625, 389.7261657714844, 420.0133056640625, 450.30047607421875, 480.58758544921875, 510.874755859375, 541.161865234375, 571.4490356445312, 601.7362060546875, 632.0233154296875, 662.3104858398438, 692.5975952148438, 722.884765625, 753.171875, 783.4590454101562, 813.7462158203125, 844.0333862304688, 874.3204956054688, 904.607666015625, 934.894775390625, 965.1819458007812, 995.4691162109375, 1025.7562255859375, 1056.0433349609375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 6.0, 17.0, 27.0, 44.0, 39.0, 82.0, 132.0, 179.0, 304.0, 489.0, 911.0, 1417.0, 2708.0, 5255.0, 10956.0, 25346.0, 69658.0, 246843.0, 464908.0, 140031.0, 44652.0, 17583.0, 7918.0, 4038.0, 2136.0, 1144.0, 661.0, 373.0, 202.0, 155.0, 110.0, 69.0, 53.0, 32.0, 22.0, 15.0, 10.0, 5.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-114.4375, -110.8935546875, -107.349609375, -103.8056640625, -100.26171875, -96.7177734375, -93.173828125, -89.6298828125, -86.0859375, -82.5419921875, -78.998046875, -75.4541015625, -71.91015625, -68.3662109375, -64.822265625, -61.2783203125, -57.734375, -54.1904296875, -50.646484375, -47.1025390625, -43.55859375, -40.0146484375, -36.470703125, -32.9267578125, -29.3828125, -25.8388671875, -22.294921875, -18.7509765625, -15.20703125, -11.6630859375, -8.119140625, -4.5751953125, -1.03125, 2.5126953125, 6.056640625, 9.6005859375, 13.14453125, 16.6884765625, 20.232421875, 23.7763671875, 27.3203125, 30.8642578125, 34.408203125, 37.9521484375, 41.49609375, 45.0400390625, 48.583984375, 52.1279296875, 55.671875, 59.2158203125, 62.759765625, 66.3037109375, 69.84765625, 73.3916015625, 76.935546875, 80.4794921875, 84.0234375, 87.5673828125, 91.111328125, 94.6552734375, 98.19921875, 101.7431640625, 105.287109375, 108.8310546875, 112.375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 8.0, 5.0, 10.0, 8.0, 10.0, 11.0, 16.0, 21.0, 22.0, 37.0, 28.0, 34.0, 41.0, 54.0, 58.0, 44.0, 58.0, 53.0, 59.0, 66.0, 53.0, 44.0, 51.0, 28.0, 38.0, 24.0, 25.0, 15.0, 11.0, 8.0, 11.0, 12.0, 7.0, 7.0, 5.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-90.0625, -87.583984375, -85.10546875, -82.626953125, -80.1484375, -77.669921875, -75.19140625, -72.712890625, -70.234375, -67.755859375, -65.27734375, -62.798828125, -60.3203125, -57.841796875, -55.36328125, -52.884765625, -50.40625, -47.927734375, -45.44921875, -42.970703125, -40.4921875, -38.013671875, -35.53515625, -33.056640625, -30.578125, -28.099609375, -25.62109375, -23.142578125, -20.6640625, -18.185546875, -15.70703125, -13.228515625, -10.75, -8.271484375, -5.79296875, -3.314453125, -0.8359375, 1.642578125, 4.12109375, 6.599609375, 9.078125, 11.556640625, 14.03515625, 16.513671875, 18.9921875, 21.470703125, 23.94921875, 26.427734375, 28.90625, 31.384765625, 33.86328125, 36.341796875, 38.8203125, 41.298828125, 43.77734375, 46.255859375, 48.734375, 51.212890625, 53.69140625, 56.169921875, 58.6484375, 61.126953125, 63.60546875, 66.083984375, 68.5625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 5.0, 2.0, 6.0, 11.0, 6.0, 14.0, 23.0, 21.0, 31.0, 36.0, 55.0, 73.0, 132.0, 242.0, 484.0, 1211.0, 3980.0, 20772.0, 389626.0, 603566.0, 21705.0, 4122.0, 1271.0, 495.0, 250.0, 134.0, 78.0, 65.0, 36.0, 24.0, 20.0, 12.0, 7.0, 10.0, 13.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-336.5, -325.98828125, -315.4765625, -304.96484375, -294.453125, -283.94140625, -273.4296875, -262.91796875, -252.40625, -241.89453125, -231.3828125, -220.87109375, -210.359375, -199.84765625, -189.3359375, -178.82421875, -168.3125, -157.80078125, -147.2890625, -136.77734375, -126.265625, -115.75390625, -105.2421875, -94.73046875, -84.21875, -73.70703125, -63.1953125, -52.68359375, -42.171875, -31.66015625, -21.1484375, -10.63671875, -0.125, 10.38671875, 20.8984375, 31.41015625, 41.921875, 52.43359375, 62.9453125, 73.45703125, 83.96875, 94.48046875, 104.9921875, 115.50390625, 126.015625, 136.52734375, 147.0390625, 157.55078125, 168.0625, 178.57421875, 189.0859375, 199.59765625, 210.109375, 220.62109375, 231.1328125, 241.64453125, 252.15625, 262.66796875, 273.1796875, 283.69140625, 294.203125, 304.71484375, 315.2265625, 325.73828125, 336.25]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 5.0, 5.0, 4.0, 6.0, 7.0, 14.0, 12.0, 10.0, 20.0, 16.0, 23.0, 33.0, 30.0, 37.0, 37.0, 35.0, 46.0, 72.0, 71.0, 58.0, 62.0, 62.0, 52.0, 40.0, 47.0, 29.0, 25.0, 22.0, 13.0, 24.0, 14.0, 14.0, 13.0, 11.0, 6.0, 6.0, 6.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-308.0, -297.73046875, -287.4609375, -277.19140625, -266.921875, -256.65234375, -246.3828125, -236.11328125, -225.84375, -215.57421875, -205.3046875, -195.03515625, -184.765625, -174.49609375, -164.2265625, -153.95703125, -143.6875, -133.41796875, -123.1484375, -112.87890625, -102.609375, -92.33984375, -82.0703125, -71.80078125, -61.53125, -51.26171875, -40.9921875, -30.72265625, -20.453125, -10.18359375, 0.0859375, 10.35546875, 20.625, 30.89453125, 41.1640625, 51.43359375, 61.703125, 71.97265625, 82.2421875, 92.51171875, 102.78125, 113.05078125, 123.3203125, 133.58984375, 143.859375, 154.12890625, 164.3984375, 174.66796875, 184.9375, 195.20703125, 205.4765625, 215.74609375, 226.015625, 236.28515625, 246.5546875, 256.82421875, 267.09375, 277.36328125, 287.6328125, 297.90234375, 308.171875, 318.44140625, 328.7109375, 338.98046875, 349.25]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 7.0, 6.0, 8.0, 14.0, 16.0, 33.0, 87.0, 164.0, 345.0, 925.0, 2863.0, 13063.0, 178240.0, 823304.0, 23095.0, 4235.0, 1300.0, 455.0, 187.0, 93.0, 39.0, 26.0, 15.0, 11.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-130.125, -125.80859375, -121.4921875, -117.17578125, -112.859375, -108.54296875, -104.2265625, -99.91015625, -95.59375, -91.27734375, -86.9609375, -82.64453125, -78.328125, -74.01171875, -69.6953125, -65.37890625, -61.0625, -56.74609375, -52.4296875, -48.11328125, -43.796875, -39.48046875, -35.1640625, -30.84765625, -26.53125, -22.21484375, -17.8984375, -13.58203125, -9.265625, -4.94921875, -0.6328125, 3.68359375, 8.0, 12.31640625, 16.6328125, 20.94921875, 25.265625, 29.58203125, 33.8984375, 38.21484375, 42.53125, 46.84765625, 51.1640625, 55.48046875, 59.796875, 64.11328125, 68.4296875, 72.74609375, 77.0625, 81.37890625, 85.6953125, 90.01171875, 94.328125, 98.64453125, 102.9609375, 107.27734375, 111.59375, 115.91015625, 120.2265625, 124.54296875, 128.859375, 133.17578125, 137.4921875, 141.80859375, 146.125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 7.0, 7.0, 20.0, 31.0, 58.0, 162.0, 355.0, 158.0, 75.0, 35.0, 23.0, 6.0, 4.0, 5.0, 8.0, 6.0, 3.0, 6.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0389404296875, -0.03747272491455078, -0.03600502014160156, -0.034537315368652344, -0.033069610595703125, -0.031601905822753906, -0.030134201049804688, -0.02866649627685547, -0.02719879150390625, -0.02573108673095703, -0.024263381958007812, -0.022795677185058594, -0.021327972412109375, -0.019860267639160156, -0.018392562866210938, -0.01692485809326172, -0.0154571533203125, -0.013989448547363281, -0.012521743774414062, -0.011054039001464844, -0.009586334228515625, -0.008118629455566406, -0.0066509246826171875, -0.005183219909667969, -0.00371551513671875, -0.0022478103637695312, -0.0007801055908203125, 0.0006875991821289062, 0.002155303955078125, 0.0036230087280273438, 0.0050907135009765625, 0.006558418273925781, 0.008026123046875, 0.009493827819824219, 0.010961532592773438, 0.012429237365722656, 0.013896942138671875, 0.015364646911621094, 0.016832351684570312, 0.01830005645751953, 0.01976776123046875, 0.02123546600341797, 0.022703170776367188, 0.024170875549316406, 0.025638580322265625, 0.027106285095214844, 0.028573989868164062, 0.03004169464111328, 0.0315093994140625, 0.03297710418701172, 0.03444480895996094, 0.035912513732910156, 0.037380218505859375, 0.038847923278808594, 0.04031562805175781, 0.04178333282470703, 0.04325103759765625, 0.04471874237060547, 0.04618644714355469, 0.047654151916503906, 0.049121856689453125, 0.050589561462402344, 0.05205726623535156, 0.05352497100830078, 0.05499267578125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 12.0, 10.0, 18.0, 22.0, 31.0, 57.0, 85.0, 174.0, 346.0, 821.0, 2596.0, 12511.0, 139825.0, 848771.0, 35556.0, 5222.0, 1432.0, 533.0, 231.0, 113.0, 71.0, 36.0, 19.0, 16.0, 14.0, 10.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.1875, -114.2802734375, -110.373046875, -106.4658203125, -102.55859375, -98.6513671875, -94.744140625, -90.8369140625, -86.9296875, -83.0224609375, -79.115234375, -75.2080078125, -71.30078125, -67.3935546875, -63.486328125, -59.5791015625, -55.671875, -51.7646484375, -47.857421875, -43.9501953125, -40.04296875, -36.1357421875, -32.228515625, -28.3212890625, -24.4140625, -20.5068359375, -16.599609375, -12.6923828125, -8.78515625, -4.8779296875, -0.970703125, 2.9365234375, 6.84375, 10.7509765625, 14.658203125, 18.5654296875, 22.47265625, 26.3798828125, 30.287109375, 34.1943359375, 38.1015625, 42.0087890625, 45.916015625, 49.8232421875, 53.73046875, 57.6376953125, 61.544921875, 65.4521484375, 69.359375, 73.2666015625, 77.173828125, 81.0810546875, 84.98828125, 88.8955078125, 92.802734375, 96.7099609375, 100.6171875, 104.5244140625, 108.431640625, 112.3388671875, 116.24609375, 120.1533203125, 124.060546875, 127.9677734375, 131.875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 10.0, 16.0, 23.0, 19.0, 33.0, 49.0, 58.0, 102.0, 164.0, 159.0, 101.0, 75.0, 49.0, 33.0, 26.0, 13.0, 17.0, 7.0, 9.0, 3.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.6875, -84.439453125, -81.19140625, -77.943359375, -74.6953125, -71.447265625, -68.19921875, -64.951171875, -61.703125, -58.455078125, -55.20703125, -51.958984375, -48.7109375, -45.462890625, -42.21484375, -38.966796875, -35.71875, -32.470703125, -29.22265625, -25.974609375, -22.7265625, -19.478515625, -16.23046875, -12.982421875, -9.734375, -6.486328125, -3.23828125, 0.009765625, 3.2578125, 6.505859375, 9.75390625, 13.001953125, 16.25, 19.498046875, 22.74609375, 25.994140625, 29.2421875, 32.490234375, 35.73828125, 38.986328125, 42.234375, 45.482421875, 48.73046875, 51.978515625, 55.2265625, 58.474609375, 61.72265625, 64.970703125, 68.21875, 71.466796875, 74.71484375, 77.962890625, 81.2109375, 84.458984375, 87.70703125, 90.955078125, 94.203125, 97.451171875, 100.69921875, 103.947265625, 107.1953125, 110.443359375, 113.69140625, 116.939453125, 120.1875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 4.0, 14.0, 47.0, 288.0, 495.0, 111.0, 36.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5085.96435546875, -4927.49853515625, -4769.03271484375, -4610.56689453125, -4452.10107421875, -4293.63525390625, -4135.16943359375, -3976.70361328125, -3818.23779296875, -3659.77197265625, -3501.30615234375, -3342.84033203125, -3184.37451171875, -3025.90869140625, -2867.44287109375, -2708.97705078125, -2550.510986328125, -2392.045166015625, -2233.579345703125, -2075.113525390625, -1916.647705078125, -1758.181884765625, -1599.7159423828125, -1441.2501220703125, -1282.7843017578125, -1124.3184814453125, -965.8526611328125, -807.3867797851562, -648.9209594726562, -490.45513916015625, -331.9892578125, -173.5234375, -15.0576171875, 143.40821838378906, 301.8740539550781, 460.33990478515625, 618.8057250976562, 777.2715454101562, 935.7374267578125, 1094.2032470703125, 1252.6690673828125, 1411.1348876953125, 1569.6007080078125, 1728.066650390625, 1886.532470703125, 2044.998291015625, 2203.464111328125, 2361.929931640625, 2520.395751953125, 2678.861572265625, 2837.327392578125, 2995.793212890625, 3154.259033203125, 3312.724853515625, 3471.19091796875, 3629.65673828125, 3788.12255859375, 3946.58837890625, 4105.05419921875, 4263.52001953125, 4421.98583984375, 4580.45166015625, 4738.91748046875, 4897.38330078125, 5055.84912109375]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 6.0, 6.0, 8.0, 10.0, 11.0, 11.0, 14.0, 12.0, 10.0, 17.0, 28.0, 32.0, 20.0, 33.0, 32.0, 33.0, 46.0, 97.0, 158.0, 108.0, 44.0, 33.0, 29.0, 37.0, 19.0, 23.0, 22.0, 10.0, 12.0, 16.0, 15.0, 6.0, 14.0, 4.0, 6.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1466.438720703125, -1422.586181640625, -1378.7337646484375, -1334.8812255859375, -1291.02880859375, -1247.17626953125, -1203.3238525390625, -1159.4713134765625, -1115.618896484375, -1071.766357421875, -1027.9139404296875, -984.0614624023438, -940.208984375, -896.3565063476562, -852.5040283203125, -808.6514892578125, -764.7990112304688, -720.946533203125, -677.0940551757812, -633.2415771484375, -589.3890991210938, -545.53662109375, -501.6841125488281, -457.8316345214844, -413.9791564941406, -370.1266784667969, -326.2742004394531, -282.42169189453125, -238.56922912597656, -194.7167510986328, -150.8642578125, -107.01177978515625, -63.1593017578125, -19.306819915771484, 24.54566192626953, 68.39814758300781, 112.25062561035156, 156.1031036376953, 199.95559692382812, 243.80807495117188, 287.6605529785156, 331.5130310058594, 375.3655090332031, 419.218017578125, 463.07049560546875, 506.9229736328125, 550.7754516601562, 594.6279296875, 638.4804077148438, 682.3328857421875, 726.1853637695312, 770.037841796875, 813.8903198242188, 857.7427978515625, 901.5953369140625, 945.44775390625, 989.30029296875, 1033.15283203125, 1077.0052490234375, 1120.8577880859375, 1164.710205078125, 1208.562744140625, 1252.4151611328125, 1296.2677001953125, 1340.1201171875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 7.0, 5.0, 7.0, 8.0, 11.0, 28.0, 40.0, 44.0, 86.0, 162.0, 175.0, 338.0, 546.0, 1040.0, 1861.0, 3656.0, 8443.0, 24108.0, 141294.0, 2369234.0, 1504594.0, 104159.0, 20241.0, 7294.0, 3208.0, 1516.0, 853.0, 487.0, 329.0, 161.0, 105.0, 66.0, 40.0, 43.0, 24.0, 20.0, 21.0, 7.0, 6.0, 10.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-197.125, -190.75, -184.375, -178.0, -171.625, -165.25, -158.875, -152.5, -146.125, -139.75, -133.375, -127.0, -120.625, -114.25, -107.875, -101.5, -95.125, -88.75, -82.375, -76.0, -69.625, -63.25, -56.875, -50.5, -44.125, -37.75, -31.375, -25.0, -18.625, -12.25, -5.875, 0.5, 6.875, 13.25, 19.625, 26.0, 32.375, 38.75, 45.125, 51.5, 57.875, 64.25, 70.625, 77.0, 83.375, 89.75, 96.125, 102.5, 108.875, 115.25, 121.625, 128.0, 134.375, 140.75, 147.125, 153.5, 159.875, 166.25, 172.625, 179.0, 185.375, 191.75, 198.125, 204.5, 210.875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 0.0, 4.0, 5.0, 3.0, 5.0, 9.0, 13.0, 10.0, 9.0, 23.0, 22.0, 29.0, 35.0, 32.0, 45.0, 43.0, 53.0, 44.0, 54.0, 72.0, 48.0, 49.0, 59.0, 49.0, 45.0, 34.0, 39.0, 24.0, 29.0, 20.0, 20.0, 21.0, 12.0, 13.0, 12.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-79.125, -76.7275390625, -74.330078125, -71.9326171875, -69.53515625, -67.1376953125, -64.740234375, -62.3427734375, -59.9453125, -57.5478515625, -55.150390625, -52.7529296875, -50.35546875, -47.9580078125, -45.560546875, -43.1630859375, -40.765625, -38.3681640625, -35.970703125, -33.5732421875, -31.17578125, -28.7783203125, -26.380859375, -23.9833984375, -21.5859375, -19.1884765625, -16.791015625, -14.3935546875, -11.99609375, -9.5986328125, -7.201171875, -4.8037109375, -2.40625, -0.0087890625, 2.388671875, 4.7861328125, 7.18359375, 9.5810546875, 11.978515625, 14.3759765625, 16.7734375, 19.1708984375, 21.568359375, 23.9658203125, 26.36328125, 28.7607421875, 31.158203125, 33.5556640625, 35.953125, 38.3505859375, 40.748046875, 43.1455078125, 45.54296875, 47.9404296875, 50.337890625, 52.7353515625, 55.1328125, 57.5302734375, 59.927734375, 62.3251953125, 64.72265625, 67.1201171875, 69.517578125, 71.9150390625, 74.3125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 16.0, 18.0, 27.0, 55.0, 163.0, 408.0, 1756.0, 269248.0, 3919076.0, 2679.0, 500.0, 196.0, 72.0, 32.0, 21.0, 8.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1460.0, -1404.0, -1348.0, -1292.0, -1236.0, -1180.0, -1124.0, -1068.0, -1012.0, -956.0, -900.0, -844.0, -788.0, -732.0, -676.0, -620.0, -564.0, -508.0, -452.0, -396.0, -340.0, -284.0, -228.0, -172.0, -116.0, -60.0, -4.0, 52.0, 108.0, 164.0, 220.0, 276.0, 332.0, 388.0, 444.0, 500.0, 556.0, 612.0, 668.0, 724.0, 780.0, 836.0, 892.0, 948.0, 1004.0, 1060.0, 1116.0, 1172.0, 1228.0, 1284.0, 1340.0, 1396.0, 1452.0, 1508.0, 1564.0, 1620.0, 1676.0, 1732.0, 1788.0, 1844.0, 1900.0, 1956.0, 2012.0, 2068.0, 2124.0]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 8.0, 15.0, 32.0, 63.0, 178.0, 616.0, 2125.0, 694.0, 189.0, 77.0, 46.0, 14.0, 9.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-293.5, -270.1484375, -246.796875, -223.4453125, -200.09375, -176.7421875, -153.390625, -130.0390625, -106.6875, -83.3359375, -59.984375, -36.6328125, -13.28125, 10.0703125, 33.421875, 56.7734375, 80.125, 103.4765625, 126.828125, 150.1796875, 173.53125, 196.8828125, 220.234375, 243.5859375, 266.9375, 290.2890625, 313.640625, 336.9921875, 360.34375, 383.6953125, 407.046875, 430.3984375, 453.75, 477.1015625, 500.453125, 523.8046875, 547.15625, 570.5078125, 593.859375, 617.2109375, 640.5625, 663.9140625, 687.265625, 710.6171875, 733.96875, 757.3203125, 780.671875, 804.0234375, 827.375, 850.7265625, 874.078125, 897.4296875, 920.78125, 944.1328125, 967.484375, 990.8359375, 1014.1875, 1037.5390625, 1060.890625, 1084.2421875, 1107.59375, 1130.9453125, 1154.296875, 1177.6484375, 1201.0]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 9.0, 10.0, 17.0, 35.0, 55.0, 94.0, 181.0, 189.0, 149.0, 94.0, 54.0, 23.0, 31.0, 7.0, 7.0, 7.0, 1.0, 3.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2762.39892578125, -2664.6455078125, -2566.89208984375, -2469.138427734375, -2371.385009765625, -2273.631591796875, -2175.878173828125, -2078.12451171875, -1980.37109375, -1882.61767578125, -1784.8641357421875, -1687.1107177734375, -1589.357177734375, -1491.603759765625, -1393.850341796875, -1296.0968017578125, -1198.3433837890625, -1100.5899658203125, -1002.83642578125, -905.0830078125, -807.3294677734375, -709.5760498046875, -611.8225708007812, -514.069091796875, -416.31561279296875, -318.5621337890625, -220.8086700439453, -123.05520629882812, -25.301727294921875, 72.45175170898438, 170.2052001953125, 267.95867919921875, 365.712158203125, 463.46563720703125, 561.2191162109375, 658.9725341796875, 756.72607421875, 854.4794921875, 952.2329711914062, 1049.9864501953125, 1147.739990234375, 1245.493408203125, 1343.2469482421875, 1441.0003662109375, 1538.75390625, 1636.50732421875, 1734.2607421875, 1832.0142822265625, 1929.7677001953125, 2027.5211181640625, 2125.274658203125, 2223.028076171875, 2320.781494140625, 2418.53515625, 2516.28857421875, 2614.0419921875, 2711.79541015625, 2809.548828125, 2907.30224609375, 3005.055908203125, 3102.809326171875, 3200.562744140625, 3298.316162109375, 3396.06982421875, 3493.8232421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 6.0, 3.0, 3.0, 3.0, 6.0, 9.0, 9.0, 18.0, 20.0, 27.0, 37.0, 48.0, 45.0, 52.0, 63.0, 77.0, 90.0, 87.0, 86.0, 51.0, 63.0, 53.0, 39.0, 26.0, 27.0, 21.0, 10.0, 13.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-2712.68212890625, -2650.98193359375, -2589.28173828125, -2527.58154296875, -2465.88134765625, -2404.18115234375, -2342.48095703125, -2280.78076171875, -2219.08056640625, -2157.38037109375, -2095.68017578125, -2033.97998046875, -1972.27978515625, -1910.57958984375, -1848.87939453125, -1787.17919921875, -1725.4788818359375, -1663.7786865234375, -1602.0784912109375, -1540.3782958984375, -1478.6781005859375, -1416.9779052734375, -1355.277587890625, -1293.577392578125, -1231.877197265625, -1170.177001953125, -1108.476806640625, -1046.776611328125, -985.076416015625, -923.376220703125, -861.6759643554688, -799.9757690429688, -738.2755126953125, -676.5753173828125, -614.8751220703125, -553.1749267578125, -491.4747009277344, -429.7745056152344, -368.07427978515625, -306.37408447265625, -244.67388916015625, -182.97369384765625, -121.27348327636719, -59.573272705078125, 2.126922607421875, 63.827117919921875, 125.52734375, 187.2275390625, 248.927734375, 310.6279296875, 372.328125, 434.0283508300781, 495.7285461425781, 557.4287109375, 619.1289672851562, 680.8291625976562, 742.5293579101562, 804.2295532226562, 865.9297485351562, 927.6300048828125, 989.3302001953125, 1051.0303955078125, 1112.7305908203125, 1174.4307861328125, 1236.1309814453125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 12.0, 15.0, 20.0, 30.0, 61.0, 75.0, 135.0, 218.0, 357.0, 601.0, 1108.0, 2349.0, 5156.0, 12746.0, 37726.0, 164055.0, 635657.0, 134812.0, 32657.0, 11283.0, 4711.0, 2259.0, 1052.0, 572.0, 346.0, 183.0, 118.0, 88.0, 46.0, 30.0, 26.0, 14.0, 11.0, 7.0, 1.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.125, -163.380859375, -157.63671875, -151.892578125, -146.1484375, -140.404296875, -134.66015625, -128.916015625, -123.171875, -117.427734375, -111.68359375, -105.939453125, -100.1953125, -94.451171875, -88.70703125, -82.962890625, -77.21875, -71.474609375, -65.73046875, -59.986328125, -54.2421875, -48.498046875, -42.75390625, -37.009765625, -31.265625, -25.521484375, -19.77734375, -14.033203125, -8.2890625, -2.544921875, 3.19921875, 8.943359375, 14.6875, 20.431640625, 26.17578125, 31.919921875, 37.6640625, 43.408203125, 49.15234375, 54.896484375, 60.640625, 66.384765625, 72.12890625, 77.873046875, 83.6171875, 89.361328125, 95.10546875, 100.849609375, 106.59375, 112.337890625, 118.08203125, 123.826171875, 129.5703125, 135.314453125, 141.05859375, 146.802734375, 152.546875, 158.291015625, 164.03515625, 169.779296875, 175.5234375, 181.267578125, 187.01171875, 192.755859375, 198.5]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 4.0, 6.0, 11.0, 5.0, 8.0, 15.0, 16.0, 23.0, 27.0, 33.0, 37.0, 52.0, 67.0, 63.0, 77.0, 66.0, 72.0, 68.0, 57.0, 59.0, 36.0, 45.0, 32.0, 29.0, 32.0, 12.0, 9.0, 9.0, 9.0, 11.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.6875, -115.6728515625, -111.658203125, -107.6435546875, -103.62890625, -99.6142578125, -95.599609375, -91.5849609375, -87.5703125, -83.5556640625, -79.541015625, -75.5263671875, -71.51171875, -67.4970703125, -63.482421875, -59.4677734375, -55.453125, -51.4384765625, -47.423828125, -43.4091796875, -39.39453125, -35.3798828125, -31.365234375, -27.3505859375, -23.3359375, -19.3212890625, -15.306640625, -11.2919921875, -7.27734375, -3.2626953125, 0.751953125, 4.7666015625, 8.78125, 12.7958984375, 16.810546875, 20.8251953125, 24.83984375, 28.8544921875, 32.869140625, 36.8837890625, 40.8984375, 44.9130859375, 48.927734375, 52.9423828125, 56.95703125, 60.9716796875, 64.986328125, 69.0009765625, 73.015625, 77.0302734375, 81.044921875, 85.0595703125, 89.07421875, 93.0888671875, 97.103515625, 101.1181640625, 105.1328125, 109.1474609375, 113.162109375, 117.1767578125, 121.19140625, 125.2060546875, 129.220703125, 133.2353515625, 137.25]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 7.0, 6.0, 10.0, 11.0, 14.0, 28.0, 35.0, 73.0, 122.0, 221.0, 599.0, 1762.0, 7755.0, 103768.0, 907241.0, 21744.0, 3377.0, 937.0, 372.0, 185.0, 96.0, 61.0, 41.0, 16.0, 16.0, 12.0, 16.0, 5.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-344.25, -332.86328125, -321.4765625, -310.08984375, -298.703125, -287.31640625, -275.9296875, -264.54296875, -253.15625, -241.76953125, -230.3828125, -218.99609375, -207.609375, -196.22265625, -184.8359375, -173.44921875, -162.0625, -150.67578125, -139.2890625, -127.90234375, -116.515625, -105.12890625, -93.7421875, -82.35546875, -70.96875, -59.58203125, -48.1953125, -36.80859375, -25.421875, -14.03515625, -2.6484375, 8.73828125, 20.125, 31.51171875, 42.8984375, 54.28515625, 65.671875, 77.05859375, 88.4453125, 99.83203125, 111.21875, 122.60546875, 133.9921875, 145.37890625, 156.765625, 168.15234375, 179.5390625, 190.92578125, 202.3125, 213.69921875, 225.0859375, 236.47265625, 247.859375, 259.24609375, 270.6328125, 282.01953125, 293.40625, 304.79296875, 316.1796875, 327.56640625, 338.953125, 350.33984375, 361.7265625, 373.11328125, 384.5]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 13.0, 7.0, 18.0, 28.0, 33.0, 45.0, 57.0, 69.0, 95.0, 106.0, 118.0, 85.0, 77.0, 55.0, 35.0, 26.0, 23.0, 24.0, 14.0, 17.0, 10.0, 7.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-562.0, -543.1328125, -524.265625, -505.3984375, -486.53125, -467.6640625, -448.796875, -429.9296875, -411.0625, -392.1953125, -373.328125, -354.4609375, -335.59375, -316.7265625, -297.859375, -278.9921875, -260.125, -241.2578125, -222.390625, -203.5234375, -184.65625, -165.7890625, -146.921875, -128.0546875, -109.1875, -90.3203125, -71.453125, -52.5859375, -33.71875, -14.8515625, 4.015625, 22.8828125, 41.75, 60.6171875, 79.484375, 98.3515625, 117.21875, 136.0859375, 154.953125, 173.8203125, 192.6875, 211.5546875, 230.421875, 249.2890625, 268.15625, 287.0234375, 305.890625, 324.7578125, 343.625, 362.4921875, 381.359375, 400.2265625, 419.09375, 437.9609375, 456.828125, 475.6953125, 494.5625, 513.4296875, 532.296875, 551.1640625, 570.03125, 588.8984375, 607.765625, 626.6328125, 645.5]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 5.0, 0.0, 2.0, 2.0, 3.0, 8.0, 1.0, 8.0, 6.0, 9.0, 5.0, 14.0, 18.0, 24.0, 28.0, 35.0, 42.0, 40.0, 64.0, 88.0, 150.0, 230.0, 376.0, 560.0, 1153.0, 2390.0, 6038.0, 22219.0, 295903.0, 684150.0, 23211.0, 6295.0, 2501.0, 1211.0, 631.0, 380.0, 232.0, 138.0, 92.0, 66.0, 48.0, 29.0, 34.0, 22.0, 26.0, 17.0, 16.0, 10.0, 12.0, 8.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-87.375, -84.728515625, -82.08203125, -79.435546875, -76.7890625, -74.142578125, -71.49609375, -68.849609375, -66.203125, -63.556640625, -60.91015625, -58.263671875, -55.6171875, -52.970703125, -50.32421875, -47.677734375, -45.03125, -42.384765625, -39.73828125, -37.091796875, -34.4453125, -31.798828125, -29.15234375, -26.505859375, -23.859375, -21.212890625, -18.56640625, -15.919921875, -13.2734375, -10.626953125, -7.98046875, -5.333984375, -2.6875, -0.041015625, 2.60546875, 5.251953125, 7.8984375, 10.544921875, 13.19140625, 15.837890625, 18.484375, 21.130859375, 23.77734375, 26.423828125, 29.0703125, 31.716796875, 34.36328125, 37.009765625, 39.65625, 42.302734375, 44.94921875, 47.595703125, 50.2421875, 52.888671875, 55.53515625, 58.181640625, 60.828125, 63.474609375, 66.12109375, 68.767578125, 71.4140625, 74.060546875, 76.70703125, 79.353515625, 82.0]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 6.0, 8.0, 14.0, 24.0, 79.0, 374.0, 332.0, 87.0, 31.0, 14.0, 5.0, 6.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07928466796875, -0.07654857635498047, -0.07381248474121094, -0.0710763931274414, -0.06834030151367188, -0.06560420989990234, -0.06286811828613281, -0.06013202667236328, -0.05739593505859375, -0.05465984344482422, -0.05192375183105469, -0.049187660217285156, -0.046451568603515625, -0.043715476989746094, -0.04097938537597656, -0.03824329376220703, -0.0355072021484375, -0.03277111053466797, -0.030035018920898438, -0.027298927307128906, -0.024562835693359375, -0.021826744079589844, -0.019090652465820312, -0.01635456085205078, -0.01361846923828125, -0.010882377624511719, -0.008146286010742188, -0.005410194396972656, -0.002674102783203125, 6.198883056640625e-05, 0.0027980804443359375, 0.005534172058105469, 0.008270263671875, 0.011006355285644531, 0.013742446899414062, 0.016478538513183594, 0.019214630126953125, 0.021950721740722656, 0.024686813354492188, 0.02742290496826172, 0.03015899658203125, 0.03289508819580078, 0.03563117980957031, 0.038367271423339844, 0.041103363037109375, 0.043839454650878906, 0.04657554626464844, 0.04931163787841797, 0.0520477294921875, 0.05478382110595703, 0.05751991271972656, 0.060256004333496094, 0.06299209594726562, 0.06572818756103516, 0.06846427917480469, 0.07120037078857422, 0.07393646240234375, 0.07667255401611328, 0.07940864562988281, 0.08214473724365234, 0.08488082885742188, 0.0876169204711914, 0.09035301208496094, 0.09308910369873047, 0.0958251953125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 2.0, 7.0, 17.0, 17.0, 46.0, 69.0, 112.0, 168.0, 296.0, 668.0, 1489.0, 4207.0, 17133.0, 784495.0, 219667.0, 13861.0, 3604.0, 1277.0, 618.0, 297.0, 162.0, 115.0, 54.0, 48.0, 37.0, 21.0, 18.0, 9.0, 10.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.4375, -85.154296875, -81.87109375, -78.587890625, -75.3046875, -72.021484375, -68.73828125, -65.455078125, -62.171875, -58.888671875, -55.60546875, -52.322265625, -49.0390625, -45.755859375, -42.47265625, -39.189453125, -35.90625, -32.623046875, -29.33984375, -26.056640625, -22.7734375, -19.490234375, -16.20703125, -12.923828125, -9.640625, -6.357421875, -3.07421875, 0.208984375, 3.4921875, 6.775390625, 10.05859375, 13.341796875, 16.625, 19.908203125, 23.19140625, 26.474609375, 29.7578125, 33.041015625, 36.32421875, 39.607421875, 42.890625, 46.173828125, 49.45703125, 52.740234375, 56.0234375, 59.306640625, 62.58984375, 65.873046875, 69.15625, 72.439453125, 75.72265625, 79.005859375, 82.2890625, 85.572265625, 88.85546875, 92.138671875, 95.421875, 98.705078125, 101.98828125, 105.271484375, 108.5546875, 111.837890625, 115.12109375, 118.404296875, 121.6875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 8.0, 9.0, 11.0, 7.0, 16.0, 20.0, 19.0, 14.0, 33.0, 31.0, 50.0, 79.0, 96.0, 117.0, 126.0, 82.0, 63.0, 56.0, 32.0, 22.0, 19.0, 18.0, 7.0, 15.0, 8.0, 6.0, 5.0, 9.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-64.9375, -62.671875, -60.40625, -58.140625, -55.875, -53.609375, -51.34375, -49.078125, -46.8125, -44.546875, -42.28125, -40.015625, -37.75, -35.484375, -33.21875, -30.953125, -28.6875, -26.421875, -24.15625, -21.890625, -19.625, -17.359375, -15.09375, -12.828125, -10.5625, -8.296875, -6.03125, -3.765625, -1.5, 0.765625, 3.03125, 5.296875, 7.5625, 9.828125, 12.09375, 14.359375, 16.625, 18.890625, 21.15625, 23.421875, 25.6875, 27.953125, 30.21875, 32.484375, 34.75, 37.015625, 39.28125, 41.546875, 43.8125, 46.078125, 48.34375, 50.609375, 52.875, 55.140625, 57.40625, 59.671875, 61.9375, 64.203125, 66.46875, 68.734375, 71.0, 73.265625, 75.53125, 77.796875, 80.0625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 21.0, 47.0, 269.0, 502.0, 91.0, 30.0, 16.0, 11.0, 3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1244.56787109375, -1107.2962646484375, -970.0245361328125, -832.7529296875, -695.4812622070312, -558.2095947265625, -420.93798828125, -283.66632080078125, -146.3946533203125, -9.123001098632812, 128.14865112304688, 265.4202880859375, 402.69195556640625, 539.963623046875, 677.2352294921875, 814.5068969726562, 951.778564453125, 1089.0501708984375, 1226.3218994140625, 1363.593505859375, 1500.865234375, 1638.1368408203125, 1775.408447265625, 1912.68017578125, 2049.95166015625, 2187.223388671875, 2324.494873046875, 2461.7666015625, 2599.038330078125, 2736.31005859375, 2873.58154296875, 3010.853271484375, 3148.125, 3285.396728515625, 3422.668212890625, 3559.93994140625, 3697.211669921875, 3834.4833984375, 3971.7548828125, 4109.0263671875, 4246.29833984375, 4383.56982421875, 4520.841796875, 4658.11328125, 4795.384765625, 4932.65673828125, 5069.92822265625, 5207.19970703125, 5344.4716796875, 5481.7431640625, 5619.01513671875, 5756.28662109375, 5893.55810546875, 6030.830078125, 6168.1015625, 6305.373046875, 6442.64453125, 6579.916015625, 6717.18798828125, 6854.45947265625, 6991.73095703125, 7129.0029296875, 7266.2744140625, 7403.5458984375, 7540.81787109375]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 6.0, 6.0, 8.0, 9.0, 11.0, 15.0, 24.0, 21.0, 29.0, 35.0, 31.0, 37.0, 215.0, 255.0, 58.0, 37.0, 33.0, 26.0, 28.0, 18.0, 17.0, 14.0, 13.0, 13.0, 11.0, 4.0, 4.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1884.7779541015625, -1826.2215576171875, -1767.6651611328125, -1709.1087646484375, -1650.5523681640625, -1591.995849609375, -1533.439453125, -1474.883056640625, -1416.32666015625, -1357.770263671875, -1299.2138671875, -1240.657470703125, -1182.10107421875, -1123.544677734375, -1064.98828125, -1006.4317626953125, -947.8754272460938, -889.3190307617188, -830.7626342773438, -772.2061767578125, -713.6497802734375, -655.0933837890625, -596.5369873046875, -537.9805908203125, -479.4241638183594, -420.8677673339844, -362.31134033203125, -303.75494384765625, -245.1985321044922, -186.64212036132812, -128.08572387695312, -69.529296875, -10.972900390625, 47.5835075378418, 106.1399154663086, 164.69631958007812, 223.2527313232422, 281.80914306640625, 340.36553955078125, 398.9219665527344, 457.4783630371094, 516.0347900390625, 574.5911865234375, 633.1475830078125, 691.7039794921875, 750.2603759765625, 808.8167724609375, 867.3732299804688, 925.9296264648438, 984.4860229492188, 1043.04248046875, 1101.598876953125, 1160.1552734375, 1218.711669921875, 1277.26806640625, 1335.824462890625, 1394.380859375, 1452.937255859375, 1511.49365234375, 1570.050048828125, 1628.6064453125, 1687.162841796875, 1745.71923828125, 1804.2757568359375, 1862.8321533203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 7.0, 5.0, 13.0, 9.0, 12.0, 11.0, 12.0, 13.0, 26.0, 28.0, 34.0, 45.0, 48.0, 131.0, 211.0, 100.0, 51.0, 33.0, 34.0, 25.0, 19.0, 22.0, 15.0, 15.0, 11.0, 11.0, 6.0, 8.0, 7.0, 5.0, 3.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-117.3125, -113.888671875, -110.46484375, -107.041015625, -103.6171875, -100.193359375, -96.76953125, -93.345703125, -89.921875, -86.498046875, -83.07421875, -79.650390625, -76.2265625, -72.802734375, -69.37890625, -65.955078125, -62.53125, -59.107421875, -55.68359375, -52.259765625, -48.8359375, -45.412109375, -41.98828125, -38.564453125, -35.140625, -31.716796875, -28.29296875, -24.869140625, -21.4453125, -18.021484375, -14.59765625, -11.173828125, -7.75, -4.326171875, -0.90234375, 2.521484375, 5.9453125, 9.369140625, 12.79296875, 16.216796875, 19.640625, 23.064453125, 26.48828125, 29.912109375, 33.3359375, 36.759765625, 40.18359375, 43.607421875, 47.03125, 50.455078125, 53.87890625, 57.302734375, 60.7265625, 64.150390625, 67.57421875, 70.998046875, 74.421875, 77.845703125, 81.26953125, 84.693359375, 88.1171875, 91.541015625, 94.96484375, 98.388671875, 101.8125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 6.0, 8.0, 16.0, 18.0, 21.0, 40.0, 69.0, 212.0, 755.0, 5946.0, 8367471.0, 12405.0, 1124.0, 227.0, 122.0, 49.0, 20.0, 16.0, 19.0, 6.0, 2.0, 1.0, 8.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1390.2318115234375, -1335.9791259765625, -1281.726318359375, -1227.4736328125, -1173.220947265625, -1118.96826171875, -1064.715576171875, -1010.4627685546875, -956.2100830078125, -901.9573974609375, -847.7046508789062, -793.451904296875, -739.19921875, -684.946533203125, -630.6937866210938, -576.4410400390625, -522.1883544921875, -467.9356384277344, -413.68292236328125, -359.4302062988281, -305.177490234375, -250.92477416992188, -196.67205810546875, -142.41934204101562, -88.1666259765625, -33.913909912109375, 20.33880615234375, 74.59152221679688, 128.84423828125, 183.09695434570312, 237.34967041015625, 291.6023864746094, 345.855224609375, 400.1079406738281, 454.36065673828125, 508.6133728027344, 562.8660888671875, 617.1187744140625, 671.3715209960938, 725.624267578125, 779.876953125, 834.129638671875, 888.3823852539062, 942.6351318359375, 996.8878173828125, 1051.1405029296875, 1105.393310546875, 1159.64599609375, 1213.898681640625, 1268.1513671875, 1322.404052734375, 1376.6568603515625, 1430.9095458984375, 1485.1622314453125, 1539.4150390625, 1593.667724609375, 1647.92041015625, 1702.173095703125, 1756.42578125, 1810.6785888671875, 1864.9312744140625, 1919.1839599609375, 1973.436767578125, 2027.689453125, 2081.942138671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 4.0, 5.0, 5.0, 1.0, 1.0, 5.0, 4.0, 4.0, 4.0, 4.0, 6.0, 7.0, 4.0, 1.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1213.4683837890625, -1177.4456787109375, -1141.423095703125, -1105.400390625, -1069.377685546875, -1033.35498046875, -997.3323364257812, -961.3096923828125, -925.2869873046875, -889.2642822265625, -853.2416381835938, -817.218994140625, -781.1962890625, -745.173583984375, -709.1509399414062, -673.1282958984375, -637.1055908203125, -601.0828857421875, -565.0602416992188, -529.03759765625, -493.014892578125, -456.9922180175781, -420.96954345703125, -384.9468688964844, -348.9241943359375, -312.9015197753906, -276.87884521484375, -240.85617065429688, -204.83349609375, -168.81082153320312, -132.78814697265625, -96.76547241210938, -60.74267578125, -24.720001220703125, 11.30267333984375, 47.325347900390625, 83.3480224609375, 119.37069702148438, 155.39337158203125, 191.41604614257812, 227.438720703125, 263.4613952636719, 299.48406982421875, 335.5067443847656, 371.5294189453125, 407.5520935058594, 443.57476806640625, 479.5974426269531, 515.6201171875, 551.642822265625, 587.6654663085938, 623.6881103515625, 659.7108154296875, 695.7335205078125, 731.7561645507812, 767.77880859375, 803.801513671875, 839.82421875, 875.8468627929688, 911.8695068359375, 947.8922119140625, 983.9149169921875, 1019.9375610351562, 1055.960205078125, 1091.98291015625]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 10.0, 14.0, 16.0, 32.0, 48.0, 49.0, 79.0, 90.0, 100.0, 94.0, 94.0, 71.0, 92.0, 54.0, 53.0, 32.0, 27.0, 18.0, 14.0, 9.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-102.8125, -100.34814453125, -97.8837890625, -95.41943359375, -92.955078125, -90.49072265625, -88.0263671875, -85.56201171875, -83.09765625, -80.63330078125, -78.1689453125, -75.70458984375, -73.240234375, -70.77587890625, -68.3115234375, -65.84716796875, -63.3828125, -60.91845703125, -58.4541015625, -55.98974609375, -53.525390625, -51.06103515625, -48.5966796875, -46.13232421875, -43.66796875, -41.20361328125, -38.7392578125, -36.27490234375, -33.810546875, -31.34619140625, -28.8818359375, -26.41748046875, -23.953125, -21.48876953125, -19.0244140625, -16.56005859375, -14.095703125, -11.63134765625, -9.1669921875, -6.70263671875, -4.23828125, -1.77392578125, 0.6904296875, 3.15478515625, 5.619140625, 8.08349609375, 10.5478515625, 13.01220703125, 15.4765625, 17.94091796875, 20.4052734375, 22.86962890625, 25.333984375, 27.79833984375, 30.2626953125, 32.72705078125, 35.19140625, 37.65576171875, 40.1201171875, 42.58447265625, 45.048828125, 47.51318359375, 49.9775390625, 52.44189453125, 54.90625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 8.0, 13.0, 11.0, 15.0, 24.0, 31.0, 42.0, 78.0, 105.0, 163.0, 250.0, 459.0, 807.0, 1591.0, 3365.0, 8117.0, 24160.0, 97692.0, 261570.0, 89405.0, 22870.0, 7225.0, 3026.0, 1359.0, 734.0, 415.0, 256.0, 154.0, 118.0, 69.0, 49.0, 32.0, 19.0, 13.0, 8.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-684.0, -656.046875, -628.09375, -600.140625, -572.1875, -544.234375, -516.28125, -488.328125, -460.375, -432.421875, -404.46875, -376.515625, -348.5625, -320.609375, -292.65625, -264.703125, -236.75, -208.796875, -180.84375, -152.890625, -124.9375, -96.984375, -69.03125, -41.078125, -13.125, 14.828125, 42.78125, 70.734375, 98.6875, 126.640625, 154.59375, 182.546875, 210.5, 238.453125, 266.40625, 294.359375, 322.3125, 350.265625, 378.21875, 406.171875, 434.125, 462.078125, 490.03125, 517.984375, 545.9375, 573.890625, 601.84375, 629.796875, 657.75, 685.703125, 713.65625, 741.609375, 769.5625, 797.515625, 825.46875, 853.421875, 881.375, 909.328125, 937.28125, 965.234375, 993.1875, 1021.140625, 1049.09375, 1077.046875, 1105.0]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 2.0, 5.0, 7.0, 7.0, 13.0, 14.0, 16.0, 22.0, 19.0, 25.0, 37.0, 41.0, 45.0, 54.0, 54.0, 72.0, 73.0, 70.0, 54.0, 59.0, 59.0, 49.0, 29.0, 40.0, 29.0, 17.0, 13.0, 22.0, 12.0, 13.0, 3.0, 4.0, 6.0, 9.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.6875, -91.1787109375, -87.669921875, -84.1611328125, -80.65234375, -77.1435546875, -73.634765625, -70.1259765625, -66.6171875, -63.1083984375, -59.599609375, -56.0908203125, -52.58203125, -49.0732421875, -45.564453125, -42.0556640625, -38.546875, -35.0380859375, -31.529296875, -28.0205078125, -24.51171875, -21.0029296875, -17.494140625, -13.9853515625, -10.4765625, -6.9677734375, -3.458984375, 0.0498046875, 3.55859375, 7.0673828125, 10.576171875, 14.0849609375, 17.59375, 21.1025390625, 24.611328125, 28.1201171875, 31.62890625, 35.1376953125, 38.646484375, 42.1552734375, 45.6640625, 49.1728515625, 52.681640625, 56.1904296875, 59.69921875, 63.2080078125, 66.716796875, 70.2255859375, 73.734375, 77.2431640625, 80.751953125, 84.2607421875, 87.76953125, 91.2783203125, 94.787109375, 98.2958984375, 101.8046875, 105.3134765625, 108.822265625, 112.3310546875, 115.83984375, 119.3486328125, 122.857421875, 126.3662109375, 129.875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 24.0, 30.0, 62.0, 79.0, 89.0, 52.0, 37.0, 28.0, 27.0, 10.0, 11.0, 9.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-871.1535034179688, -844.0928344726562, -817.0321655273438, -789.971435546875, -762.9107666015625, -735.85009765625, -708.7894287109375, -681.728759765625, -654.6680908203125, -627.607421875, -600.5467529296875, -573.486083984375, -546.4253540039062, -519.3646850585938, -492.30401611328125, -465.24334716796875, -438.1826171875, -411.1219482421875, -384.0612487792969, -357.0005798339844, -329.93988037109375, -302.87921142578125, -275.81854248046875, -248.7578582763672, -221.69717407226562, -194.63648986816406, -167.5758056640625, -140.51513671875, -113.45445251464844, -86.39376831054688, -59.333099365234375, -32.27241516113281, -5.2117919921875, 21.848888397216797, 48.909568786621094, 75.97024536132812, 103.03092956542969, 130.09161376953125, 157.15228271484375, 184.2129669189453, 211.27365112304688, 238.33433532714844, 265.39501953125, 292.4556884765625, 319.516357421875, 346.5770568847656, 373.6377258300781, 400.69842529296875, 427.75909423828125, 454.81976318359375, 481.8804626464844, 508.9411315917969, 536.0018310546875, 563.0625, 590.1231689453125, 617.183837890625, 644.2445068359375, 671.30517578125, 698.3658447265625, 725.426513671875, 752.4872436523438, 779.5479125976562, 806.6085815429688, 833.6692504882812, 860.72998046875]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 3.0, 7.0, 9.0, 11.0, 20.0, 37.0, 91.0, 82.0, 76.0, 46.0, 23.0, 17.0, 4.0, 9.0, 7.0, 4.0, 4.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-685.730712890625, -663.8141479492188, -641.8975830078125, -619.98095703125, -598.0643920898438, -576.1478271484375, -554.231201171875, -532.3146362304688, -510.3980712890625, -488.48150634765625, -466.5649108886719, -444.6483154296875, -422.73175048828125, -400.815185546875, -378.8985900878906, -356.98199462890625, -335.0654296875, -313.14886474609375, -291.2322692871094, -269.315673828125, -247.39910888671875, -225.48252868652344, -203.56594848632812, -181.6493682861328, -159.7327880859375, -137.8162078857422, -115.89962768554688, -93.98304748535156, -72.06646728515625, -50.14988708496094, -28.233306884765625, -6.3167266845703125, 15.599853515625, 37.51643371582031, 59.433013916015625, 81.34959411621094, 103.26617431640625, 125.18275451660156, 147.09933471679688, 169.0159149169922, 190.9324951171875, 212.8490753173828, 234.76565551757812, 256.6822509765625, 278.59881591796875, 300.515380859375, 322.4319763183594, 344.34857177734375, 366.26513671875, 388.18170166015625, 410.0982971191406, 432.014892578125, 453.93145751953125, 475.8480224609375, 497.7646179199219, 519.6812133789062, 541.5977783203125, 563.5143432617188, 585.430908203125, 607.3475341796875, 629.2640991210938, 651.1806640625, 673.0972900390625, 695.0138549804688, 716.930419921875]}, "eval/loss": 2.1931169033050537, "eval/wer": 0.34303847679492266, "eval/runtime": 642.668, "eval/samples_per_second": 4.111, "eval/steps_per_second": 0.515} \ No newline at end of file +{"train/loss": 1.4285, "train/learning_rate": 2.085070422535211e-05, "train/epoch": 8.41, "train/global_step": 7500, "_runtime": 44888, "_timestamp": 1648186232, "_step": 7504, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 4.0, 8.0, 6.0, 13.0, 10.0, 7.0, 15.0, 12.0, 15.0, 20.0, 20.0, 25.0, 29.0, 32.0, 37.0, 27.0, 45.0, 42.0, 31.0, 35.0, 39.0, 45.0, 35.0, 38.0, 45.0, 31.0, 33.0, 33.0, 28.0, 27.0, 41.0, 34.0, 22.0, 9.0, 16.0, 9.0, 13.0, 12.0, 7.0, 11.0, 10.0, 10.0, 5.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-10.566865921020508, -10.332884788513184, -10.098902702331543, -9.864921569824219, -9.630940437316895, -9.39695930480957, -9.16297721862793, -8.928996086120605, -8.695014953613281, -8.461033821105957, -8.227051734924316, -7.993070602416992, -7.759089469909668, -7.5251078605651855, -7.291126251220703, -7.057145118713379, -6.823163032531738, -6.589181423187256, -6.355200290679932, -6.121218681335449, -5.887237548828125, -5.653255939483643, -5.41927433013916, -5.185293197631836, -4.951312065124512, -4.717330455780029, -4.483349323272705, -4.249367713928223, -4.015386581420898, -3.781404972076416, -3.5474236011505127, -3.3134422302246094, -3.079460620880127, -2.8454792499542236, -2.6114978790283203, -2.377516269683838, -2.1435348987579346, -1.9095535278320312, -1.675572156906128, -1.441590666770935, -1.2076092958450317, -0.9736278653144836, -0.7396464347839355, -0.5056650638580322, -0.27168363332748413, -0.037702202796936035, 0.19627916812896729, 0.43026065826416016, 0.6642420291900635, 0.8982234597206116, 1.1322048902511597, 1.366186261177063, 1.6001677513122559, 1.8341491222381592, 2.0681304931640625, 2.302112102508545, 2.536093235015869, 2.7700746059417725, 3.004055976867676, 3.238037586212158, 3.4720189571380615, 3.706000328063965, 3.939981698989868, 4.1739630699157715, 4.407944679260254]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 11.0, 5.0, 11.0, 9.0, 17.0, 14.0, 30.0, 20.0, 32.0, 19.0, 38.0, 34.0, 47.0, 39.0, 43.0, 48.0, 43.0, 39.0, 59.0, 42.0, 35.0, 45.0, 34.0, 35.0, 30.0, 23.0, 26.0, 22.0, 24.0, 27.0, 29.0, 13.0, 12.0, 7.0, 5.0, 13.0, 12.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.810319900512695, -8.533601760864258, -8.25688362121582, -7.980165481567383, -7.703447341918945, -7.426729202270508, -7.150010585784912, -6.873292446136475, -6.596574306488037, -6.3198561668396, -6.043138027191162, -5.766419887542725, -5.489701271057129, -5.212983131408691, -4.936264991760254, -4.659546852111816, -4.382828712463379, -4.106110572814941, -3.829392433166504, -3.5526740550994873, -3.27595591545105, -2.9992377758026123, -2.7225193977355957, -2.445801258087158, -2.1690831184387207, -1.8923649787902832, -1.6156467199325562, -1.338928461074829, -1.0622103214263916, -0.7854921817779541, -0.508773922920227, -0.2320556640625, 0.044661521911621094, 0.32137972116470337, 0.5980979204177856, 0.8748161196708679, 1.1515343189239502, 1.4282524585723877, 1.7049707174301147, 1.9816889762878418, 2.2584071159362793, 2.535125255584717, 2.8118433952331543, 3.088561773300171, 3.3652799129486084, 3.641998052597046, 3.9187164306640625, 4.1954345703125, 4.4721527099609375, 4.748870849609375, 5.0255889892578125, 5.30230712890625, 5.5790252685546875, 5.855743408203125, 6.132462024688721, 6.409180164337158, 6.685898303985596, 6.962616443634033, 7.239334583282471, 7.516052722930908, 7.792771339416504, 8.069489479064941, 8.346207618713379, 8.622925758361816, 8.899643898010254]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 11.0, 17.0, 23.0, 34.0, 65.0, 79.0, 143.0, 258.0, 404.0, 649.0, 1015.0, 1667.0, 2858.0, 4626.0, 7548.0, 12760.0, 20672.0, 34098.0, 55358.0, 90839.0, 145362.0, 229066.0, 348797.0, 493910.0, 604871.0, 614068.0, 511286.0, 368955.0, 244625.0, 154671.0, 96336.0, 58897.0, 35860.0, 21341.0, 12948.0, 8032.0, 4729.0, 2907.0, 1738.0, 1087.0, 687.0, 393.0, 242.0, 141.0, 73.0, 48.0, 37.0, 23.0, 12.0, 8.0, 7.0, 2.0, 5.0, 1.0, 2.0], "bins": [-9.390625, -9.114990234375, -8.83935546875, -8.563720703125, -8.2880859375, -8.012451171875, -7.73681640625, -7.461181640625, -7.185546875, -6.909912109375, -6.63427734375, -6.358642578125, -6.0830078125, -5.807373046875, -5.53173828125, -5.256103515625, -4.98046875, -4.704833984375, -4.42919921875, -4.153564453125, -3.8779296875, -3.602294921875, -3.32666015625, -3.051025390625, -2.775390625, -2.499755859375, -2.22412109375, -1.948486328125, -1.6728515625, -1.397216796875, -1.12158203125, -0.845947265625, -0.5703125, -0.294677734375, -0.01904296875, 0.256591796875, 0.5322265625, 0.807861328125, 1.08349609375, 1.359130859375, 1.634765625, 1.910400390625, 2.18603515625, 2.461669921875, 2.7373046875, 3.012939453125, 3.28857421875, 3.564208984375, 3.83984375, 4.115478515625, 4.39111328125, 4.666748046875, 4.9423828125, 5.218017578125, 5.49365234375, 5.769287109375, 6.044921875, 6.320556640625, 6.59619140625, 6.871826171875, 7.1474609375, 7.423095703125, 7.69873046875, 7.974365234375, 8.25]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 9.0, 6.0, 10.0, 19.0, 24.0, 27.0, 21.0, 21.0, 31.0, 39.0, 39.0, 48.0, 43.0, 44.0, 43.0, 56.0, 50.0, 47.0, 47.0, 48.0, 45.0, 40.0, 30.0, 31.0, 37.0, 24.0, 21.0, 23.0, 22.0, 11.0, 8.0, 5.0, 8.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.015625, -9.739501953125, -9.46337890625, -9.187255859375, -8.9111328125, -8.635009765625, -8.35888671875, -8.082763671875, -7.806640625, -7.530517578125, -7.25439453125, -6.978271484375, -6.7021484375, -6.426025390625, -6.14990234375, -5.873779296875, -5.59765625, -5.321533203125, -5.04541015625, -4.769287109375, -4.4931640625, -4.217041015625, -3.94091796875, -3.664794921875, -3.388671875, -3.112548828125, -2.83642578125, -2.560302734375, -2.2841796875, -2.008056640625, -1.73193359375, -1.455810546875, -1.1796875, -0.903564453125, -0.62744140625, -0.351318359375, -0.0751953125, 0.200927734375, 0.47705078125, 0.753173828125, 1.029296875, 1.305419921875, 1.58154296875, 1.857666015625, 2.1337890625, 2.409912109375, 2.68603515625, 2.962158203125, 3.23828125, 3.514404296875, 3.79052734375, 4.066650390625, 4.3427734375, 4.618896484375, 4.89501953125, 5.171142578125, 5.447265625, 5.723388671875, 5.99951171875, 6.275634765625, 6.5517578125, 6.827880859375, 7.10400390625, 7.380126953125, 7.65625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 9.0, 2.0, 13.0, 27.0, 39.0, 63.0, 81.0, 166.0, 213.0, 340.0, 532.0, 826.0, 1287.0, 2116.0, 3434.0, 5522.0, 8295.0, 13093.0, 20270.0, 31313.0, 48083.0, 72741.0, 109191.0, 157840.0, 222634.0, 300677.0, 385181.0, 454258.0, 482633.0, 457843.0, 391691.0, 307313.0, 228464.0, 161718.0, 111594.0, 74728.0, 49500.0, 32709.0, 21110.0, 13461.0, 8505.0, 5339.0, 3507.0, 2111.0, 1393.0, 882.0, 553.0, 368.0, 235.0, 156.0, 95.0, 54.0, 32.0, 20.0, 18.0, 7.0, 5.0, 3.0, 1.0, 2.0], "bins": [-6.4140625, -6.2169189453125, -6.019775390625, -5.8226318359375, -5.62548828125, -5.4283447265625, -5.231201171875, -5.0340576171875, -4.8369140625, -4.6397705078125, -4.442626953125, -4.2454833984375, -4.04833984375, -3.8511962890625, -3.654052734375, -3.4569091796875, -3.259765625, -3.0626220703125, -2.865478515625, -2.6683349609375, -2.47119140625, -2.2740478515625, -2.076904296875, -1.8797607421875, -1.6826171875, -1.4854736328125, -1.288330078125, -1.0911865234375, -0.89404296875, -0.6968994140625, -0.499755859375, -0.3026123046875, -0.10546875, 0.0916748046875, 0.288818359375, 0.4859619140625, 0.68310546875, 0.8802490234375, 1.077392578125, 1.2745361328125, 1.4716796875, 1.6688232421875, 1.865966796875, 2.0631103515625, 2.26025390625, 2.4573974609375, 2.654541015625, 2.8516845703125, 3.048828125, 3.2459716796875, 3.443115234375, 3.6402587890625, 3.83740234375, 4.0345458984375, 4.231689453125, 4.4288330078125, 4.6259765625, 4.8231201171875, 5.020263671875, 5.2174072265625, 5.41455078125, 5.6116943359375, 5.808837890625, 6.0059814453125, 6.203125]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 5.0, 7.0, 7.0, 8.0, 9.0, 13.0, 15.0, 14.0, 28.0, 31.0, 40.0, 49.0, 61.0, 57.0, 80.0, 100.0, 125.0, 125.0, 144.0, 157.0, 157.0, 178.0, 178.0, 182.0, 227.0, 214.0, 220.0, 214.0, 211.0, 171.0, 157.0, 141.0, 138.0, 113.0, 70.0, 67.0, 70.0, 57.0, 48.0, 34.0, 24.0, 29.0, 19.0, 14.0, 17.0, 13.0, 8.0, 8.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.716796875, -2.6234130859375, -2.530029296875, -2.4366455078125, -2.34326171875, -2.2498779296875, -2.156494140625, -2.0631103515625, -1.9697265625, -1.8763427734375, -1.782958984375, -1.6895751953125, -1.59619140625, -1.5028076171875, -1.409423828125, -1.3160400390625, -1.22265625, -1.1292724609375, -1.035888671875, -0.9425048828125, -0.84912109375, -0.7557373046875, -0.662353515625, -0.5689697265625, -0.4755859375, -0.3822021484375, -0.288818359375, -0.1954345703125, -0.10205078125, -0.0086669921875, 0.084716796875, 0.1781005859375, 0.271484375, 0.3648681640625, 0.458251953125, 0.5516357421875, 0.64501953125, 0.7384033203125, 0.831787109375, 0.9251708984375, 1.0185546875, 1.1119384765625, 1.205322265625, 1.2987060546875, 1.39208984375, 1.4854736328125, 1.578857421875, 1.6722412109375, 1.765625, 1.8590087890625, 1.952392578125, 2.0457763671875, 2.13916015625, 2.2325439453125, 2.325927734375, 2.4193115234375, 2.5126953125, 2.6060791015625, 2.699462890625, 2.7928466796875, 2.88623046875, 2.9796142578125, 3.072998046875, 3.1663818359375, 3.259765625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 9.0, 3.0, 4.0, 7.0, 10.0, 13.0, 20.0, 17.0, 25.0, 21.0, 32.0, 36.0, 46.0, 52.0, 44.0, 38.0, 39.0, 49.0, 44.0, 52.0, 56.0, 47.0, 44.0, 35.0, 33.0, 24.0, 26.0, 35.0, 25.0, 14.0, 13.0, 26.0, 10.0, 14.0, 6.0, 8.0, 7.0, 12.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.144612312316895, -7.875809669494629, -7.607007026672363, -7.338204383850098, -7.069401741027832, -6.800599098205566, -6.531795978546143, -6.262993335723877, -5.994190692901611, -5.725388050079346, -5.45658540725708, -5.1877827644348145, -4.918979644775391, -4.650177001953125, -4.381374359130859, -4.112571716308594, -3.843769073486328, -3.5749664306640625, -3.306163787841797, -3.037360906600952, -2.7685582637786865, -2.499755620956421, -2.230952739715576, -1.9621500968933105, -1.693347454071045, -1.4245448112487793, -1.1557420492172241, -0.8869393467903137, -0.6181366443634033, -0.3493340015411377, -0.08053123950958252, 0.18827152252197266, 0.4570732116699219, 0.7258759140968323, 0.9946786165237427, 1.2634813785552979, 1.5322840213775635, 1.801086664199829, 2.069889545440674, 2.3386921882629395, 2.607494831085205, 2.8762974739074707, 3.1451001167297363, 3.413902997970581, 3.6827056407928467, 3.9515082836151123, 4.220311164855957, 4.489113807678223, 4.757916450500488, 5.026719093322754, 5.2955217361450195, 5.564324378967285, 5.833127021789551, 6.101929664611816, 6.37073278427124, 6.639535427093506, 6.9083380699157715, 7.177140712738037, 7.445943355560303, 7.714745998382568, 7.983549118041992, 8.252351760864258, 8.521154403686523, 8.789957046508789, 9.058759689331055]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 2.0, 1.0, 2.0, 5.0, 9.0, 5.0, 4.0, 8.0, 9.0, 10.0, 9.0, 22.0, 23.0, 25.0, 29.0, 29.0, 34.0, 48.0, 40.0, 39.0, 32.0, 48.0, 38.0, 40.0, 44.0, 34.0, 48.0, 44.0, 43.0, 31.0, 30.0, 32.0, 31.0, 22.0, 25.0, 16.0, 15.0, 14.0, 15.0, 9.0, 12.0, 7.0, 3.0, 3.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.632984161376953, -8.378067016601562, -8.123149871826172, -7.868232727050781, -7.613315582275391, -7.3583984375, -7.103480815887451, -6.8485636711120605, -6.59364652633667, -6.338729381561279, -6.083812236785889, -5.828895092010498, -5.573977470397949, -5.319060325622559, -5.064143180847168, -4.809226036071777, -4.554308891296387, -4.299391746520996, -4.0444746017456055, -3.7895572185516357, -3.534640073776245, -3.2797229290008545, -3.0248055458068848, -2.769888401031494, -2.5149712562561035, -2.260054111480713, -2.0051369667053223, -1.7502195835113525, -1.495302438735962, -1.2403852939605713, -0.9854680299758911, -0.7305507659912109, -0.4756331443786621, -0.2207159399986267, 0.03420126438140869, 0.2891184687614441, 0.5440356731414795, 0.7989528179168701, 1.0538700819015503, 1.3087873458862305, 1.563704490661621, 1.8186216354370117, 2.0735387802124023, 2.328456163406372, 2.5833733081817627, 2.8382904529571533, 3.093207836151123, 3.3481249809265137, 3.6030421257019043, 3.857959270477295, 4.1128764152526855, 4.367793560028076, 4.622711181640625, 4.877628326416016, 5.132545471191406, 5.387462615966797, 5.6423797607421875, 5.897296905517578, 6.152214050292969, 6.407131195068359, 6.66204833984375, 6.916965484619141, 7.1718831062316895, 7.42680025100708, 7.681717395782471]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 9.0, 7.0, 12.0, 14.0, 33.0, 48.0, 66.0, 93.0, 206.0, 302.0, 498.0, 763.0, 1276.0, 1973.0, 3287.0, 5340.0, 8671.0, 14004.0, 22097.0, 34541.0, 51494.0, 74625.0, 102648.0, 127048.0, 137310.0, 128825.0, 104936.0, 77411.0, 53776.0, 35736.0, 23194.0, 14483.0, 8977.0, 5688.0, 3464.0, 2188.0, 1354.0, 875.0, 501.0, 302.0, 190.0, 109.0, 83.0, 48.0, 31.0, 8.0, 7.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.07421875, -6.81744384765625, -6.5606689453125, -6.30389404296875, -6.047119140625, -5.79034423828125, -5.5335693359375, -5.27679443359375, -5.02001953125, -4.76324462890625, -4.5064697265625, -4.24969482421875, -3.992919921875, -3.73614501953125, -3.4793701171875, -3.22259521484375, -2.9658203125, -2.70904541015625, -2.4522705078125, -2.19549560546875, -1.938720703125, -1.68194580078125, -1.4251708984375, -1.16839599609375, -0.91162109375, -0.65484619140625, -0.3980712890625, -0.14129638671875, 0.115478515625, 0.37225341796875, 0.6290283203125, 0.88580322265625, 1.142578125, 1.39935302734375, 1.6561279296875, 1.91290283203125, 2.169677734375, 2.42645263671875, 2.6832275390625, 2.94000244140625, 3.19677734375, 3.45355224609375, 3.7103271484375, 3.96710205078125, 4.223876953125, 4.48065185546875, 4.7374267578125, 4.99420166015625, 5.2509765625, 5.50775146484375, 5.7645263671875, 6.02130126953125, 6.278076171875, 6.53485107421875, 6.7916259765625, 7.04840087890625, 7.30517578125, 7.56195068359375, 7.8187255859375, 8.07550048828125, 8.332275390625, 8.58905029296875, 8.8458251953125, 9.10260009765625, 9.359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 8.0, 2.0, 6.0, 6.0, 5.0, 6.0, 12.0, 12.0, 21.0, 19.0, 23.0, 31.0, 27.0, 25.0, 41.0, 43.0, 32.0, 37.0, 39.0, 36.0, 44.0, 45.0, 45.0, 41.0, 36.0, 41.0, 34.0, 30.0, 45.0, 33.0, 32.0, 17.0, 24.0, 11.0, 18.0, 11.0, 14.0, 7.0, 5.0, 8.0, 12.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.875, -7.63897705078125, -7.4029541015625, -7.16693115234375, -6.930908203125, -6.69488525390625, -6.4588623046875, -6.22283935546875, -5.98681640625, -5.75079345703125, -5.5147705078125, -5.27874755859375, -5.042724609375, -4.80670166015625, -4.5706787109375, -4.33465576171875, -4.0986328125, -3.86260986328125, -3.6265869140625, -3.39056396484375, -3.154541015625, -2.91851806640625, -2.6824951171875, -2.44647216796875, -2.21044921875, -1.97442626953125, -1.7384033203125, -1.50238037109375, -1.266357421875, -1.03033447265625, -0.7943115234375, -0.55828857421875, -0.322265625, -0.08624267578125, 0.1497802734375, 0.38580322265625, 0.621826171875, 0.85784912109375, 1.0938720703125, 1.32989501953125, 1.56591796875, 1.80194091796875, 2.0379638671875, 2.27398681640625, 2.510009765625, 2.74603271484375, 2.9820556640625, 3.21807861328125, 3.4541015625, 3.69012451171875, 3.9261474609375, 4.16217041015625, 4.398193359375, 4.63421630859375, 4.8702392578125, 5.10626220703125, 5.34228515625, 5.57830810546875, 5.8143310546875, 6.05035400390625, 6.286376953125, 6.52239990234375, 6.7584228515625, 6.99444580078125, 7.23046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 16.0, 16.0, 25.0, 38.0, 62.0, 91.0, 136.0, 194.0, 327.0, 449.0, 705.0, 1047.0, 1601.0, 2587.0, 4079.0, 6613.0, 10798.0, 17878.0, 30065.0, 50844.0, 85387.0, 134476.0, 181145.0, 179159.0, 132110.0, 83054.0, 49611.0, 30041.0, 17636.0, 10618.0, 6545.0, 3977.0, 2526.0, 1623.0, 1058.0, 687.0, 453.0, 306.0, 192.0, 127.0, 81.0, 63.0, 41.0, 29.0, 12.0, 13.0, 9.0, 5.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-11.9609375, -11.60888671875, -11.2568359375, -10.90478515625, -10.552734375, -10.20068359375, -9.8486328125, -9.49658203125, -9.14453125, -8.79248046875, -8.4404296875, -8.08837890625, -7.736328125, -7.38427734375, -7.0322265625, -6.68017578125, -6.328125, -5.97607421875, -5.6240234375, -5.27197265625, -4.919921875, -4.56787109375, -4.2158203125, -3.86376953125, -3.51171875, -3.15966796875, -2.8076171875, -2.45556640625, -2.103515625, -1.75146484375, -1.3994140625, -1.04736328125, -0.6953125, -0.34326171875, 0.0087890625, 0.36083984375, 0.712890625, 1.06494140625, 1.4169921875, 1.76904296875, 2.12109375, 2.47314453125, 2.8251953125, 3.17724609375, 3.529296875, 3.88134765625, 4.2333984375, 4.58544921875, 4.9375, 5.28955078125, 5.6416015625, 5.99365234375, 6.345703125, 6.69775390625, 7.0498046875, 7.40185546875, 7.75390625, 8.10595703125, 8.4580078125, 8.81005859375, 9.162109375, 9.51416015625, 9.8662109375, 10.21826171875, 10.5703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 8.0, 5.0, 3.0, 5.0, 9.0, 11.0, 8.0, 11.0, 22.0, 20.0, 22.0, 28.0, 20.0, 29.0, 31.0, 32.0, 33.0, 46.0, 40.0, 37.0, 40.0, 41.0, 29.0, 38.0, 46.0, 33.0, 36.0, 30.0, 35.0, 33.0, 32.0, 23.0, 23.0, 15.0, 23.0, 18.0, 12.0, 15.0, 12.0, 10.0, 5.0, 5.0, 6.0, 3.0, 5.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.0703125, -4.90240478515625, -4.7344970703125, -4.56658935546875, -4.398681640625, -4.23077392578125, -4.0628662109375, -3.89495849609375, -3.72705078125, -3.55914306640625, -3.3912353515625, -3.22332763671875, -3.055419921875, -2.88751220703125, -2.7196044921875, -2.55169677734375, -2.3837890625, -2.21588134765625, -2.0479736328125, -1.88006591796875, -1.712158203125, -1.54425048828125, -1.3763427734375, -1.20843505859375, -1.04052734375, -0.87261962890625, -0.7047119140625, -0.53680419921875, -0.368896484375, -0.20098876953125, -0.0330810546875, 0.13482666015625, 0.302734375, 0.47064208984375, 0.6385498046875, 0.80645751953125, 0.974365234375, 1.14227294921875, 1.3101806640625, 1.47808837890625, 1.64599609375, 1.81390380859375, 1.9818115234375, 2.14971923828125, 2.317626953125, 2.48553466796875, 2.6534423828125, 2.82135009765625, 2.9892578125, 3.15716552734375, 3.3250732421875, 3.49298095703125, 3.660888671875, 3.82879638671875, 3.9967041015625, 4.16461181640625, 4.33251953125, 4.50042724609375, 4.6683349609375, 4.83624267578125, 5.004150390625, 5.17205810546875, 5.3399658203125, 5.50787353515625, 5.67578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 17.0, 15.0, 36.0, 47.0, 57.0, 106.0, 138.0, 268.0, 387.0, 633.0, 1008.0, 1667.0, 2837.0, 4971.0, 9670.0, 20630.0, 47709.0, 120909.0, 276445.0, 308862.0, 145687.0, 57396.0, 24039.0, 11279.0, 5855.0, 3141.0, 1765.0, 1106.0, 676.0, 407.0, 248.0, 176.0, 114.0, 82.0, 41.0, 46.0, 22.0, 21.0, 10.0, 9.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8125, -8.5291748046875, -8.245849609375, -7.9625244140625, -7.67919921875, -7.3958740234375, -7.112548828125, -6.8292236328125, -6.5458984375, -6.2625732421875, -5.979248046875, -5.6959228515625, -5.41259765625, -5.1292724609375, -4.845947265625, -4.5626220703125, -4.279296875, -3.9959716796875, -3.712646484375, -3.4293212890625, -3.14599609375, -2.8626708984375, -2.579345703125, -2.2960205078125, -2.0126953125, -1.7293701171875, -1.446044921875, -1.1627197265625, -0.87939453125, -0.5960693359375, -0.312744140625, -0.0294189453125, 0.25390625, 0.5372314453125, 0.820556640625, 1.1038818359375, 1.38720703125, 1.6705322265625, 1.953857421875, 2.2371826171875, 2.5205078125, 2.8038330078125, 3.087158203125, 3.3704833984375, 3.65380859375, 3.9371337890625, 4.220458984375, 4.5037841796875, 4.787109375, 5.0704345703125, 5.353759765625, 5.6370849609375, 5.92041015625, 6.2037353515625, 6.487060546875, 6.7703857421875, 7.0537109375, 7.3370361328125, 7.620361328125, 7.9036865234375, 8.18701171875, 8.4703369140625, 8.753662109375, 9.0369873046875, 9.3203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 9.0, 6.0, 5.0, 10.0, 13.0, 10.0, 12.0, 29.0, 32.0, 42.0, 42.0, 57.0, 55.0, 83.0, 92.0, 79.0, 69.0, 65.0, 68.0, 46.0, 41.0, 26.0, 19.0, 27.0, 18.0, 11.0, 7.0, 8.0, 7.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005421638488769531, -0.000520855188369751, -0.0004995465278625488, -0.0004782378673553467, -0.00045692920684814453, -0.0004356205463409424, -0.00041431188583374023, -0.0003930032253265381, -0.00037169456481933594, -0.0003503859043121338, -0.00032907724380493164, -0.0003077685832977295, -0.00028645992279052734, -0.0002651512622833252, -0.00024384260177612305, -0.0002225339412689209, -0.00020122528076171875, -0.0001799166202545166, -0.00015860795974731445, -0.0001372992992401123, -0.00011599063873291016, -9.468197822570801e-05, -7.337331771850586e-05, -5.206465721130371e-05, -3.075599670410156e-05, -9.447336196899414e-06, 1.1861324310302734e-05, 3.316998481750488e-05, 5.447864532470703e-05, 7.578730583190918e-05, 9.709596633911133e-05, 0.00011840462684631348, 0.00013971328735351562, 0.00016102194786071777, 0.00018233060836791992, 0.00020363926887512207, 0.00022494792938232422, 0.00024625658988952637, 0.0002675652503967285, 0.00028887391090393066, 0.0003101825714111328, 0.00033149123191833496, 0.0003527998924255371, 0.00037410855293273926, 0.0003954172134399414, 0.00041672587394714355, 0.0004380345344543457, 0.00045934319496154785, 0.00048065185546875, 0.0005019605159759521, 0.0005232691764831543, 0.0005445778369903564, 0.0005658864974975586, 0.0005871951580047607, 0.0006085038185119629, 0.000629812479019165, 0.0006511211395263672, 0.0006724298000335693, 0.0006937384605407715, 0.0007150471210479736, 0.0007363557815551758, 0.0007576644420623779, 0.0007789731025695801, 0.0008002817630767822, 0.0008215904235839844]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 6.0, 8.0, 12.0, 18.0, 41.0, 55.0, 79.0, 125.0, 138.0, 249.0, 388.0, 528.0, 835.0, 1291.0, 2134.0, 3489.0, 5824.0, 10257.0, 17642.0, 30893.0, 53836.0, 89742.0, 135337.0, 170794.0, 171718.0, 135232.0, 89989.0, 53878.0, 31048.0, 17582.0, 10204.0, 5784.0, 3423.0, 2176.0, 1301.0, 860.0, 511.0, 359.0, 244.0, 176.0, 124.0, 76.0, 63.0, 28.0, 23.0, 15.0, 8.0, 3.0, 4.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.99609375, -5.80267333984375, -5.6092529296875, -5.41583251953125, -5.222412109375, -5.02899169921875, -4.8355712890625, -4.64215087890625, -4.44873046875, -4.25531005859375, -4.0618896484375, -3.86846923828125, -3.675048828125, -3.48162841796875, -3.2882080078125, -3.09478759765625, -2.9013671875, -2.70794677734375, -2.5145263671875, -2.32110595703125, -2.127685546875, -1.93426513671875, -1.7408447265625, -1.54742431640625, -1.35400390625, -1.16058349609375, -0.9671630859375, -0.77374267578125, -0.580322265625, -0.38690185546875, -0.1934814453125, -6.103515625e-05, 0.193359375, 0.38677978515625, 0.5802001953125, 0.77362060546875, 0.967041015625, 1.16046142578125, 1.3538818359375, 1.54730224609375, 1.74072265625, 1.93414306640625, 2.1275634765625, 2.32098388671875, 2.514404296875, 2.70782470703125, 2.9012451171875, 3.09466552734375, 3.2880859375, 3.48150634765625, 3.6749267578125, 3.86834716796875, 4.061767578125, 4.25518798828125, 4.4486083984375, 4.64202880859375, 4.83544921875, 5.02886962890625, 5.2222900390625, 5.41571044921875, 5.609130859375, 5.80255126953125, 5.9959716796875, 6.18939208984375, 6.3828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 10.0, 16.0, 16.0, 16.0, 21.0, 16.0, 29.0, 20.0, 41.0, 64.0, 57.0, 60.0, 64.0, 72.0, 61.0, 61.0, 73.0, 63.0, 39.0, 27.0, 24.0, 32.0, 12.0, 15.0, 17.0, 10.0, 13.0, 7.0, 11.0, 6.0, 6.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.521484375, -2.43951416015625, -2.3575439453125, -2.27557373046875, -2.193603515625, -2.11163330078125, -2.0296630859375, -1.94769287109375, -1.86572265625, -1.78375244140625, -1.7017822265625, -1.61981201171875, -1.537841796875, -1.45587158203125, -1.3739013671875, -1.29193115234375, -1.2099609375, -1.12799072265625, -1.0460205078125, -0.96405029296875, -0.882080078125, -0.80010986328125, -0.7181396484375, -0.63616943359375, -0.55419921875, -0.47222900390625, -0.3902587890625, -0.30828857421875, -0.226318359375, -0.14434814453125, -0.0623779296875, 0.01959228515625, 0.1015625, 0.18353271484375, 0.2655029296875, 0.34747314453125, 0.429443359375, 0.51141357421875, 0.5933837890625, 0.67535400390625, 0.75732421875, 0.83929443359375, 0.9212646484375, 1.00323486328125, 1.085205078125, 1.16717529296875, 1.2491455078125, 1.33111572265625, 1.4130859375, 1.49505615234375, 1.5770263671875, 1.65899658203125, 1.740966796875, 1.82293701171875, 1.9049072265625, 1.98687744140625, 2.06884765625, 2.15081787109375, 2.2327880859375, 2.31475830078125, 2.396728515625, 2.47869873046875, 2.5606689453125, 2.64263916015625, 2.724609375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 9.0, 4.0, 3.0, 8.0, 15.0, 8.0, 15.0, 14.0, 28.0, 33.0, 32.0, 37.0, 38.0, 39.0, 49.0, 32.0, 44.0, 43.0, 52.0, 43.0, 44.0, 41.0, 48.0, 44.0, 36.0, 47.0, 21.0, 25.0, 27.0, 26.0, 17.0, 16.0, 14.0, 7.0, 12.0, 11.0, 3.0, 6.0, 5.0, 4.0, 5.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.441717624664307, -7.196321487426758, -6.950925827026367, -6.705529689788818, -6.4601335525512695, -6.214737415313721, -5.969341278076172, -5.723945617675781, -5.478549480438232, -5.233153343200684, -4.987757682800293, -4.742361545562744, -4.496965408325195, -4.2515692710876465, -4.006173133850098, -3.760777473449707, -3.515381336212158, -3.2699851989746094, -3.0245893001556396, -2.77919340133667, -2.533797264099121, -2.2884011268615723, -2.0430052280426025, -1.7976092100143433, -1.552213191986084, -1.3068171739578247, -1.0614211559295654, -0.8160251379013062, -0.5706291198730469, -0.3252331018447876, -0.07983708381652832, 0.16555893421173096, 0.41095542907714844, 0.6563514471054077, 0.901747465133667, 1.1471434831619263, 1.3925395011901855, 1.6379355192184448, 1.883331537246704, 2.128727436065674, 2.3741235733032227, 2.6195197105407715, 2.864915609359741, 3.110311508178711, 3.3557076454162598, 3.6011037826538086, 3.8464996814727783, 4.091895580291748, 4.337291717529297, 4.582687854766846, 4.8280839920043945, 5.073479652404785, 5.318875789642334, 5.564271926879883, 5.809667587280273, 6.055063724517822, 6.300459861755371, 6.54585599899292, 6.791252136230469, 7.036647796630859, 7.282043933868408, 7.527440071105957, 7.772835731506348, 8.018232345581055, 8.263628005981445]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 2.0, 5.0, 6.0, 8.0, 8.0, 3.0, 12.0, 17.0, 16.0, 16.0, 27.0, 36.0, 24.0, 26.0, 33.0, 34.0, 35.0, 39.0, 31.0, 53.0, 54.0, 40.0, 40.0, 25.0, 41.0, 43.0, 35.0, 40.0, 23.0, 26.0, 21.0, 27.0, 30.0, 16.0, 22.0, 10.0, 18.0, 11.0, 10.0, 7.0, 4.0, 5.0, 3.0, 3.0, 6.0, 0.0, 5.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-7.057295799255371, -6.835038185119629, -6.612780570983887, -6.3905229568481445, -6.168265342712402, -5.94600772857666, -5.723750114440918, -5.501492500305176, -5.279234886169434, -5.056977272033691, -4.834719657897949, -4.612462043762207, -4.390204429626465, -4.167946815490723, -3.9456892013549805, -3.7234315872192383, -3.501173973083496, -3.278916358947754, -3.0566587448120117, -2.8344011306762695, -2.6121435165405273, -2.389885902404785, -2.167628288269043, -1.9453706741333008, -1.7231130599975586, -1.5008554458618164, -1.2785978317260742, -1.056340217590332, -0.8340826034545898, -0.6118249893188477, -0.38956737518310547, -0.16730976104736328, 0.0549473762512207, 0.2772049903869629, 0.4994626045227051, 0.7217202186584473, 0.9439778327941895, 1.1662354469299316, 1.3884930610656738, 1.610750675201416, 1.8330082893371582, 2.0552659034729004, 2.2775235176086426, 2.4997811317443848, 2.722038745880127, 2.944296360015869, 3.1665539741516113, 3.3888115882873535, 3.6110692024230957, 3.833326816558838, 4.05558443069458, 4.277842044830322, 4.5000996589660645, 4.722357273101807, 4.944614887237549, 5.166872501373291, 5.389130115509033, 5.611387729644775, 5.833645343780518, 6.05590295791626, 6.278160572052002, 6.500418186187744, 6.722675800323486, 6.9449334144592285, 7.167191028594971]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 10.0, 22.0, 26.0, 65.0, 81.0, 137.0, 234.0, 385.0, 646.0, 1075.0, 1837.0, 2965.0, 4636.0, 7356.0, 11519.0, 17443.0, 25358.0, 35785.0, 48656.0, 63281.0, 77226.0, 90442.0, 98478.0, 100956.0, 96581.0, 86847.0, 73844.0, 58908.0, 44817.0, 33029.0, 23149.0, 15427.0, 10247.0, 6453.0, 4063.0, 2702.0, 1570.0, 961.0, 554.0, 303.0, 175.0, 139.0, 69.0, 42.0, 23.0, 16.0, 9.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.6953125, -4.5545654296875, -4.413818359375, -4.2730712890625, -4.13232421875, -3.9915771484375, -3.850830078125, -3.7100830078125, -3.5693359375, -3.4285888671875, -3.287841796875, -3.1470947265625, -3.00634765625, -2.8656005859375, -2.724853515625, -2.5841064453125, -2.443359375, -2.3026123046875, -2.161865234375, -2.0211181640625, -1.88037109375, -1.7396240234375, -1.598876953125, -1.4581298828125, -1.3173828125, -1.1766357421875, -1.035888671875, -0.8951416015625, -0.75439453125, -0.6136474609375, -0.472900390625, -0.3321533203125, -0.19140625, -0.0506591796875, 0.090087890625, 0.2308349609375, 0.37158203125, 0.5123291015625, 0.653076171875, 0.7938232421875, 0.9345703125, 1.0753173828125, 1.216064453125, 1.3568115234375, 1.49755859375, 1.6383056640625, 1.779052734375, 1.9197998046875, 2.060546875, 2.2012939453125, 2.342041015625, 2.4827880859375, 2.62353515625, 2.7642822265625, 2.905029296875, 3.0457763671875, 3.1865234375, 3.3272705078125, 3.468017578125, 3.6087646484375, 3.74951171875, 3.8902587890625, 4.031005859375, 4.1717529296875, 4.3125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 8.0, 9.0, 17.0, 8.0, 18.0, 18.0, 22.0, 24.0, 34.0, 32.0, 32.0, 38.0, 39.0, 42.0, 63.0, 42.0, 46.0, 47.0, 41.0, 39.0, 30.0, 39.0, 40.0, 30.0, 23.0, 25.0, 34.0, 20.0, 19.0, 15.0, 18.0, 14.0, 7.0, 6.0, 9.0, 8.0, 3.0, 3.0, 9.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 2.0, 3.0], "bins": [-8.1015625, -7.8636474609375, -7.625732421875, -7.3878173828125, -7.14990234375, -6.9119873046875, -6.674072265625, -6.4361572265625, -6.1982421875, -5.9603271484375, -5.722412109375, -5.4844970703125, -5.24658203125, -5.0086669921875, -4.770751953125, -4.5328369140625, -4.294921875, -4.0570068359375, -3.819091796875, -3.5811767578125, -3.34326171875, -3.1053466796875, -2.867431640625, -2.6295166015625, -2.3916015625, -2.1536865234375, -1.915771484375, -1.6778564453125, -1.43994140625, -1.2020263671875, -0.964111328125, -0.7261962890625, -0.48828125, -0.2503662109375, -0.012451171875, 0.2254638671875, 0.46337890625, 0.7012939453125, 0.939208984375, 1.1771240234375, 1.4150390625, 1.6529541015625, 1.890869140625, 2.1287841796875, 2.36669921875, 2.6046142578125, 2.842529296875, 3.0804443359375, 3.318359375, 3.5562744140625, 3.794189453125, 4.0321044921875, 4.27001953125, 4.5079345703125, 4.745849609375, 4.9837646484375, 5.2216796875, 5.4595947265625, 5.697509765625, 5.9354248046875, 6.17333984375, 6.4112548828125, 6.649169921875, 6.8870849609375, 7.125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 16.0, 22.0, 59.0, 60.0, 125.0, 185.0, 260.0, 419.0, 662.0, 1019.0, 1581.0, 2419.0, 3595.0, 5564.0, 8246.0, 12216.0, 18012.0, 25620.0, 34914.0, 46688.0, 60463.0, 74566.0, 86762.0, 94237.0, 97179.0, 94766.0, 85385.0, 73847.0, 59968.0, 45953.0, 34973.0, 25011.0, 17780.0, 12196.0, 8152.0, 5497.0, 3546.0, 2286.0, 1529.0, 990.0, 623.0, 430.0, 275.0, 166.0, 111.0, 60.0, 50.0, 28.0, 18.0, 6.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.55078125, -5.37445068359375, -5.1981201171875, -5.02178955078125, -4.845458984375, -4.66912841796875, -4.4927978515625, -4.31646728515625, -4.14013671875, -3.96380615234375, -3.7874755859375, -3.61114501953125, -3.434814453125, -3.25848388671875, -3.0821533203125, -2.90582275390625, -2.7294921875, -2.55316162109375, -2.3768310546875, -2.20050048828125, -2.024169921875, -1.84783935546875, -1.6715087890625, -1.49517822265625, -1.31884765625, -1.14251708984375, -0.9661865234375, -0.78985595703125, -0.613525390625, -0.43719482421875, -0.2608642578125, -0.08453369140625, 0.091796875, 0.26812744140625, 0.4444580078125, 0.62078857421875, 0.797119140625, 0.97344970703125, 1.1497802734375, 1.32611083984375, 1.50244140625, 1.67877197265625, 1.8551025390625, 2.03143310546875, 2.207763671875, 2.38409423828125, 2.5604248046875, 2.73675537109375, 2.9130859375, 3.08941650390625, 3.2657470703125, 3.44207763671875, 3.618408203125, 3.79473876953125, 3.9710693359375, 4.14739990234375, 4.32373046875, 4.50006103515625, 4.6763916015625, 4.85272216796875, 5.029052734375, 5.20538330078125, 5.3817138671875, 5.55804443359375, 5.734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 13.0, 5.0, 5.0, 10.0, 15.0, 20.0, 20.0, 32.0, 25.0, 26.0, 35.0, 27.0, 45.0, 43.0, 37.0, 36.0, 49.0, 40.0, 38.0, 46.0, 39.0, 33.0, 44.0, 36.0, 42.0, 26.0, 29.0, 29.0, 30.0, 15.0, 15.0, 20.0, 14.0, 16.0, 9.0, 6.0, 8.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.9765625, -4.820556640625, -4.66455078125, -4.508544921875, -4.3525390625, -4.196533203125, -4.04052734375, -3.884521484375, -3.728515625, -3.572509765625, -3.41650390625, -3.260498046875, -3.1044921875, -2.948486328125, -2.79248046875, -2.636474609375, -2.48046875, -2.324462890625, -2.16845703125, -2.012451171875, -1.8564453125, -1.700439453125, -1.54443359375, -1.388427734375, -1.232421875, -1.076416015625, -0.92041015625, -0.764404296875, -0.6083984375, -0.452392578125, -0.29638671875, -0.140380859375, 0.015625, 0.171630859375, 0.32763671875, 0.483642578125, 0.6396484375, 0.795654296875, 0.95166015625, 1.107666015625, 1.263671875, 1.419677734375, 1.57568359375, 1.731689453125, 1.8876953125, 2.043701171875, 2.19970703125, 2.355712890625, 2.51171875, 2.667724609375, 2.82373046875, 2.979736328125, 3.1357421875, 3.291748046875, 3.44775390625, 3.603759765625, 3.759765625, 3.915771484375, 4.07177734375, 4.227783203125, 4.3837890625, 4.539794921875, 4.69580078125, 4.851806640625, 5.0078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 14.0, 11.0, 12.0, 19.0, 53.0, 73.0, 96.0, 161.0, 229.0, 351.0, 543.0, 867.0, 1355.0, 2050.0, 3051.0, 4998.0, 7675.0, 11749.0, 17738.0, 26083.0, 37628.0, 51741.0, 67811.0, 83926.0, 96871.0, 104980.0, 105795.0, 98011.0, 84986.0, 69450.0, 52777.0, 38517.0, 26487.0, 18184.0, 12029.0, 7803.0, 5166.0, 3273.0, 2140.0, 1351.0, 888.0, 549.0, 353.0, 242.0, 144.0, 109.0, 65.0, 57.0, 33.0, 17.0, 14.0, 8.0, 9.0, 6.0, 3.0, 0.0, 1.0], "bins": [-1.5439453125, -1.4972076416015625, -1.450469970703125, -1.4037322998046875, -1.35699462890625, -1.3102569580078125, -1.263519287109375, -1.2167816162109375, -1.1700439453125, -1.1233062744140625, -1.076568603515625, -1.0298309326171875, -0.98309326171875, -0.9363555908203125, -0.889617919921875, -0.8428802490234375, -0.796142578125, -0.7494049072265625, -0.702667236328125, -0.6559295654296875, -0.60919189453125, -0.5624542236328125, -0.515716552734375, -0.4689788818359375, -0.4222412109375, -0.3755035400390625, -0.328765869140625, -0.2820281982421875, -0.23529052734375, -0.1885528564453125, -0.141815185546875, -0.0950775146484375, -0.04833984375, -0.0016021728515625, 0.045135498046875, 0.0918731689453125, 0.13861083984375, 0.1853485107421875, 0.232086181640625, 0.2788238525390625, 0.3255615234375, 0.3722991943359375, 0.419036865234375, 0.4657745361328125, 0.51251220703125, 0.5592498779296875, 0.605987548828125, 0.6527252197265625, 0.699462890625, 0.7462005615234375, 0.792938232421875, 0.8396759033203125, 0.88641357421875, 0.9331512451171875, 0.979888916015625, 1.0266265869140625, 1.0733642578125, 1.1201019287109375, 1.166839599609375, 1.2135772705078125, 1.26031494140625, 1.3070526123046875, 1.353790283203125, 1.4005279541015625, 1.447265625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 12.0, 9.0, 9.0, 11.0, 12.0, 20.0, 14.0, 20.0, 23.0, 32.0, 32.0, 31.0, 34.0, 41.0, 36.0, 60.0, 46.0, 48.0, 50.0, 57.0, 48.0, 50.0, 32.0, 30.0, 38.0, 31.0, 32.0, 22.0, 25.0, 26.0, 14.0, 15.0, 6.0, 13.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019288063049316406, -0.0001862160861492157, -0.00017955154180526733, -0.00017288699746131897, -0.0001662224531173706, -0.00015955790877342224, -0.00015289336442947388, -0.0001462288200855255, -0.00013956427574157715, -0.00013289973139762878, -0.00012623518705368042, -0.00011957064270973206, -0.00011290609836578369, -0.00010624155402183533, -9.957700967788696e-05, -9.29124653339386e-05, -8.624792098999023e-05, -7.958337664604187e-05, -7.29188323020935e-05, -6.625428795814514e-05, -5.958974361419678e-05, -5.292519927024841e-05, -4.626065492630005e-05, -3.9596110582351685e-05, -3.293156623840332e-05, -2.6267021894454956e-05, -1.9602477550506592e-05, -1.2937933206558228e-05, -6.273388862609863e-06, 3.91155481338501e-07, 7.055699825286865e-06, 1.372024416923523e-05, 2.0384788513183594e-05, 2.7049332857131958e-05, 3.371387720108032e-05, 4.0378421545028687e-05, 4.704296588897705e-05, 5.3707510232925415e-05, 6.037205457687378e-05, 6.703659892082214e-05, 7.370114326477051e-05, 8.036568760871887e-05, 8.703023195266724e-05, 9.36947762966156e-05, 0.00010035932064056396, 0.00010702386498451233, 0.0001136884093284607, 0.00012035295367240906, 0.00012701749801635742, 0.00013368204236030579, 0.00014034658670425415, 0.00014701113104820251, 0.00015367567539215088, 0.00016034021973609924, 0.0001670047640800476, 0.00017366930842399597, 0.00018033385276794434, 0.0001869983971118927, 0.00019366294145584106, 0.00020032748579978943, 0.0002069920301437378, 0.00021365657448768616, 0.00022032111883163452, 0.00022698566317558289, 0.00023365020751953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 6.0, 3.0, 11.0, 19.0, 29.0, 33.0, 54.0, 100.0, 138.0, 227.0, 400.0, 614.0, 908.0, 1519.0, 2454.0, 3900.0, 6117.0, 9769.0, 15297.0, 23536.0, 34339.0, 48614.0, 65814.0, 83921.0, 99769.0, 109363.0, 110935.0, 103021.0, 89366.0, 71624.0, 54100.0, 38065.0, 26272.0, 17665.0, 11217.0, 7175.0, 4487.0, 2834.0, 1790.0, 1082.0, 729.0, 437.0, 299.0, 186.0, 122.0, 72.0, 44.0, 32.0, 26.0, 13.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4853515625, -1.43609619140625, -1.3868408203125, -1.33758544921875, -1.288330078125, -1.23907470703125, -1.1898193359375, -1.14056396484375, -1.09130859375, -1.04205322265625, -0.9927978515625, -0.94354248046875, -0.894287109375, -0.84503173828125, -0.7957763671875, -0.74652099609375, -0.697265625, -0.64801025390625, -0.5987548828125, -0.54949951171875, -0.500244140625, -0.45098876953125, -0.4017333984375, -0.35247802734375, -0.30322265625, -0.25396728515625, -0.2047119140625, -0.15545654296875, -0.106201171875, -0.05694580078125, -0.0076904296875, 0.04156494140625, 0.0908203125, 0.14007568359375, 0.1893310546875, 0.23858642578125, 0.287841796875, 0.33709716796875, 0.3863525390625, 0.43560791015625, 0.48486328125, 0.53411865234375, 0.5833740234375, 0.63262939453125, 0.681884765625, 0.73114013671875, 0.7803955078125, 0.82965087890625, 0.87890625, 0.92816162109375, 0.9774169921875, 1.02667236328125, 1.075927734375, 1.12518310546875, 1.1744384765625, 1.22369384765625, 1.27294921875, 1.32220458984375, 1.3714599609375, 1.42071533203125, 1.469970703125, 1.51922607421875, 1.5684814453125, 1.61773681640625, 1.6669921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 8.0, 10.0, 7.0, 18.0, 16.0, 27.0, 41.0, 41.0, 49.0, 48.0, 71.0, 63.0, 59.0, 65.0, 65.0, 67.0, 57.0, 39.0, 48.0, 40.0, 41.0, 27.0, 17.0, 10.0, 21.0, 13.0, 5.0, 3.0, 4.0, 3.0, 6.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9921875, -0.9622879028320312, -0.9323883056640625, -0.9024887084960938, -0.872589111328125, -0.8426895141601562, -0.8127899169921875, -0.7828903198242188, -0.75299072265625, -0.7230911254882812, -0.6931915283203125, -0.6632919311523438, -0.633392333984375, -0.6034927368164062, -0.5735931396484375, -0.5436935424804688, -0.5137939453125, -0.48389434814453125, -0.4539947509765625, -0.42409515380859375, -0.394195556640625, -0.36429595947265625, -0.3343963623046875, -0.30449676513671875, -0.27459716796875, -0.24469757080078125, -0.2147979736328125, -0.18489837646484375, -0.154998779296875, -0.12509918212890625, -0.0951995849609375, -0.06529998779296875, -0.035400390625, -0.00550079345703125, 0.0243988037109375, 0.05429840087890625, 0.084197998046875, 0.11409759521484375, 0.1439971923828125, 0.17389678955078125, 0.20379638671875, 0.23369598388671875, 0.2635955810546875, 0.29349517822265625, 0.323394775390625, 0.35329437255859375, 0.3831939697265625, 0.41309356689453125, 0.4429931640625, 0.47289276123046875, 0.5027923583984375, 0.5326919555664062, 0.562591552734375, 0.5924911499023438, 0.6223907470703125, 0.6522903442382812, 0.68218994140625, 0.7120895385742188, 0.7419891357421875, 0.7718887329101562, 0.801788330078125, 0.8316879272460938, 0.8615875244140625, 0.8914871215820312, 0.92138671875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 7.0, 13.0, 6.0, 17.0, 12.0, 23.0, 23.0, 21.0, 25.0, 32.0, 32.0, 41.0, 58.0, 34.0, 45.0, 39.0, 49.0, 45.0, 40.0, 34.0, 50.0, 37.0, 45.0, 36.0, 32.0, 25.0, 25.0, 23.0, 20.0, 17.0, 15.0, 15.0, 8.0, 10.0, 10.0, 7.0, 4.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-7.954412460327148, -7.717670440673828, -7.480928421020508, -7.2441864013671875, -7.007443904876709, -6.770701885223389, -6.533959865570068, -6.297217845916748, -6.0604753494262695, -5.823733329772949, -5.586991310119629, -5.350249290466309, -5.11350679397583, -4.87676477432251, -4.6400227546691895, -4.403280735015869, -4.166538715362549, -3.9297966957092285, -3.693054437637329, -3.456312417984009, -3.2195701599121094, -2.982828140258789, -2.7460861206054688, -2.5093441009521484, -2.272601842880249, -2.0358598232269287, -1.7991175651550293, -1.562375545501709, -1.3256334066390991, -1.0888912677764893, -0.852149248123169, -0.6154071092605591, -0.378664493560791, -0.14192238450050354, 0.09481972455978394, 0.331561803817749, 0.5683039426803589, 0.8050460815429688, 1.041788101196289, 1.278530240058899, 1.5152723789215088, 1.7520145177841187, 1.9887566566467285, 2.225498676300049, 2.462240695953369, 2.6989829540252686, 2.935724973678589, 3.1724672317504883, 3.4092092514038086, 3.645951271057129, 3.8826935291290283, 4.1194353103637695, 4.356177806854248, 4.592919826507568, 4.829661846160889, 5.066403865814209, 5.3031463623046875, 5.539888381958008, 5.776630401611328, 6.013372421264648, 6.250114917755127, 6.486856937408447, 6.723598957061768, 6.960340976715088, 7.197082996368408]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 7.0, 7.0, 10.0, 14.0, 14.0, 19.0, 14.0, 28.0, 29.0, 34.0, 35.0, 38.0, 23.0, 36.0, 36.0, 38.0, 49.0, 36.0, 46.0, 36.0, 26.0, 31.0, 33.0, 53.0, 39.0, 33.0, 36.0, 18.0, 33.0, 24.0, 15.0, 15.0, 17.0, 10.0, 14.0, 11.0, 4.0, 6.0, 5.0, 2.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.722298622131348, -7.485788345336914, -7.2492780685424805, -7.012767791748047, -6.776257514953613, -6.53974723815918, -6.303237438201904, -6.066727161407471, -5.830216884613037, -5.5937066078186035, -5.35719633102417, -5.120686054229736, -4.884176254272461, -4.647665977478027, -4.411155700683594, -4.17464542388916, -3.9381351470947266, -3.701624870300293, -3.4651145935058594, -3.228604555130005, -2.9920942783355713, -2.7555840015411377, -2.519073963165283, -2.2825636863708496, -2.046053409576416, -1.8095431327819824, -1.5730329751968384, -1.3365228176116943, -1.1000125408172607, -0.8635022640228271, -0.6269921064376831, -0.39048194885253906, -0.15397119522094727, 0.08253902196884155, 0.31904923915863037, 0.5555594563484192, 0.792069673538208, 1.0285799503326416, 1.2650901079177856, 1.5016002655029297, 1.7381105422973633, 1.9746208190917969, 2.2111310958862305, 2.447641134262085, 2.6841514110565186, 2.920661687850952, 3.1571717262268066, 3.3936820030212402, 3.630192279815674, 3.8667025566101074, 4.103212833404541, 4.339723110198975, 4.57623291015625, 4.812743186950684, 5.049253463745117, 5.285763740539551, 5.522274017333984, 5.758784294128418, 5.995294570922852, 6.231804847717285, 6.468315124511719, 6.704825401306152, 6.941335201263428, 7.177845478057861, 7.414355754852295]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 8.0, 15.0, 18.0, 27.0, 39.0, 63.0, 126.0, 168.0, 299.0, 462.0, 666.0, 1134.0, 1778.0, 3013.0, 4749.0, 7768.0, 12628.0, 20292.0, 33584.0, 52891.0, 85203.0, 133993.0, 203129.0, 297495.0, 409604.0, 507368.0, 552328.0, 518992.0, 427832.0, 316282.0, 218794.0, 143353.0, 91829.0, 57342.0, 35156.0, 21886.0, 13082.0, 8085.0, 4913.0, 3018.0, 1855.0, 1123.0, 722.0, 438.0, 266.0, 195.0, 87.0, 67.0, 50.0, 23.0, 16.0, 10.0, 12.0, 10.0, 8.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.859375, -5.66778564453125, -5.4761962890625, -5.28460693359375, -5.093017578125, -4.90142822265625, -4.7098388671875, -4.51824951171875, -4.32666015625, -4.13507080078125, -3.9434814453125, -3.75189208984375, -3.560302734375, -3.36871337890625, -3.1771240234375, -2.98553466796875, -2.7939453125, -2.60235595703125, -2.4107666015625, -2.21917724609375, -2.027587890625, -1.83599853515625, -1.6444091796875, -1.45281982421875, -1.26123046875, -1.06964111328125, -0.8780517578125, -0.68646240234375, -0.494873046875, -0.30328369140625, -0.1116943359375, 0.07989501953125, 0.271484375, 0.46307373046875, 0.6546630859375, 0.84625244140625, 1.037841796875, 1.22943115234375, 1.4210205078125, 1.61260986328125, 1.80419921875, 1.99578857421875, 2.1873779296875, 2.37896728515625, 2.570556640625, 2.76214599609375, 2.9537353515625, 3.14532470703125, 3.3369140625, 3.52850341796875, 3.7200927734375, 3.91168212890625, 4.103271484375, 4.29486083984375, 4.4864501953125, 4.67803955078125, 4.86962890625, 5.06121826171875, 5.2528076171875, 5.44439697265625, 5.635986328125, 5.82757568359375, 6.0191650390625, 6.21075439453125, 6.40234375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 6.0, 5.0, 13.0, 10.0, 19.0, 22.0, 16.0, 16.0, 37.0, 38.0, 37.0, 38.0, 41.0, 39.0, 36.0, 40.0, 43.0, 44.0, 35.0, 40.0, 50.0, 30.0, 40.0, 43.0, 30.0, 44.0, 26.0, 23.0, 22.0, 18.0, 20.0, 11.0, 13.0, 5.0, 5.0, 7.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.43359375, -6.236328125, -6.0390625, -5.841796875, -5.64453125, -5.447265625, -5.25, -5.052734375, -4.85546875, -4.658203125, -4.4609375, -4.263671875, -4.06640625, -3.869140625, -3.671875, -3.474609375, -3.27734375, -3.080078125, -2.8828125, -2.685546875, -2.48828125, -2.291015625, -2.09375, -1.896484375, -1.69921875, -1.501953125, -1.3046875, -1.107421875, -0.91015625, -0.712890625, -0.515625, -0.318359375, -0.12109375, 0.076171875, 0.2734375, 0.470703125, 0.66796875, 0.865234375, 1.0625, 1.259765625, 1.45703125, 1.654296875, 1.8515625, 2.048828125, 2.24609375, 2.443359375, 2.640625, 2.837890625, 3.03515625, 3.232421875, 3.4296875, 3.626953125, 3.82421875, 4.021484375, 4.21875, 4.416015625, 4.61328125, 4.810546875, 5.0078125, 5.205078125, 5.40234375, 5.599609375, 5.796875, 5.994140625, 6.19140625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 5.0, 6.0, 13.0, 12.0, 25.0, 49.0, 86.0, 137.0, 202.0, 336.0, 483.0, 790.0, 1295.0, 2063.0, 3333.0, 5093.0, 8360.0, 12950.0, 20232.0, 31232.0, 48004.0, 72886.0, 107620.0, 155799.0, 216746.0, 288921.0, 364294.0, 424122.0, 454479.0, 444156.0, 394758.0, 324360.0, 248967.0, 181818.0, 128359.0, 86920.0, 58940.0, 38433.0, 24495.0, 15930.0, 10124.0, 6483.0, 4003.0, 2659.0, 1618.0, 1020.0, 635.0, 384.0, 264.0, 150.0, 96.0, 53.0, 29.0, 23.0, 17.0, 12.0, 6.0, 6.0, 2.0, 2.0], "bins": [-5.16015625, -5.00250244140625, -4.8448486328125, -4.68719482421875, -4.529541015625, -4.37188720703125, -4.2142333984375, -4.05657958984375, -3.89892578125, -3.74127197265625, -3.5836181640625, -3.42596435546875, -3.268310546875, -3.11065673828125, -2.9530029296875, -2.79534912109375, -2.6376953125, -2.48004150390625, -2.3223876953125, -2.16473388671875, -2.007080078125, -1.84942626953125, -1.6917724609375, -1.53411865234375, -1.37646484375, -1.21881103515625, -1.0611572265625, -0.90350341796875, -0.745849609375, -0.58819580078125, -0.4305419921875, -0.27288818359375, -0.115234375, 0.04241943359375, 0.2000732421875, 0.35772705078125, 0.515380859375, 0.67303466796875, 0.8306884765625, 0.98834228515625, 1.14599609375, 1.30364990234375, 1.4613037109375, 1.61895751953125, 1.776611328125, 1.93426513671875, 2.0919189453125, 2.24957275390625, 2.4072265625, 2.56488037109375, 2.7225341796875, 2.88018798828125, 3.037841796875, 3.19549560546875, 3.3531494140625, 3.51080322265625, 3.66845703125, 3.82611083984375, 3.9837646484375, 4.14141845703125, 4.299072265625, 4.45672607421875, 4.6143798828125, 4.77203369140625, 4.9296875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 4.0, 5.0, 4.0, 13.0, 11.0, 20.0, 26.0, 25.0, 30.0, 44.0, 39.0, 53.0, 51.0, 64.0, 98.0, 117.0, 136.0, 124.0, 136.0, 180.0, 188.0, 200.0, 222.0, 205.0, 213.0, 217.0, 182.0, 192.0, 179.0, 135.0, 153.0, 110.0, 100.0, 90.0, 92.0, 67.0, 55.0, 53.0, 47.0, 46.0, 41.0, 25.0, 20.0, 17.0, 11.0, 9.0, 5.0, 10.0, 6.0, 2.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.10546875, -2.0277099609375, -1.949951171875, -1.8721923828125, -1.79443359375, -1.7166748046875, -1.638916015625, -1.5611572265625, -1.4833984375, -1.4056396484375, -1.327880859375, -1.2501220703125, -1.17236328125, -1.0946044921875, -1.016845703125, -0.9390869140625, -0.861328125, -0.7835693359375, -0.705810546875, -0.6280517578125, -0.55029296875, -0.4725341796875, -0.394775390625, -0.3170166015625, -0.2392578125, -0.1614990234375, -0.083740234375, -0.0059814453125, 0.07177734375, 0.1495361328125, 0.227294921875, 0.3050537109375, 0.3828125, 0.4605712890625, 0.538330078125, 0.6160888671875, 0.69384765625, 0.7716064453125, 0.849365234375, 0.9271240234375, 1.0048828125, 1.0826416015625, 1.160400390625, 1.2381591796875, 1.31591796875, 1.3936767578125, 1.471435546875, 1.5491943359375, 1.626953125, 1.7047119140625, 1.782470703125, 1.8602294921875, 1.93798828125, 2.0157470703125, 2.093505859375, 2.1712646484375, 2.2490234375, 2.3267822265625, 2.404541015625, 2.4822998046875, 2.56005859375, 2.6378173828125, 2.715576171875, 2.7933349609375, 2.87109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 3.0, 4.0, 2.0, 6.0, 8.0, 11.0, 5.0, 14.0, 11.0, 13.0, 24.0, 19.0, 25.0, 22.0, 29.0, 35.0, 36.0, 44.0, 39.0, 42.0, 51.0, 40.0, 36.0, 39.0, 48.0, 51.0, 37.0, 42.0, 38.0, 37.0, 28.0, 29.0, 25.0, 18.0, 16.0, 10.0, 16.0, 9.0, 7.0, 10.0, 8.0, 3.0, 2.0, 5.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-7.474795341491699, -7.252834796905518, -7.030874252319336, -6.808913707733154, -6.586953163146973, -6.364992141723633, -6.143031597137451, -5.9210710525512695, -5.699110507965088, -5.477149963378906, -5.255189418792725, -5.033228874206543, -4.811267852783203, -4.58930778503418, -4.36734676361084, -4.145386219024658, -3.9234256744384766, -3.701465129852295, -3.4795045852661133, -3.2575438022613525, -3.035583257675171, -2.8136227130889893, -2.5916619300842285, -2.369701385498047, -2.1477408409118652, -1.9257802963256836, -1.7038196325302124, -1.4818589687347412, -1.2598984241485596, -1.037937879562378, -0.8159772157669067, -0.5940165519714355, -0.3720555305480957, -0.1500949263572693, 0.07186567783355713, 0.29382628202438354, 0.51578688621521, 0.7377474308013916, 0.9597080945968628, 1.181668758392334, 1.4036293029785156, 1.6255898475646973, 1.8475505113601685, 2.0695111751556396, 2.2914717197418213, 2.513432264328003, 2.7353930473327637, 2.9573535919189453, 3.179314136505127, 3.4012746810913086, 3.6232352256774902, 3.845196008682251, 4.067156791687012, 4.289116859436035, 4.511077880859375, 4.733038425445557, 4.954998970031738, 5.17695951461792, 5.398920059204102, 5.620880603790283, 5.842841148376465, 6.064802169799805, 6.286762714385986, 6.508723258972168, 6.73068380355835]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 3.0, 7.0, 5.0, 14.0, 13.0, 13.0, 12.0, 18.0, 20.0, 16.0, 34.0, 29.0, 34.0, 29.0, 38.0, 36.0, 46.0, 36.0, 48.0, 46.0, 52.0, 38.0, 41.0, 35.0, 36.0, 37.0, 28.0, 35.0, 25.0, 21.0, 30.0, 27.0, 14.0, 18.0, 17.0, 10.0, 6.0, 3.0, 8.0, 1.0, 3.0, 5.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-7.701112270355225, -7.468407154083252, -7.2357025146484375, -7.002997398376465, -6.770292282104492, -6.537587642669678, -6.304882526397705, -6.072177886962891, -5.839472770690918, -5.606767654418945, -5.374063014984131, -5.141357898712158, -4.908653259277344, -4.675948143005371, -4.443243026733398, -4.210537910461426, -3.9778332710266113, -3.7451283931732178, -3.512423515319824, -3.2797183990478516, -3.047013521194458, -2.8143086433410645, -2.581603527069092, -2.3488986492156982, -2.1161937713623047, -1.8834888935089111, -1.650783896446228, -1.418078899383545, -1.1853740215301514, -0.9526691436767578, -0.7199641466140747, -0.4872591495513916, -0.25455427169799805, -0.021849334239959717, 0.2108556032180786, 0.44356054067611694, 0.6762654781341553, 0.9089703559875488, 1.141675353050232, 1.374380350112915, 1.6070852279663086, 1.8397901058197021, 2.0724949836730957, 2.3052000999450684, 2.537904977798462, 2.7706098556518555, 3.003314971923828, 3.2360198497772217, 3.4687247276306152, 3.701429605484009, 3.9341344833374023, 4.166839599609375, 4.399544715881348, 4.632249355316162, 4.864954471588135, 5.097659111022949, 5.330364227294922, 5.5630693435668945, 5.795773983001709, 6.028479099273682, 6.261183738708496, 6.493888854980469, 6.726593971252441, 6.959299087524414, 7.1920037269592285]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 7.0, 15.0, 14.0, 23.0, 54.0, 79.0, 133.0, 176.0, 263.0, 427.0, 619.0, 900.0, 1369.0, 1953.0, 2942.0, 4268.0, 6170.0, 8647.0, 12120.0, 16620.0, 23047.0, 30385.0, 40530.0, 53909.0, 68369.0, 84087.0, 98385.0, 105009.0, 101360.0, 89145.0, 73500.0, 57487.0, 44936.0, 33513.0, 25267.0, 18388.0, 13522.0, 9488.0, 6702.0, 4684.0, 3249.0, 2260.0, 1503.0, 1016.0, 720.0, 452.0, 293.0, 210.0, 112.0, 71.0, 54.0, 41.0, 35.0, 21.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0], "bins": [-6.80859375, -6.593505859375, -6.37841796875, -6.163330078125, -5.9482421875, -5.733154296875, -5.51806640625, -5.302978515625, -5.087890625, -4.872802734375, -4.65771484375, -4.442626953125, -4.2275390625, -4.012451171875, -3.79736328125, -3.582275390625, -3.3671875, -3.152099609375, -2.93701171875, -2.721923828125, -2.5068359375, -2.291748046875, -2.07666015625, -1.861572265625, -1.646484375, -1.431396484375, -1.21630859375, -1.001220703125, -0.7861328125, -0.571044921875, -0.35595703125, -0.140869140625, 0.07421875, 0.289306640625, 0.50439453125, 0.719482421875, 0.9345703125, 1.149658203125, 1.36474609375, 1.579833984375, 1.794921875, 2.010009765625, 2.22509765625, 2.440185546875, 2.6552734375, 2.870361328125, 3.08544921875, 3.300537109375, 3.515625, 3.730712890625, 3.94580078125, 4.160888671875, 4.3759765625, 4.591064453125, 4.80615234375, 5.021240234375, 5.236328125, 5.451416015625, 5.66650390625, 5.881591796875, 6.0966796875, 6.311767578125, 6.52685546875, 6.741943359375, 6.95703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 7.0, 12.0, 16.0, 10.0, 13.0, 10.0, 18.0, 19.0, 21.0, 24.0, 20.0, 33.0, 32.0, 29.0, 33.0, 41.0, 31.0, 35.0, 43.0, 40.0, 35.0, 34.0, 54.0, 30.0, 32.0, 28.0, 29.0, 36.0, 36.0, 21.0, 21.0, 22.0, 27.0, 17.0, 14.0, 14.0, 13.0, 9.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.9609375, -4.8001708984375, -4.639404296875, -4.4786376953125, -4.31787109375, -4.1571044921875, -3.996337890625, -3.8355712890625, -3.6748046875, -3.5140380859375, -3.353271484375, -3.1925048828125, -3.03173828125, -2.8709716796875, -2.710205078125, -2.5494384765625, -2.388671875, -2.2279052734375, -2.067138671875, -1.9063720703125, -1.74560546875, -1.5848388671875, -1.424072265625, -1.2633056640625, -1.1025390625, -0.9417724609375, -0.781005859375, -0.6202392578125, -0.45947265625, -0.2987060546875, -0.137939453125, 0.0228271484375, 0.18359375, 0.3443603515625, 0.505126953125, 0.6658935546875, 0.82666015625, 0.9874267578125, 1.148193359375, 1.3089599609375, 1.4697265625, 1.6304931640625, 1.791259765625, 1.9520263671875, 2.11279296875, 2.2735595703125, 2.434326171875, 2.5950927734375, 2.755859375, 2.9166259765625, 3.077392578125, 3.2381591796875, 3.39892578125, 3.5596923828125, 3.720458984375, 3.8812255859375, 4.0419921875, 4.2027587890625, 4.363525390625, 4.5242919921875, 4.68505859375, 4.8458251953125, 5.006591796875, 5.1673583984375, 5.328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 9.0, 16.0, 31.0, 47.0, 66.0, 87.0, 130.0, 230.0, 293.0, 424.0, 674.0, 1030.0, 1691.0, 2561.0, 4012.0, 6074.0, 9603.0, 15190.0, 23966.0, 37646.0, 59763.0, 93199.0, 138350.0, 177602.0, 161208.0, 113386.0, 73347.0, 46359.0, 29376.0, 18761.0, 11977.0, 7557.0, 4853.0, 3184.0, 2037.0, 1348.0, 837.0, 529.0, 390.0, 245.0, 155.0, 100.0, 66.0, 48.0, 32.0, 22.0, 15.0, 6.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.3671875, -10.98486328125, -10.6025390625, -10.22021484375, -9.837890625, -9.45556640625, -9.0732421875, -8.69091796875, -8.30859375, -7.92626953125, -7.5439453125, -7.16162109375, -6.779296875, -6.39697265625, -6.0146484375, -5.63232421875, -5.25, -4.86767578125, -4.4853515625, -4.10302734375, -3.720703125, -3.33837890625, -2.9560546875, -2.57373046875, -2.19140625, -1.80908203125, -1.4267578125, -1.04443359375, -0.662109375, -0.27978515625, 0.1025390625, 0.48486328125, 0.8671875, 1.24951171875, 1.6318359375, 2.01416015625, 2.396484375, 2.77880859375, 3.1611328125, 3.54345703125, 3.92578125, 4.30810546875, 4.6904296875, 5.07275390625, 5.455078125, 5.83740234375, 6.2197265625, 6.60205078125, 6.984375, 7.36669921875, 7.7490234375, 8.13134765625, 8.513671875, 8.89599609375, 9.2783203125, 9.66064453125, 10.04296875, 10.42529296875, 10.8076171875, 11.18994140625, 11.572265625, 11.95458984375, 12.3369140625, 12.71923828125, 13.1015625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 14.0, 17.0, 20.0, 24.0, 21.0, 25.0, 38.0, 35.0, 53.0, 55.0, 40.0, 43.0, 51.0, 59.0, 58.0, 69.0, 49.0, 48.0, 47.0, 35.0, 26.0, 32.0, 36.0, 25.0, 16.0, 16.0, 7.0, 10.0, 6.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.43359375, -6.2310791015625, -6.028564453125, -5.8260498046875, -5.62353515625, -5.4210205078125, -5.218505859375, -5.0159912109375, -4.8134765625, -4.6109619140625, -4.408447265625, -4.2059326171875, -4.00341796875, -3.8009033203125, -3.598388671875, -3.3958740234375, -3.193359375, -2.9908447265625, -2.788330078125, -2.5858154296875, -2.38330078125, -2.1807861328125, -1.978271484375, -1.7757568359375, -1.5732421875, -1.3707275390625, -1.168212890625, -0.9656982421875, -0.76318359375, -0.5606689453125, -0.358154296875, -0.1556396484375, 0.046875, 0.2493896484375, 0.451904296875, 0.6544189453125, 0.85693359375, 1.0594482421875, 1.261962890625, 1.4644775390625, 1.6669921875, 1.8695068359375, 2.072021484375, 2.2745361328125, 2.47705078125, 2.6795654296875, 2.882080078125, 3.0845947265625, 3.287109375, 3.4896240234375, 3.692138671875, 3.8946533203125, 4.09716796875, 4.2996826171875, 4.502197265625, 4.7047119140625, 4.9072265625, 5.1097412109375, 5.312255859375, 5.5147705078125, 5.71728515625, 5.9197998046875, 6.122314453125, 6.3248291015625, 6.52734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 9.0, 9.0, 17.0, 21.0, 21.0, 38.0, 58.0, 54.0, 81.0, 126.0, 151.0, 240.0, 360.0, 518.0, 714.0, 1067.0, 1665.0, 2516.0, 4106.0, 7052.0, 13587.0, 32044.0, 142960.0, 668812.0, 113465.0, 28628.0, 12331.0, 6731.0, 3830.0, 2339.0, 1567.0, 1059.0, 696.0, 487.0, 338.0, 257.0, 161.0, 106.0, 100.0, 68.0, 49.0, 28.0, 28.0, 23.0, 17.0, 3.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-36.5625, -35.46923828125, -34.3759765625, -33.28271484375, -32.189453125, -31.09619140625, -30.0029296875, -28.90966796875, -27.81640625, -26.72314453125, -25.6298828125, -24.53662109375, -23.443359375, -22.35009765625, -21.2568359375, -20.16357421875, -19.0703125, -17.97705078125, -16.8837890625, -15.79052734375, -14.697265625, -13.60400390625, -12.5107421875, -11.41748046875, -10.32421875, -9.23095703125, -8.1376953125, -7.04443359375, -5.951171875, -4.85791015625, -3.7646484375, -2.67138671875, -1.578125, -0.48486328125, 0.6083984375, 1.70166015625, 2.794921875, 3.88818359375, 4.9814453125, 6.07470703125, 7.16796875, 8.26123046875, 9.3544921875, 10.44775390625, 11.541015625, 12.63427734375, 13.7275390625, 14.82080078125, 15.9140625, 17.00732421875, 18.1005859375, 19.19384765625, 20.287109375, 21.38037109375, 22.4736328125, 23.56689453125, 24.66015625, 25.75341796875, 26.8466796875, 27.93994140625, 29.033203125, 30.12646484375, 31.2197265625, 32.31298828125, 33.40625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 3.0, 4.0, 9.0, 11.0, 12.0, 12.0, 20.0, 40.0, 72.0, 108.0, 193.0, 182.0, 129.0, 54.0, 42.0, 28.0, 17.0, 10.0, 6.0, 4.0, 5.0, 5.0, 4.0, 2.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.00261688232421875, -0.0025422275066375732, -0.0024675726890563965, -0.0023929178714752197, -0.002318263053894043, -0.002243608236312866, -0.0021689534187316895, -0.0020942986011505127, -0.002019643783569336, -0.0019449889659881592, -0.0018703341484069824, -0.0017956793308258057, -0.001721024513244629, -0.0016463696956634521, -0.0015717148780822754, -0.0014970600605010986, -0.0014224052429199219, -0.0013477504253387451, -0.0012730956077575684, -0.0011984407901763916, -0.0011237859725952148, -0.001049131155014038, -0.0009744763374328613, -0.0008998215198516846, -0.0008251667022705078, -0.0007505118846893311, -0.0006758570671081543, -0.0006012022495269775, -0.0005265474319458008, -0.000451892614364624, -0.00037723779678344727, -0.0003025829792022705, -0.00022792816162109375, -0.000153273344039917, -7.861852645874023e-05, -3.9637088775634766e-06, 7.069110870361328e-05, 0.00014534592628479004, 0.0002200007438659668, 0.00029465556144714355, 0.0003693103790283203, 0.00044396519660949707, 0.0005186200141906738, 0.0005932748317718506, 0.0006679296493530273, 0.0007425844669342041, 0.0008172392845153809, 0.0008918941020965576, 0.0009665489196777344, 0.0010412037372589111, 0.0011158585548400879, 0.0011905133724212646, 0.0012651681900024414, 0.0013398230075836182, 0.001414477825164795, 0.0014891326427459717, 0.0015637874603271484, 0.0016384422779083252, 0.001713097095489502, 0.0017877519130706787, 0.0018624067306518555, 0.0019370615482330322, 0.002011716365814209, 0.0020863711833953857, 0.0021610260009765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 5.0, 6.0, 7.0, 15.0, 14.0, 45.0, 52.0, 64.0, 88.0, 163.0, 209.0, 282.0, 377.0, 580.0, 918.0, 1272.0, 1937.0, 3013.0, 4696.0, 7347.0, 12330.0, 22571.0, 49528.0, 157646.0, 429707.0, 225035.0, 64991.0, 27257.0, 14627.0, 8469.0, 5314.0, 3306.0, 2141.0, 1428.0, 965.0, 616.0, 435.0, 312.0, 255.0, 170.0, 110.0, 59.0, 57.0, 36.0, 32.0, 19.0, 16.0, 14.0, 6.0, 5.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0], "bins": [-16.453125, -15.948974609375, -15.44482421875, -14.940673828125, -14.4365234375, -13.932373046875, -13.42822265625, -12.924072265625, -12.419921875, -11.915771484375, -11.41162109375, -10.907470703125, -10.4033203125, -9.899169921875, -9.39501953125, -8.890869140625, -8.38671875, -7.882568359375, -7.37841796875, -6.874267578125, -6.3701171875, -5.865966796875, -5.36181640625, -4.857666015625, -4.353515625, -3.849365234375, -3.34521484375, -2.841064453125, -2.3369140625, -1.832763671875, -1.32861328125, -0.824462890625, -0.3203125, 0.183837890625, 0.68798828125, 1.192138671875, 1.6962890625, 2.200439453125, 2.70458984375, 3.208740234375, 3.712890625, 4.217041015625, 4.72119140625, 5.225341796875, 5.7294921875, 6.233642578125, 6.73779296875, 7.241943359375, 7.74609375, 8.250244140625, 8.75439453125, 9.258544921875, 9.7626953125, 10.266845703125, 10.77099609375, 11.275146484375, 11.779296875, 12.283447265625, 12.78759765625, 13.291748046875, 13.7958984375, 14.300048828125, 14.80419921875, 15.308349609375, 15.8125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 5.0, 4.0, 7.0, 3.0, 5.0, 14.0, 9.0, 10.0, 8.0, 10.0, 15.0, 23.0, 15.0, 36.0, 47.0, 76.0, 80.0, 129.0, 107.0, 107.0, 87.0, 50.0, 21.0, 18.0, 18.0, 15.0, 9.0, 14.0, 9.0, 12.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19921875, -4.063720703125, -3.92822265625, -3.792724609375, -3.6572265625, -3.521728515625, -3.38623046875, -3.250732421875, -3.115234375, -2.979736328125, -2.84423828125, -2.708740234375, -2.5732421875, -2.437744140625, -2.30224609375, -2.166748046875, -2.03125, -1.895751953125, -1.76025390625, -1.624755859375, -1.4892578125, -1.353759765625, -1.21826171875, -1.082763671875, -0.947265625, -0.811767578125, -0.67626953125, -0.540771484375, -0.4052734375, -0.269775390625, -0.13427734375, 0.001220703125, 0.13671875, 0.272216796875, 0.40771484375, 0.543212890625, 0.6787109375, 0.814208984375, 0.94970703125, 1.085205078125, 1.220703125, 1.356201171875, 1.49169921875, 1.627197265625, 1.7626953125, 1.898193359375, 2.03369140625, 2.169189453125, 2.3046875, 2.440185546875, 2.57568359375, 2.711181640625, 2.8466796875, 2.982177734375, 3.11767578125, 3.253173828125, 3.388671875, 3.524169921875, 3.65966796875, 3.795166015625, 3.9306640625, 4.066162109375, 4.20166015625, 4.337158203125, 4.47265625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 9.0, 11.0, 17.0, 17.0, 16.0, 21.0, 18.0, 27.0, 29.0, 19.0, 31.0, 48.0, 49.0, 50.0, 49.0, 59.0, 41.0, 59.0, 57.0, 39.0, 40.0, 40.0, 30.0, 36.0, 26.0, 23.0, 22.0, 19.0, 17.0, 11.0, 13.0, 7.0, 7.0, 5.0, 6.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.145132064819336, -6.93000602722168, -6.714879989624023, -6.499753952026367, -6.284627914428711, -6.069501876831055, -5.854375839233398, -5.639249801635742, -5.424123764038086, -5.20899772644043, -4.993871688842773, -4.778745651245117, -4.563619613647461, -4.348493576049805, -4.133367538452148, -3.918241500854492, -3.703115701675415, -3.487989664077759, -3.2728636264801025, -3.0577375888824463, -2.84261155128479, -2.627485752105713, -2.4123597145080566, -2.1972336769104004, -1.9821075201034546, -1.7669814825057983, -1.551855444908142, -1.3367295265197754, -1.1216034889221191, -0.9064774513244629, -0.6913514137268066, -0.4762253761291504, -0.26109933853149414, -0.045973315834999084, 0.16915270686149597, 0.38427871465682983, 0.5994047522544861, 0.8145307302474976, 1.0296567678451538, 1.24478280544281, 1.4599088430404663, 1.6750348806381226, 1.8901609182357788, 2.1052868366241455, 2.3204128742218018, 2.535538911819458, 2.7506649494171143, 2.9657909870147705, 3.1809170246124268, 3.396043062210083, 3.6111690998077393, 3.8262951374053955, 4.041420936584473, 4.256546974182129, 4.471673011779785, 4.686799049377441, 4.901925086975098, 5.117051124572754, 5.33217716217041, 5.547303199768066, 5.762429237365723, 5.977555274963379, 6.192681312561035, 6.407807350158691, 6.622933387756348]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 5.0, 11.0, 14.0, 15.0, 18.0, 10.0, 25.0, 16.0, 31.0, 35.0, 23.0, 31.0, 42.0, 39.0, 26.0, 37.0, 39.0, 36.0, 40.0, 50.0, 40.0, 34.0, 52.0, 30.0, 29.0, 29.0, 25.0, 31.0, 33.0, 28.0, 12.0, 19.0, 12.0, 12.0, 16.0, 9.0, 13.0, 3.0, 6.0, 3.0, 7.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.348331928253174, -6.147264003753662, -5.946195602416992, -5.7451276779174805, -5.544059753417969, -5.342991828918457, -5.141923427581787, -4.940855503082275, -4.7397871017456055, -4.538719177246094, -4.337650775909424, -4.136582851409912, -3.9355149269104004, -3.7344467639923096, -3.5333786010742188, -3.332310676574707, -3.1312427520751953, -2.9301745891571045, -2.7291066646575928, -2.528038501739502, -2.3269705772399902, -2.1259024143218994, -1.9248342514038086, -1.7237662076950073, -1.522698163986206, -1.3216301202774048, -1.1205620765686035, -0.9194939136505127, -0.7184258699417114, -0.5173578262329102, -0.31628966331481934, -0.11522161960601807, 0.085845947265625, 0.28691402077674866, 0.4879820942878723, 0.6890501976013184, 0.8901182413101196, 1.091186285018921, 1.2922544479370117, 1.493322491645813, 1.6943905353546143, 1.8954585790634155, 2.096526622772217, 2.2975947856903076, 2.4986629486083984, 2.69973087310791, 2.900799036026001, 3.101867198944092, 3.3029351234436035, 3.5040032863616943, 3.705071210861206, 3.906139373779297, 4.107207298278809, 4.30827522277832, 4.50934362411499, 4.710411548614502, 4.911479949951172, 5.112547874450684, 5.3136162757873535, 5.514684200286865, 5.715752124786377, 5.916820526123047, 6.117888450622559, 6.31895637512207, 6.520024299621582]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 9.0, 6.0, 12.0, 13.0, 37.0, 49.0, 67.0, 87.0, 138.0, 262.0, 393.0, 605.0, 894.0, 1417.0, 2026.0, 3238.0, 4783.0, 7485.0, 11340.0, 16817.0, 24529.0, 35165.0, 48231.0, 63419.0, 79429.0, 94600.0, 103706.0, 106049.0, 99659.0, 86834.0, 70829.0, 55728.0, 40961.0, 29231.0, 20345.0, 13672.0, 9169.0, 6042.0, 3943.0, 2579.0, 1651.0, 1153.0, 672.0, 469.0, 272.0, 199.0, 124.0, 88.0, 53.0, 41.0, 21.0, 13.0, 8.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-4.49609375, -4.35662841796875, -4.2171630859375, -4.07769775390625, -3.938232421875, -3.79876708984375, -3.6593017578125, -3.51983642578125, -3.38037109375, -3.24090576171875, -3.1014404296875, -2.96197509765625, -2.822509765625, -2.68304443359375, -2.5435791015625, -2.40411376953125, -2.2646484375, -2.12518310546875, -1.9857177734375, -1.84625244140625, -1.706787109375, -1.56732177734375, -1.4278564453125, -1.28839111328125, -1.14892578125, -1.00946044921875, -0.8699951171875, -0.73052978515625, -0.591064453125, -0.45159912109375, -0.3121337890625, -0.17266845703125, -0.033203125, 0.10626220703125, 0.2457275390625, 0.38519287109375, 0.524658203125, 0.66412353515625, 0.8035888671875, 0.94305419921875, 1.08251953125, 1.22198486328125, 1.3614501953125, 1.50091552734375, 1.640380859375, 1.77984619140625, 1.9193115234375, 2.05877685546875, 2.1982421875, 2.33770751953125, 2.4771728515625, 2.61663818359375, 2.756103515625, 2.89556884765625, 3.0350341796875, 3.17449951171875, 3.31396484375, 3.45343017578125, 3.5928955078125, 3.73236083984375, 3.871826171875, 4.01129150390625, 4.1507568359375, 4.29022216796875, 4.4296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 5.0, 6.0, 8.0, 3.0, 11.0, 10.0, 17.0, 18.0, 10.0, 20.0, 14.0, 34.0, 23.0, 44.0, 33.0, 33.0, 27.0, 37.0, 36.0, 42.0, 46.0, 44.0, 46.0, 41.0, 37.0, 37.0, 33.0, 31.0, 27.0, 30.0, 28.0, 23.0, 28.0, 19.0, 21.0, 15.0, 11.0, 7.0, 11.0, 6.0, 10.0, 6.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.5, -6.3009033203125, -6.101806640625, -5.9027099609375, -5.70361328125, -5.5045166015625, -5.305419921875, -5.1063232421875, -4.9072265625, -4.7081298828125, -4.509033203125, -4.3099365234375, -4.11083984375, -3.9117431640625, -3.712646484375, -3.5135498046875, -3.314453125, -3.1153564453125, -2.916259765625, -2.7171630859375, -2.51806640625, -2.3189697265625, -2.119873046875, -1.9207763671875, -1.7216796875, -1.5225830078125, -1.323486328125, -1.1243896484375, -0.92529296875, -0.7261962890625, -0.527099609375, -0.3280029296875, -0.12890625, 0.0701904296875, 0.269287109375, 0.4683837890625, 0.66748046875, 0.8665771484375, 1.065673828125, 1.2647705078125, 1.4638671875, 1.6629638671875, 1.862060546875, 2.0611572265625, 2.26025390625, 2.4593505859375, 2.658447265625, 2.8575439453125, 3.056640625, 3.2557373046875, 3.454833984375, 3.6539306640625, 3.85302734375, 4.0521240234375, 4.251220703125, 4.4503173828125, 4.6494140625, 4.8485107421875, 5.047607421875, 5.2467041015625, 5.44580078125, 5.6448974609375, 5.843994140625, 6.0430908203125, 6.2421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 6.0, 4.0, 8.0, 11.0, 23.0, 23.0, 37.0, 62.0, 86.0, 120.0, 214.0, 336.0, 487.0, 783.0, 1175.0, 1883.0, 2991.0, 4378.0, 6864.0, 10642.0, 16115.0, 23915.0, 35650.0, 50882.0, 69415.0, 90293.0, 108043.0, 118082.0, 116216.0, 103420.0, 84140.0, 63756.0, 45509.0, 31686.0, 21156.0, 14108.0, 9130.0, 5952.0, 3892.0, 2473.0, 1624.0, 1046.0, 673.0, 430.0, 289.0, 184.0, 123.0, 79.0, 57.0, 45.0, 14.0, 12.0, 11.0, 11.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.46484375, -5.28765869140625, -5.1104736328125, -4.93328857421875, -4.756103515625, -4.57891845703125, -4.4017333984375, -4.22454833984375, -4.04736328125, -3.87017822265625, -3.6929931640625, -3.51580810546875, -3.338623046875, -3.16143798828125, -2.9842529296875, -2.80706787109375, -2.6298828125, -2.45269775390625, -2.2755126953125, -2.09832763671875, -1.921142578125, -1.74395751953125, -1.5667724609375, -1.38958740234375, -1.21240234375, -1.03521728515625, -0.8580322265625, -0.68084716796875, -0.503662109375, -0.32647705078125, -0.1492919921875, 0.02789306640625, 0.205078125, 0.38226318359375, 0.5594482421875, 0.73663330078125, 0.913818359375, 1.09100341796875, 1.2681884765625, 1.44537353515625, 1.62255859375, 1.79974365234375, 1.9769287109375, 2.15411376953125, 2.331298828125, 2.50848388671875, 2.6856689453125, 2.86285400390625, 3.0400390625, 3.21722412109375, 3.3944091796875, 3.57159423828125, 3.748779296875, 3.92596435546875, 4.1031494140625, 4.28033447265625, 4.45751953125, 4.63470458984375, 4.8118896484375, 4.98907470703125, 5.166259765625, 5.34344482421875, 5.5206298828125, 5.69781494140625, 5.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 6.0, 8.0, 8.0, 7.0, 8.0, 18.0, 16.0, 19.0, 26.0, 26.0, 34.0, 26.0, 32.0, 33.0, 29.0, 44.0, 41.0, 46.0, 51.0, 53.0, 52.0, 49.0, 37.0, 36.0, 38.0, 40.0, 41.0, 24.0, 22.0, 32.0, 21.0, 15.0, 6.0, 15.0, 14.0, 9.0, 8.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.6873779296875, -4.523193359375, -4.3590087890625, -4.19482421875, -4.0306396484375, -3.866455078125, -3.7022705078125, -3.5380859375, -3.3739013671875, -3.209716796875, -3.0455322265625, -2.88134765625, -2.7171630859375, -2.552978515625, -2.3887939453125, -2.224609375, -2.0604248046875, -1.896240234375, -1.7320556640625, -1.56787109375, -1.4036865234375, -1.239501953125, -1.0753173828125, -0.9111328125, -0.7469482421875, -0.582763671875, -0.4185791015625, -0.25439453125, -0.0902099609375, 0.073974609375, 0.2381591796875, 0.40234375, 0.5665283203125, 0.730712890625, 0.8948974609375, 1.05908203125, 1.2232666015625, 1.387451171875, 1.5516357421875, 1.7158203125, 1.8800048828125, 2.044189453125, 2.2083740234375, 2.37255859375, 2.5367431640625, 2.700927734375, 2.8651123046875, 3.029296875, 3.1934814453125, 3.357666015625, 3.5218505859375, 3.68603515625, 3.8502197265625, 4.014404296875, 4.1785888671875, 4.3427734375, 4.5069580078125, 4.671142578125, 4.8353271484375, 4.99951171875, 5.1636962890625, 5.327880859375, 5.4920654296875, 5.65625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 7.0, 8.0, 17.0, 27.0, 43.0, 55.0, 92.0, 110.0, 142.0, 225.0, 312.0, 499.0, 751.0, 1096.0, 1772.0, 2693.0, 4144.0, 6491.0, 10443.0, 17102.0, 28071.0, 46579.0, 75782.0, 117699.0, 159388.0, 173244.0, 143742.0, 98488.0, 61545.0, 37574.0, 22637.0, 13953.0, 8467.0, 5312.0, 3462.0, 2214.0, 1465.0, 964.0, 589.0, 407.0, 299.0, 192.0, 124.0, 106.0, 73.0, 41.0, 37.0, 18.0, 10.0, 15.0, 11.0, 3.0, 6.0, 7.0, 0.0, 0.0, 2.0], "bins": [-5.2890625, -5.125244140625, -4.96142578125, -4.797607421875, -4.6337890625, -4.469970703125, -4.30615234375, -4.142333984375, -3.978515625, -3.814697265625, -3.65087890625, -3.487060546875, -3.3232421875, -3.159423828125, -2.99560546875, -2.831787109375, -2.66796875, -2.504150390625, -2.34033203125, -2.176513671875, -2.0126953125, -1.848876953125, -1.68505859375, -1.521240234375, -1.357421875, -1.193603515625, -1.02978515625, -0.865966796875, -0.7021484375, -0.538330078125, -0.37451171875, -0.210693359375, -0.046875, 0.116943359375, 0.28076171875, 0.444580078125, 0.6083984375, 0.772216796875, 0.93603515625, 1.099853515625, 1.263671875, 1.427490234375, 1.59130859375, 1.755126953125, 1.9189453125, 2.082763671875, 2.24658203125, 2.410400390625, 2.57421875, 2.738037109375, 2.90185546875, 3.065673828125, 3.2294921875, 3.393310546875, 3.55712890625, 3.720947265625, 3.884765625, 4.048583984375, 4.21240234375, 4.376220703125, 4.5400390625, 4.703857421875, 4.86767578125, 5.031494140625, 5.1953125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 2.0, 6.0, 6.0, 8.0, 15.0, 12.0, 20.0, 26.0, 40.0, 43.0, 55.0, 53.0, 64.0, 100.0, 86.0, 81.0, 67.0, 69.0, 49.0, 47.0, 46.0, 29.0, 19.0, 15.0, 5.0, 12.0, 6.0, 6.0, 2.0, 7.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0010118484497070312, -0.0009869709610939026, -0.0009620934724807739, -0.0009372159838676453, -0.0009123384952545166, -0.0008874610066413879, -0.0008625835180282593, -0.0008377060294151306, -0.000812828540802002, -0.0007879510521888733, -0.0007630735635757446, -0.000738196074962616, -0.0007133185863494873, -0.0006884410977363586, -0.00066356360912323, -0.0006386861205101013, -0.0006138086318969727, -0.000588931143283844, -0.0005640536546707153, -0.0005391761660575867, -0.000514298677444458, -0.0004894211888313293, -0.0004645437002182007, -0.000439666211605072, -0.00041478872299194336, -0.0003899112343788147, -0.00036503374576568604, -0.0003401562571525574, -0.0003152787685394287, -0.00029040127992630005, -0.0002655237913131714, -0.00024064630270004272, -0.00021576881408691406, -0.0001908913254737854, -0.00016601383686065674, -0.00014113634824752808, -0.00011625885963439941, -9.138137102127075e-05, -6.650388240814209e-05, -4.162639379501343e-05, -1.6748905181884766e-05, 8.128583431243896e-06, 3.300607204437256e-05, 5.788356065750122e-05, 8.276104927062988e-05, 0.00010763853788375854, 0.0001325160264968872, 0.00015739351511001587, 0.00018227100372314453, 0.0002071484923362732, 0.00023202598094940186, 0.0002569034695625305, 0.0002817809581756592, 0.00030665844678878784, 0.0003315359354019165, 0.00035641342401504517, 0.00038129091262817383, 0.0004061684012413025, 0.00043104588985443115, 0.0004559233784675598, 0.0004808008670806885, 0.0005056783556938171, 0.0005305558443069458, 0.0005554333329200745, 0.0005803108215332031]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 5.0, 12.0, 6.0, 18.0, 23.0, 33.0, 52.0, 65.0, 112.0, 152.0, 273.0, 426.0, 787.0, 1289.0, 2212.0, 3685.0, 6709.0, 12000.0, 22421.0, 41775.0, 76074.0, 128203.0, 180095.0, 193996.0, 154913.0, 99706.0, 56265.0, 30061.0, 16291.0, 8933.0, 4955.0, 2812.0, 1640.0, 969.0, 577.0, 369.0, 223.0, 155.0, 96.0, 58.0, 38.0, 23.0, 20.0, 9.0, 5.0, 3.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.81640625, -5.64654541015625, -5.4766845703125, -5.30682373046875, -5.136962890625, -4.96710205078125, -4.7972412109375, -4.62738037109375, -4.45751953125, -4.28765869140625, -4.1177978515625, -3.94793701171875, -3.778076171875, -3.60821533203125, -3.4383544921875, -3.26849365234375, -3.0986328125, -2.92877197265625, -2.7589111328125, -2.58905029296875, -2.419189453125, -2.24932861328125, -2.0794677734375, -1.90960693359375, -1.73974609375, -1.56988525390625, -1.4000244140625, -1.23016357421875, -1.060302734375, -0.89044189453125, -0.7205810546875, -0.55072021484375, -0.380859375, -0.21099853515625, -0.0411376953125, 0.12872314453125, 0.298583984375, 0.46844482421875, 0.6383056640625, 0.80816650390625, 0.97802734375, 1.14788818359375, 1.3177490234375, 1.48760986328125, 1.657470703125, 1.82733154296875, 1.9971923828125, 2.16705322265625, 2.3369140625, 2.50677490234375, 2.6766357421875, 2.84649658203125, 3.016357421875, 3.18621826171875, 3.3560791015625, 3.52593994140625, 3.69580078125, 3.86566162109375, 4.0355224609375, 4.20538330078125, 4.375244140625, 4.54510498046875, 4.7149658203125, 4.88482666015625, 5.0546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 9.0, 6.0, 9.0, 11.0, 19.0, 12.0, 19.0, 21.0, 25.0, 21.0, 41.0, 29.0, 41.0, 38.0, 46.0, 45.0, 58.0, 54.0, 41.0, 46.0, 59.0, 56.0, 33.0, 43.0, 32.0, 40.0, 31.0, 17.0, 20.0, 12.0, 21.0, 9.0, 5.0, 11.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7890625, -1.729461669921875, -1.66986083984375, -1.610260009765625, -1.5506591796875, -1.491058349609375, -1.43145751953125, -1.371856689453125, -1.312255859375, -1.252655029296875, -1.19305419921875, -1.133453369140625, -1.0738525390625, -1.014251708984375, -0.95465087890625, -0.895050048828125, -0.83544921875, -0.775848388671875, -0.71624755859375, -0.656646728515625, -0.5970458984375, -0.537445068359375, -0.47784423828125, -0.418243408203125, -0.358642578125, -0.299041748046875, -0.23944091796875, -0.179840087890625, -0.1202392578125, -0.060638427734375, -0.00103759765625, 0.058563232421875, 0.1181640625, 0.177764892578125, 0.23736572265625, 0.296966552734375, 0.3565673828125, 0.416168212890625, 0.47576904296875, 0.535369873046875, 0.594970703125, 0.654571533203125, 0.71417236328125, 0.773773193359375, 0.8333740234375, 0.892974853515625, 0.95257568359375, 1.012176513671875, 1.07177734375, 1.131378173828125, 1.19097900390625, 1.250579833984375, 1.3101806640625, 1.369781494140625, 1.42938232421875, 1.488983154296875, 1.548583984375, 1.608184814453125, 1.66778564453125, 1.727386474609375, 1.7869873046875, 1.846588134765625, 1.90618896484375, 1.965789794921875, 2.025390625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 11.0, 11.0, 10.0, 14.0, 14.0, 23.0, 22.0, 26.0, 34.0, 42.0, 39.0, 43.0, 45.0, 52.0, 56.0, 55.0, 46.0, 60.0, 47.0, 50.0, 39.0, 39.0, 43.0, 30.0, 23.0, 22.0, 24.0, 15.0, 14.0, 9.0, 8.0, 8.0, 4.0, 5.0, 5.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.165167331695557, -6.930783271789551, -6.696399211883545, -6.462015151977539, -6.227631092071533, -5.993247032165527, -5.75886344909668, -5.524479389190674, -5.290095329284668, -5.055711269378662, -4.821327209472656, -4.58694314956665, -4.3525590896606445, -4.118175506591797, -3.883791208267212, -3.649407386779785, -3.4150230884552, -3.1806390285491943, -2.9462549686431885, -2.7118711471557617, -2.477487087249756, -2.24310302734375, -2.008718967437744, -1.7743350267410278, -1.539950966835022, -1.3055669069290161, -1.0711829662322998, -0.836798906326294, -0.6024149060249329, -0.3680309057235718, -0.13364684581756592, 0.10073709487915039, 0.33512115478515625, 0.5695051550865173, 0.8038891553878784, 1.0382732152938843, 1.2726571559906006, 1.5070412158966064, 1.7414252758026123, 1.9758092164993286, 2.210193157196045, 2.444577217102051, 2.6789612770080566, 2.9133453369140625, 3.1477291584014893, 3.382113218307495, 3.616497278213501, 3.8508810997009277, 4.085265159606934, 4.3196492195129395, 4.554033279418945, 4.788417339324951, 5.022801399230957, 5.257184982299805, 5.491569519042969, 5.725953102111816, 5.9603376388549805, 6.194721698760986, 6.429105758666992, 6.663489818572998, 6.897873878479004, 7.132257461547852, 7.366641998291016, 7.601025581359863, 7.835409641265869]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 11.0, 7.0, 9.0, 16.0, 24.0, 18.0, 24.0, 25.0, 22.0, 30.0, 35.0, 43.0, 53.0, 39.0, 35.0, 37.0, 48.0, 43.0, 37.0, 43.0, 43.0, 30.0, 44.0, 39.0, 38.0, 31.0, 26.0, 24.0, 20.0, 12.0, 15.0, 24.0, 12.0, 5.0, 7.0, 12.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-7.4405412673950195, -7.216803550720215, -6.99306583404541, -6.769328594207764, -6.545590877532959, -6.321853160858154, -6.098115921020508, -5.874378204345703, -5.650640487670898, -5.426902770996094, -5.203165054321289, -4.979427814483643, -4.755690097808838, -4.531952381134033, -4.308215141296387, -4.084477424621582, -3.8607397079467773, -3.6370019912719727, -3.413264513015747, -3.1895270347595215, -2.965789318084717, -2.742051601409912, -2.5183141231536865, -2.294576644897461, -2.0708389282226562, -1.8471013307571411, -1.623363733291626, -1.3996261358261108, -1.1758885383605957, -0.9521509408950806, -0.7284133434295654, -0.5046757459640503, -0.28093814849853516, -0.05720055103302002, 0.16653704643249512, 0.39027464389801025, 0.6140122413635254, 0.8377498388290405, 1.0614874362945557, 1.2852250337600708, 1.508962631225586, 1.732700228691101, 1.9564378261566162, 2.180175304412842, 2.4039130210876465, 2.627650737762451, 2.8513882160186768, 3.0751256942749023, 3.298863410949707, 3.5226011276245117, 3.7463386058807373, 3.970076084136963, 4.193813800811768, 4.417551517486572, 4.641288757324219, 4.865026473999023, 5.088764190673828, 5.312501907348633, 5.5362396240234375, 5.759976863861084, 5.983714580535889, 6.207452297210693, 6.43118953704834, 6.6549272537231445, 6.878664970397949]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 10.0, 22.0, 28.0, 41.0, 64.0, 113.0, 136.0, 223.0, 334.0, 574.0, 752.0, 1230.0, 1981.0, 3198.0, 5240.0, 8476.0, 14183.0, 24206.0, 41031.0, 69443.0, 116249.0, 192348.0, 301194.0, 435832.0, 555518.0, 608164.0, 560952.0, 443606.0, 309359.0, 200103.0, 121359.0, 72251.0, 42888.0, 25362.0, 14607.0, 8817.0, 5379.0, 3230.0, 2047.0, 1304.0, 856.0, 539.0, 358.0, 225.0, 140.0, 104.0, 68.0, 39.0, 33.0, 27.0, 10.0, 10.0, 10.0, 6.0, 3.0, 2.0, 3.0], "bins": [-4.9921875, -4.8387451171875, -4.685302734375, -4.5318603515625, -4.37841796875, -4.2249755859375, -4.071533203125, -3.9180908203125, -3.7646484375, -3.6112060546875, -3.457763671875, -3.3043212890625, -3.15087890625, -2.9974365234375, -2.843994140625, -2.6905517578125, -2.537109375, -2.3836669921875, -2.230224609375, -2.0767822265625, -1.92333984375, -1.7698974609375, -1.616455078125, -1.4630126953125, -1.3095703125, -1.1561279296875, -1.002685546875, -0.8492431640625, -0.69580078125, -0.5423583984375, -0.388916015625, -0.2354736328125, -0.08203125, 0.0714111328125, 0.224853515625, 0.3782958984375, 0.53173828125, 0.6851806640625, 0.838623046875, 0.9920654296875, 1.1455078125, 1.2989501953125, 1.452392578125, 1.6058349609375, 1.75927734375, 1.9127197265625, 2.066162109375, 2.2196044921875, 2.373046875, 2.5264892578125, 2.679931640625, 2.8333740234375, 2.98681640625, 3.1402587890625, 3.293701171875, 3.4471435546875, 3.6005859375, 3.7540283203125, 3.907470703125, 4.0609130859375, 4.21435546875, 4.3677978515625, 4.521240234375, 4.6746826171875, 4.828125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 5.0, 3.0, 7.0, 12.0, 14.0, 18.0, 19.0, 18.0, 16.0, 27.0, 20.0, 31.0, 31.0, 33.0, 57.0, 40.0, 42.0, 43.0, 42.0, 33.0, 31.0, 41.0, 46.0, 44.0, 35.0, 36.0, 26.0, 33.0, 27.0, 30.0, 20.0, 23.0, 17.0, 14.0, 17.0, 13.0, 9.0, 4.0, 3.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.84765625, -5.67333984375, -5.4990234375, -5.32470703125, -5.150390625, -4.97607421875, -4.8017578125, -4.62744140625, -4.453125, -4.27880859375, -4.1044921875, -3.93017578125, -3.755859375, -3.58154296875, -3.4072265625, -3.23291015625, -3.05859375, -2.88427734375, -2.7099609375, -2.53564453125, -2.361328125, -2.18701171875, -2.0126953125, -1.83837890625, -1.6640625, -1.48974609375, -1.3154296875, -1.14111328125, -0.966796875, -0.79248046875, -0.6181640625, -0.44384765625, -0.26953125, -0.09521484375, 0.0791015625, 0.25341796875, 0.427734375, 0.60205078125, 0.7763671875, 0.95068359375, 1.125, 1.29931640625, 1.4736328125, 1.64794921875, 1.822265625, 1.99658203125, 2.1708984375, 2.34521484375, 2.51953125, 2.69384765625, 2.8681640625, 3.04248046875, 3.216796875, 3.39111328125, 3.5654296875, 3.73974609375, 3.9140625, 4.08837890625, 4.2626953125, 4.43701171875, 4.611328125, 4.78564453125, 4.9599609375, 5.13427734375, 5.30859375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 12.0, 10.0, 16.0, 14.0, 39.0, 62.0, 99.0, 144.0, 267.0, 414.0, 803.0, 1434.0, 2478.0, 4548.0, 8752.0, 16713.0, 32105.0, 62040.0, 118840.0, 219323.0, 379313.0, 576576.0, 726330.0, 712502.0, 549800.0, 352036.0, 201769.0, 108915.0, 56807.0, 29427.0, 15102.0, 7973.0, 4292.0, 2274.0, 1248.0, 764.0, 412.0, 238.0, 160.0, 92.0, 50.0, 38.0, 22.0, 16.0, 9.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.60546875, -6.384765625, -6.1640625, -5.943359375, -5.72265625, -5.501953125, -5.28125, -5.060546875, -4.83984375, -4.619140625, -4.3984375, -4.177734375, -3.95703125, -3.736328125, -3.515625, -3.294921875, -3.07421875, -2.853515625, -2.6328125, -2.412109375, -2.19140625, -1.970703125, -1.75, -1.529296875, -1.30859375, -1.087890625, -0.8671875, -0.646484375, -0.42578125, -0.205078125, 0.015625, 0.236328125, 0.45703125, 0.677734375, 0.8984375, 1.119140625, 1.33984375, 1.560546875, 1.78125, 2.001953125, 2.22265625, 2.443359375, 2.6640625, 2.884765625, 3.10546875, 3.326171875, 3.546875, 3.767578125, 3.98828125, 4.208984375, 4.4296875, 4.650390625, 4.87109375, 5.091796875, 5.3125, 5.533203125, 5.75390625, 5.974609375, 6.1953125, 6.416015625, 6.63671875, 6.857421875, 7.078125, 7.298828125, 7.51953125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 9.0, 8.0, 9.0, 11.0, 19.0, 18.0, 23.0, 42.0, 44.0, 64.0, 57.0, 75.0, 73.0, 103.0, 117.0, 139.0, 142.0, 172.0, 178.0, 206.0, 204.0, 222.0, 211.0, 211.0, 191.0, 202.0, 179.0, 167.0, 146.0, 136.0, 123.0, 94.0, 84.0, 74.0, 68.0, 51.0, 36.0, 28.0, 29.0, 21.0, 19.0, 17.0, 14.0, 13.0, 5.0, 2.0, 6.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.326171875, -2.253662109375, -2.18115234375, -2.108642578125, -2.0361328125, -1.963623046875, -1.89111328125, -1.818603515625, -1.74609375, -1.673583984375, -1.60107421875, -1.528564453125, -1.4560546875, -1.383544921875, -1.31103515625, -1.238525390625, -1.166015625, -1.093505859375, -1.02099609375, -0.948486328125, -0.8759765625, -0.803466796875, -0.73095703125, -0.658447265625, -0.5859375, -0.513427734375, -0.44091796875, -0.368408203125, -0.2958984375, -0.223388671875, -0.15087890625, -0.078369140625, -0.005859375, 0.066650390625, 0.13916015625, 0.211669921875, 0.2841796875, 0.356689453125, 0.42919921875, 0.501708984375, 0.57421875, 0.646728515625, 0.71923828125, 0.791748046875, 0.8642578125, 0.936767578125, 1.00927734375, 1.081787109375, 1.154296875, 1.226806640625, 1.29931640625, 1.371826171875, 1.4443359375, 1.516845703125, 1.58935546875, 1.661865234375, 1.734375, 1.806884765625, 1.87939453125, 1.951904296875, 2.0244140625, 2.096923828125, 2.16943359375, 2.241943359375, 2.314453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 17.0, 5.0, 17.0, 15.0, 27.0, 25.0, 32.0, 41.0, 43.0, 49.0, 55.0, 52.0, 54.0, 59.0, 58.0, 45.0, 56.0, 58.0, 42.0, 37.0, 33.0, 27.0, 33.0, 15.0, 20.0, 13.0, 16.0, 14.0, 6.0, 1.0, 9.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.797628402709961, -7.554989337921143, -7.312350273132324, -7.069711685180664, -6.827072620391846, -6.584433555603027, -6.341794490814209, -6.099155426025391, -5.8565168380737305, -5.613877773284912, -5.371238708496094, -5.128600120544434, -4.885961055755615, -4.643321990966797, -4.4006829261779785, -4.15804386138916, -3.915404796600342, -3.6727657318115234, -3.430126905441284, -3.187487840652466, -2.9448490142822266, -2.702209949493408, -2.45957088470459, -2.2169318199157715, -1.9742929935455322, -1.7316540479660034, -1.4890151023864746, -1.2463760375976562, -1.0037370920181274, -0.7610981464385986, -0.5184590816497803, -0.27582013607025146, -0.03318166732788086, 0.20945730805397034, 0.45209628343582153, 0.6947352886199951, 0.9373742341995239, 1.1800131797790527, 1.422652244567871, 1.6652911901474, 1.9079301357269287, 2.150569200515747, 2.3932080268859863, 2.6358470916748047, 2.878486156463623, 3.1211249828338623, 3.3637640476226807, 3.60640287399292, 3.8490419387817383, 4.091681003570557, 4.334320068359375, 4.576958656311035, 4.8195977210998535, 5.062236785888672, 5.30487585067749, 5.547514915466309, 5.790153503417969, 6.032792568206787, 6.2754316329956055, 6.518070220947266, 6.760709285736084, 7.003348350524902, 7.245987415313721, 7.488626480102539, 7.731265544891357]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 8.0, 7.0, 2.0, 8.0, 7.0, 10.0, 12.0, 14.0, 16.0, 22.0, 28.0, 22.0, 22.0, 31.0, 39.0, 36.0, 34.0, 45.0, 48.0, 40.0, 38.0, 56.0, 37.0, 41.0, 34.0, 41.0, 39.0, 26.0, 45.0, 21.0, 24.0, 17.0, 18.0, 26.0, 15.0, 12.0, 13.0, 15.0, 11.0, 5.0, 5.0, 2.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.80612850189209, -6.601604461669922, -6.397080421447754, -6.192555904388428, -5.98803186416626, -5.783507823944092, -5.578983783721924, -5.374459266662598, -5.16993522644043, -4.965411186218262, -4.760887145996094, -4.556362628936768, -4.3518385887146, -4.147314548492432, -3.9427905082702637, -3.7382662296295166, -3.5337421894073486, -3.3292181491851807, -3.1246938705444336, -2.9201698303222656, -2.7156455516815186, -2.5111215114593506, -2.3065972328186035, -2.1020731925964355, -1.897549033164978, -1.6930248737335205, -1.488500714302063, -1.2839765548706055, -1.0794525146484375, -0.87492835521698, -0.6704041957855225, -0.46588003635406494, -0.2613558769226074, -0.056831732392311096, 0.14769241213798523, 0.35221654176712036, 0.5567407011985779, 0.7612648010253906, 0.9657889604568481, 1.1703131198883057, 1.3748372793197632, 1.5793614387512207, 1.7838855981826782, 1.9884097576141357, 2.1929337978363037, 2.397458076477051, 2.6019821166992188, 2.8065061569213867, 3.011030435562134, 3.2155544757843018, 3.420078754425049, 3.624602794647217, 3.829127073287964, 4.033651351928711, 4.238175392150879, 4.442699432373047, 4.647223472595215, 4.851747512817383, 5.056271553039551, 5.260796070098877, 5.465320110321045, 5.669844150543213, 5.874368190765381, 6.078892707824707, 6.283416748046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 7.0, 9.0, 21.0, 18.0, 48.0, 74.0, 96.0, 140.0, 248.0, 380.0, 583.0, 874.0, 1375.0, 2256.0, 3588.0, 5815.0, 9237.0, 14823.0, 24950.0, 45250.0, 91596.0, 204086.0, 293700.0, 173366.0, 77907.0, 39609.0, 22505.0, 13508.0, 8389.0, 5240.0, 3252.0, 2106.0, 1318.0, 750.0, 499.0, 311.0, 203.0, 134.0, 77.0, 80.0, 49.0, 32.0, 23.0, 11.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5703125, -13.1380615234375, -12.705810546875, -12.2735595703125, -11.84130859375, -11.4090576171875, -10.976806640625, -10.5445556640625, -10.1123046875, -9.6800537109375, -9.247802734375, -8.8155517578125, -8.38330078125, -7.9510498046875, -7.518798828125, -7.0865478515625, -6.654296875, -6.2220458984375, -5.789794921875, -5.3575439453125, -4.92529296875, -4.4930419921875, -4.060791015625, -3.6285400390625, -3.1962890625, -2.7640380859375, -2.331787109375, -1.8995361328125, -1.46728515625, -1.0350341796875, -0.602783203125, -0.1705322265625, 0.26171875, 0.6939697265625, 1.126220703125, 1.5584716796875, 1.99072265625, 2.4229736328125, 2.855224609375, 3.2874755859375, 3.7197265625, 4.1519775390625, 4.584228515625, 5.0164794921875, 5.44873046875, 5.8809814453125, 6.313232421875, 6.7454833984375, 7.177734375, 7.6099853515625, 8.042236328125, 8.4744873046875, 8.90673828125, 9.3389892578125, 9.771240234375, 10.2034912109375, 10.6357421875, 11.0679931640625, 11.500244140625, 11.9324951171875, 12.36474609375, 12.7969970703125, 13.229248046875, 13.6614990234375, 14.09375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 7.0, 3.0, 4.0, 7.0, 6.0, 7.0, 15.0, 7.0, 10.0, 19.0, 15.0, 25.0, 24.0, 22.0, 27.0, 38.0, 38.0, 43.0, 40.0, 49.0, 45.0, 33.0, 36.0, 38.0, 44.0, 46.0, 44.0, 32.0, 39.0, 29.0, 34.0, 19.0, 25.0, 26.0, 20.0, 13.0, 17.0, 9.0, 10.0, 9.0, 7.0, 7.0, 5.0, 3.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.9375, -5.75469970703125, -5.5718994140625, -5.38909912109375, -5.206298828125, -5.02349853515625, -4.8406982421875, -4.65789794921875, -4.47509765625, -4.29229736328125, -4.1094970703125, -3.92669677734375, -3.743896484375, -3.56109619140625, -3.3782958984375, -3.19549560546875, -3.0126953125, -2.82989501953125, -2.6470947265625, -2.46429443359375, -2.281494140625, -2.09869384765625, -1.9158935546875, -1.73309326171875, -1.55029296875, -1.36749267578125, -1.1846923828125, -1.00189208984375, -0.819091796875, -0.63629150390625, -0.4534912109375, -0.27069091796875, -0.087890625, 0.09490966796875, 0.2777099609375, 0.46051025390625, 0.643310546875, 0.82611083984375, 1.0089111328125, 1.19171142578125, 1.37451171875, 1.55731201171875, 1.7401123046875, 1.92291259765625, 2.105712890625, 2.28851318359375, 2.4713134765625, 2.65411376953125, 2.8369140625, 3.01971435546875, 3.2025146484375, 3.38531494140625, 3.568115234375, 3.75091552734375, 3.9337158203125, 4.11651611328125, 4.29931640625, 4.48211669921875, 4.6649169921875, 4.84771728515625, 5.030517578125, 5.21331787109375, 5.3961181640625, 5.57891845703125, 5.76171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 9.0, 8.0, 10.0, 18.0, 22.0, 18.0, 51.0, 67.0, 125.0, 212.0, 346.0, 551.0, 936.0, 1609.0, 2844.0, 5062.0, 9445.0, 18939.0, 40345.0, 101311.0, 337023.0, 343581.0, 103904.0, 41075.0, 19187.0, 9845.0, 5139.0, 2847.0, 1700.0, 929.0, 497.0, 335.0, 192.0, 155.0, 80.0, 55.0, 28.0, 26.0, 12.0, 11.0, 6.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.8125, -20.141357421875, -19.47021484375, -18.799072265625, -18.1279296875, -17.456787109375, -16.78564453125, -16.114501953125, -15.443359375, -14.772216796875, -14.10107421875, -13.429931640625, -12.7587890625, -12.087646484375, -11.41650390625, -10.745361328125, -10.07421875, -9.403076171875, -8.73193359375, -8.060791015625, -7.3896484375, -6.718505859375, -6.04736328125, -5.376220703125, -4.705078125, -4.033935546875, -3.36279296875, -2.691650390625, -2.0205078125, -1.349365234375, -0.67822265625, -0.007080078125, 0.6640625, 1.335205078125, 2.00634765625, 2.677490234375, 3.3486328125, 4.019775390625, 4.69091796875, 5.362060546875, 6.033203125, 6.704345703125, 7.37548828125, 8.046630859375, 8.7177734375, 9.388916015625, 10.06005859375, 10.731201171875, 11.40234375, 12.073486328125, 12.74462890625, 13.415771484375, 14.0869140625, 14.758056640625, 15.42919921875, 16.100341796875, 16.771484375, 17.442626953125, 18.11376953125, 18.784912109375, 19.4560546875, 20.127197265625, 20.79833984375, 21.469482421875, 22.140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 13.0, 4.0, 1.0, 11.0, 11.0, 13.0, 18.0, 18.0, 21.0, 25.0, 28.0, 37.0, 38.0, 42.0, 38.0, 52.0, 41.0, 49.0, 52.0, 44.0, 55.0, 51.0, 45.0, 52.0, 42.0, 41.0, 22.0, 22.0, 29.0, 18.0, 12.0, 13.0, 5.0, 12.0, 10.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.11328125, -4.9449462890625, -4.776611328125, -4.6082763671875, -4.43994140625, -4.2716064453125, -4.103271484375, -3.9349365234375, -3.7666015625, -3.5982666015625, -3.429931640625, -3.2615966796875, -3.09326171875, -2.9249267578125, -2.756591796875, -2.5882568359375, -2.419921875, -2.2515869140625, -2.083251953125, -1.9149169921875, -1.74658203125, -1.5782470703125, -1.409912109375, -1.2415771484375, -1.0732421875, -0.9049072265625, -0.736572265625, -0.5682373046875, -0.39990234375, -0.2315673828125, -0.063232421875, 0.1051025390625, 0.2734375, 0.4417724609375, 0.610107421875, 0.7784423828125, 0.94677734375, 1.1151123046875, 1.283447265625, 1.4517822265625, 1.6201171875, 1.7884521484375, 1.956787109375, 2.1251220703125, 2.29345703125, 2.4617919921875, 2.630126953125, 2.7984619140625, 2.966796875, 3.1351318359375, 3.303466796875, 3.4718017578125, 3.64013671875, 3.8084716796875, 3.976806640625, 4.1451416015625, 4.3134765625, 4.4818115234375, 4.650146484375, 4.8184814453125, 4.98681640625, 5.1551513671875, 5.323486328125, 5.4918212890625, 5.66015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 9.0, 4.0, 8.0, 12.0, 21.0, 25.0, 35.0, 35.0, 61.0, 93.0, 99.0, 149.0, 216.0, 299.0, 400.0, 638.0, 989.0, 1680.0, 3212.0, 7798.0, 29918.0, 559765.0, 402027.0, 26173.0, 7058.0, 3031.0, 1718.0, 1024.0, 597.0, 419.0, 308.0, 191.0, 151.0, 86.0, 68.0, 55.0, 47.0, 39.0, 17.0, 26.0, 11.0, 12.0, 7.0, 7.0, 5.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.4375, -34.32861328125, -33.2197265625, -32.11083984375, -31.001953125, -29.89306640625, -28.7841796875, -27.67529296875, -26.56640625, -25.45751953125, -24.3486328125, -23.23974609375, -22.130859375, -21.02197265625, -19.9130859375, -18.80419921875, -17.6953125, -16.58642578125, -15.4775390625, -14.36865234375, -13.259765625, -12.15087890625, -11.0419921875, -9.93310546875, -8.82421875, -7.71533203125, -6.6064453125, -5.49755859375, -4.388671875, -3.27978515625, -2.1708984375, -1.06201171875, 0.046875, 1.15576171875, 2.2646484375, 3.37353515625, 4.482421875, 5.59130859375, 6.7001953125, 7.80908203125, 8.91796875, 10.02685546875, 11.1357421875, 12.24462890625, 13.353515625, 14.46240234375, 15.5712890625, 16.68017578125, 17.7890625, 18.89794921875, 20.0068359375, 21.11572265625, 22.224609375, 23.33349609375, 24.4423828125, 25.55126953125, 26.66015625, 27.76904296875, 28.8779296875, 29.98681640625, 31.095703125, 32.20458984375, 33.3134765625, 34.42236328125, 35.53125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 6.0, 9.0, 13.0, 17.0, 30.0, 51.0, 234.0, 465.0, 94.0, 33.0, 24.0, 8.0, 10.0, 7.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020294189453125, -0.0019339323043823242, -0.0018384456634521484, -0.0017429590225219727, -0.0016474723815917969, -0.001551985740661621, -0.0014564990997314453, -0.0013610124588012695, -0.0012655258178710938, -0.001170039176940918, -0.0010745525360107422, -0.0009790658950805664, -0.0008835792541503906, -0.0007880926132202148, -0.0006926059722900391, -0.0005971193313598633, -0.0005016326904296875, -0.0004061460494995117, -0.00031065940856933594, -0.00021517276763916016, -0.00011968612670898438, -2.4199485778808594e-05, 7.128715515136719e-05, 0.00016677379608154297, 0.00026226043701171875, 0.00035774707794189453, 0.0004532337188720703, 0.0005487203598022461, 0.0006442070007324219, 0.0007396936416625977, 0.0008351802825927734, 0.0009306669235229492, 0.001026153564453125, 0.0011216402053833008, 0.0012171268463134766, 0.0013126134872436523, 0.0014081001281738281, 0.001503586769104004, 0.0015990734100341797, 0.0016945600509643555, 0.0017900466918945312, 0.001885533332824707, 0.001981019973754883, 0.0020765066146850586, 0.0021719932556152344, 0.00226747989654541, 0.002362966537475586, 0.0024584531784057617, 0.0025539398193359375, 0.0026494264602661133, 0.002744913101196289, 0.002840399742126465, 0.0029358863830566406, 0.0030313730239868164, 0.003126859664916992, 0.003222346305847168, 0.0033178329467773438, 0.0034133195877075195, 0.0035088062286376953, 0.003604292869567871, 0.003699779510498047, 0.0037952661514282227, 0.0038907527923583984, 0.003986239433288574, 0.00408172607421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 4.0, 7.0, 21.0, 22.0, 26.0, 31.0, 46.0, 61.0, 86.0, 122.0, 163.0, 226.0, 293.0, 502.0, 701.0, 1246.0, 2412.0, 5380.0, 11996.0, 32193.0, 126737.0, 504080.0, 272063.0, 56209.0, 18365.0, 7640.0, 3415.0, 1696.0, 945.0, 581.0, 386.0, 237.0, 199.0, 133.0, 111.0, 61.0, 48.0, 32.0, 32.0, 14.0, 8.0, 11.0, 5.0, 7.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9921875, -12.55517578125, -12.1181640625, -11.68115234375, -11.244140625, -10.80712890625, -10.3701171875, -9.93310546875, -9.49609375, -9.05908203125, -8.6220703125, -8.18505859375, -7.748046875, -7.31103515625, -6.8740234375, -6.43701171875, -6.0, -5.56298828125, -5.1259765625, -4.68896484375, -4.251953125, -3.81494140625, -3.3779296875, -2.94091796875, -2.50390625, -2.06689453125, -1.6298828125, -1.19287109375, -0.755859375, -0.31884765625, 0.1181640625, 0.55517578125, 0.9921875, 1.42919921875, 1.8662109375, 2.30322265625, 2.740234375, 3.17724609375, 3.6142578125, 4.05126953125, 4.48828125, 4.92529296875, 5.3623046875, 5.79931640625, 6.236328125, 6.67333984375, 7.1103515625, 7.54736328125, 7.984375, 8.42138671875, 8.8583984375, 9.29541015625, 9.732421875, 10.16943359375, 10.6064453125, 11.04345703125, 11.48046875, 11.91748046875, 12.3544921875, 12.79150390625, 13.228515625, 13.66552734375, 14.1025390625, 14.53955078125, 14.9765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 1.0, 9.0, 4.0, 8.0, 7.0, 21.0, 8.0, 22.0, 25.0, 33.0, 54.0, 72.0, 91.0, 114.0, 106.0, 108.0, 82.0, 55.0, 39.0, 30.0, 28.0, 16.0, 13.0, 7.0, 9.0, 6.0, 3.0, 7.0, 7.0, 3.0, 5.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-3.962890625, -3.86676025390625, -3.7706298828125, -3.67449951171875, -3.578369140625, -3.48223876953125, -3.3861083984375, -3.28997802734375, -3.19384765625, -3.09771728515625, -3.0015869140625, -2.90545654296875, -2.809326171875, -2.71319580078125, -2.6170654296875, -2.52093505859375, -2.4248046875, -2.32867431640625, -2.2325439453125, -2.13641357421875, -2.040283203125, -1.94415283203125, -1.8480224609375, -1.75189208984375, -1.65576171875, -1.55963134765625, -1.4635009765625, -1.36737060546875, -1.271240234375, -1.17510986328125, -1.0789794921875, -0.98284912109375, -0.88671875, -0.79058837890625, -0.6944580078125, -0.59832763671875, -0.502197265625, -0.40606689453125, -0.3099365234375, -0.21380615234375, -0.11767578125, -0.02154541015625, 0.0745849609375, 0.17071533203125, 0.266845703125, 0.36297607421875, 0.4591064453125, 0.55523681640625, 0.6513671875, 0.74749755859375, 0.8436279296875, 0.93975830078125, 1.035888671875, 1.13201904296875, 1.2281494140625, 1.32427978515625, 1.42041015625, 1.51654052734375, 1.6126708984375, 1.70880126953125, 1.804931640625, 1.90106201171875, 1.9971923828125, 2.09332275390625, 2.189453125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 4.0, 9.0, 3.0, 8.0, 12.0, 15.0, 21.0, 30.0, 36.0, 41.0, 51.0, 58.0, 53.0, 51.0, 60.0, 52.0, 68.0, 48.0, 50.0, 55.0, 50.0, 50.0, 41.0, 27.0, 21.0, 20.0, 12.0, 17.0, 8.0, 6.0, 4.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5384087562561035, -6.295438289642334, -6.0524678230285645, -5.809497833251953, -5.566527366638184, -5.323556900024414, -5.0805864334106445, -4.837615966796875, -4.5946455001831055, -4.351675033569336, -4.108704566955566, -3.865734338760376, -3.6227641105651855, -3.379793643951416, -3.1368231773376465, -2.893852710723877, -2.6508827209472656, -2.407912254333496, -2.1649420261383057, -1.9219715595245361, -1.6790012121200562, -1.4360308647155762, -1.1930603981018066, -0.9500900506973267, -0.7071197032928467, -0.4641493260860443, -0.22117894887924194, 0.021791458129882812, 0.2647618055343628, 0.5077321529388428, 0.7507026195526123, 0.9936729669570923, 1.236642837524414, 1.479613184928894, 1.722583532333374, 1.9655539989471436, 2.208524227142334, 2.4514946937561035, 2.694465160369873, 2.9374356269836426, 3.180405855178833, 3.4233763217926025, 3.666346549987793, 3.9093170166015625, 4.152287483215332, 4.395257949829102, 4.638228416442871, 4.881198406219482, 5.124168872833252, 5.3671393394470215, 5.610109806060791, 5.853079795837402, 6.096050262451172, 6.339020729064941, 6.581991195678711, 6.8249616622924805, 7.06793212890625, 7.3109025955200195, 7.553873062133789, 7.796843528747559, 8.039813995361328, 8.282783508300781, 8.525754928588867, 8.76872444152832, 9.01169490814209]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 11.0, 9.0, 16.0, 9.0, 9.0, 16.0, 21.0, 22.0, 26.0, 26.0, 42.0, 41.0, 29.0, 39.0, 52.0, 49.0, 49.0, 51.0, 39.0, 38.0, 37.0, 32.0, 58.0, 39.0, 26.0, 22.0, 37.0, 24.0, 27.0, 22.0, 14.0, 11.0, 14.0, 11.0, 7.0, 7.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.518105983734131, -6.313071250915527, -6.108036518096924, -5.90300178527832, -5.697967052459717, -5.492932319641113, -5.287897109985352, -5.082862854003906, -4.8778276443481445, -4.672792911529541, -4.4677581787109375, -4.262723445892334, -4.0576887130737305, -3.852653980255127, -3.6476190090179443, -3.442584276199341, -3.2375497817993164, -3.032515048980713, -2.8274803161621094, -2.622445583343506, -2.4174108505249023, -2.212376117706299, -2.007341146469116, -1.8023064136505127, -1.5972716808319092, -1.3922369480133057, -1.1872022151947021, -0.9821673631668091, -0.7771326303482056, -0.572097897529602, -0.367063045501709, -0.16202831268310547, 0.043005943298339844, 0.24804070591926575, 0.45307546854019165, 0.6581102609634399, 0.8631449937820435, 1.068179726600647, 1.27321457862854, 1.4782493114471436, 1.683284044265747, 1.8883187770843506, 2.093353509902954, 2.2983884811401367, 2.5034232139587402, 2.7084579467773438, 2.9134926795959473, 3.118527412414551, 3.3235621452331543, 3.528596878051758, 3.7336316108703613, 3.938666343688965, 4.143701076507568, 4.348735809326172, 4.553771018981934, 4.758805274963379, 4.963840484619141, 5.168875217437744, 5.373909950256348, 5.578944683074951, 5.783979415893555, 5.989014148712158, 6.194048881530762, 6.399084091186523, 6.604118347167969]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 11.0, 6.0, 10.0, 15.0, 41.0, 50.0, 80.0, 118.0, 162.0, 261.0, 386.0, 601.0, 925.0, 1449.0, 2205.0, 3339.0, 4810.0, 7483.0, 11048.0, 16199.0, 23415.0, 32746.0, 45289.0, 58916.0, 74237.0, 88489.0, 98765.0, 102099.0, 98545.0, 88687.0, 75302.0, 59742.0, 45770.0, 33566.0, 23865.0, 16407.0, 11279.0, 7541.0, 4991.0, 3327.0, 2205.0, 1418.0, 965.0, 646.0, 392.0, 283.0, 189.0, 105.0, 79.0, 46.0, 24.0, 13.0, 12.0, 5.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.814453125, -3.689483642578125, -3.56451416015625, -3.439544677734375, -3.3145751953125, -3.189605712890625, -3.06463623046875, -2.939666748046875, -2.814697265625, -2.689727783203125, -2.56475830078125, -2.439788818359375, -2.3148193359375, -2.189849853515625, -2.06488037109375, -1.939910888671875, -1.81494140625, -1.689971923828125, -1.56500244140625, -1.440032958984375, -1.3150634765625, -1.190093994140625, -1.06512451171875, -0.940155029296875, -0.815185546875, -0.690216064453125, -0.56524658203125, -0.440277099609375, -0.3153076171875, -0.190338134765625, -0.06536865234375, 0.059600830078125, 0.1845703125, 0.309539794921875, 0.43450927734375, 0.559478759765625, 0.6844482421875, 0.809417724609375, 0.93438720703125, 1.059356689453125, 1.184326171875, 1.309295654296875, 1.43426513671875, 1.559234619140625, 1.6842041015625, 1.809173583984375, 1.93414306640625, 2.059112548828125, 2.18408203125, 2.309051513671875, 2.43402099609375, 2.558990478515625, 2.6839599609375, 2.808929443359375, 2.93389892578125, 3.058868408203125, 3.183837890625, 3.308807373046875, 3.43377685546875, 3.558746337890625, 3.6837158203125, 3.808685302734375, 3.93365478515625, 4.058624267578125, 4.18359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 2.0, 9.0, 3.0, 7.0, 13.0, 5.0, 20.0, 18.0, 14.0, 16.0, 21.0, 27.0, 33.0, 35.0, 41.0, 43.0, 37.0, 42.0, 54.0, 51.0, 40.0, 41.0, 41.0, 31.0, 45.0, 38.0, 26.0, 24.0, 31.0, 31.0, 27.0, 21.0, 18.0, 13.0, 24.0, 12.0, 11.0, 10.0, 11.0, 4.0, 5.0, 2.0, 1.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.00390625, -5.80780029296875, -5.6116943359375, -5.41558837890625, -5.219482421875, -5.02337646484375, -4.8272705078125, -4.63116455078125, -4.43505859375, -4.23895263671875, -4.0428466796875, -3.84674072265625, -3.650634765625, -3.45452880859375, -3.2584228515625, -3.06231689453125, -2.8662109375, -2.67010498046875, -2.4739990234375, -2.27789306640625, -2.081787109375, -1.88568115234375, -1.6895751953125, -1.49346923828125, -1.29736328125, -1.10125732421875, -0.9051513671875, -0.70904541015625, -0.512939453125, -0.31683349609375, -0.1207275390625, 0.07537841796875, 0.271484375, 0.46759033203125, 0.6636962890625, 0.85980224609375, 1.055908203125, 1.25201416015625, 1.4481201171875, 1.64422607421875, 1.84033203125, 2.03643798828125, 2.2325439453125, 2.42864990234375, 2.624755859375, 2.82086181640625, 3.0169677734375, 3.21307373046875, 3.4091796875, 3.60528564453125, 3.8013916015625, 3.99749755859375, 4.193603515625, 4.38970947265625, 4.5858154296875, 4.78192138671875, 4.97802734375, 5.17413330078125, 5.3702392578125, 5.56634521484375, 5.762451171875, 5.95855712890625, 6.1546630859375, 6.35076904296875, 6.546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 14.0, 18.0, 29.0, 27.0, 43.0, 62.0, 132.0, 194.0, 277.0, 488.0, 690.0, 1184.0, 2060.0, 3363.0, 5674.0, 9014.0, 14783.0, 24026.0, 37313.0, 55996.0, 79844.0, 105002.0, 124343.0, 131697.0, 123185.0, 102163.0, 77837.0, 53813.0, 36136.0, 22772.0, 14134.0, 8597.0, 5396.0, 3160.0, 1952.0, 1176.0, 711.0, 458.0, 290.0, 174.0, 125.0, 85.0, 47.0, 27.0, 19.0, 7.0, 11.0, 3.0, 1.0, 4.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1953125, -5.0189208984375, -4.842529296875, -4.6661376953125, -4.48974609375, -4.3133544921875, -4.136962890625, -3.9605712890625, -3.7841796875, -3.6077880859375, -3.431396484375, -3.2550048828125, -3.07861328125, -2.9022216796875, -2.725830078125, -2.5494384765625, -2.373046875, -2.1966552734375, -2.020263671875, -1.8438720703125, -1.66748046875, -1.4910888671875, -1.314697265625, -1.1383056640625, -0.9619140625, -0.7855224609375, -0.609130859375, -0.4327392578125, -0.25634765625, -0.0799560546875, 0.096435546875, 0.2728271484375, 0.44921875, 0.6256103515625, 0.802001953125, 0.9783935546875, 1.15478515625, 1.3311767578125, 1.507568359375, 1.6839599609375, 1.8603515625, 2.0367431640625, 2.213134765625, 2.3895263671875, 2.56591796875, 2.7423095703125, 2.918701171875, 3.0950927734375, 3.271484375, 3.4478759765625, 3.624267578125, 3.8006591796875, 3.97705078125, 4.1534423828125, 4.329833984375, 4.5062255859375, 4.6826171875, 4.8590087890625, 5.035400390625, 5.2117919921875, 5.38818359375, 5.5645751953125, 5.740966796875, 5.9173583984375, 6.09375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 11.0, 8.0, 10.0, 11.0, 10.0, 21.0, 20.0, 21.0, 30.0, 20.0, 31.0, 28.0, 43.0, 42.0, 29.0, 39.0, 33.0, 40.0, 58.0, 34.0, 31.0, 40.0, 34.0, 29.0, 34.0, 31.0, 24.0, 35.0, 31.0, 26.0, 17.0, 20.0, 18.0, 16.0, 9.0, 10.0, 10.0, 9.0, 2.0, 5.0, 9.0, 3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.947265625, -3.824737548828125, -3.70220947265625, -3.579681396484375, -3.4571533203125, -3.334625244140625, -3.21209716796875, -3.089569091796875, -2.967041015625, -2.844512939453125, -2.72198486328125, -2.599456787109375, -2.4769287109375, -2.354400634765625, -2.23187255859375, -2.109344482421875, -1.98681640625, -1.864288330078125, -1.74176025390625, -1.619232177734375, -1.4967041015625, -1.374176025390625, -1.25164794921875, -1.129119873046875, -1.006591796875, -0.884063720703125, -0.76153564453125, -0.639007568359375, -0.5164794921875, -0.393951416015625, -0.27142333984375, -0.148895263671875, -0.0263671875, 0.096160888671875, 0.21868896484375, 0.341217041015625, 0.4637451171875, 0.586273193359375, 0.70880126953125, 0.831329345703125, 0.953857421875, 1.076385498046875, 1.19891357421875, 1.321441650390625, 1.4439697265625, 1.566497802734375, 1.68902587890625, 1.811553955078125, 1.93408203125, 2.056610107421875, 2.17913818359375, 2.301666259765625, 2.4241943359375, 2.546722412109375, 2.66925048828125, 2.791778564453125, 2.914306640625, 3.036834716796875, 3.15936279296875, 3.281890869140625, 3.4044189453125, 3.526947021484375, 3.64947509765625, 3.772003173828125, 3.89453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 3.0, 7.0, 6.0, 9.0, 23.0, 23.0, 35.0, 44.0, 75.0, 140.0, 157.0, 327.0, 528.0, 980.0, 1708.0, 3329.0, 6769.0, 14825.0, 33122.0, 71858.0, 145487.0, 228752.0, 236603.0, 156328.0, 79384.0, 36197.0, 16167.0, 7639.0, 3705.0, 1855.0, 1009.0, 565.0, 315.0, 206.0, 125.0, 75.0, 60.0, 41.0, 24.0, 16.0, 15.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.015625, -5.84405517578125, -5.6724853515625, -5.50091552734375, -5.329345703125, -5.15777587890625, -4.9862060546875, -4.81463623046875, -4.64306640625, -4.47149658203125, -4.2999267578125, -4.12835693359375, -3.956787109375, -3.78521728515625, -3.6136474609375, -3.44207763671875, -3.2705078125, -3.09893798828125, -2.9273681640625, -2.75579833984375, -2.584228515625, -2.41265869140625, -2.2410888671875, -2.06951904296875, -1.89794921875, -1.72637939453125, -1.5548095703125, -1.38323974609375, -1.211669921875, -1.04010009765625, -0.8685302734375, -0.69696044921875, -0.525390625, -0.35382080078125, -0.1822509765625, -0.01068115234375, 0.160888671875, 0.33245849609375, 0.5040283203125, 0.67559814453125, 0.84716796875, 1.01873779296875, 1.1903076171875, 1.36187744140625, 1.533447265625, 1.70501708984375, 1.8765869140625, 2.04815673828125, 2.2197265625, 2.39129638671875, 2.5628662109375, 2.73443603515625, 2.906005859375, 3.07757568359375, 3.2491455078125, 3.42071533203125, 3.59228515625, 3.76385498046875, 3.9354248046875, 4.10699462890625, 4.278564453125, 4.45013427734375, 4.6217041015625, 4.79327392578125, 4.96484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 7.0, 9.0, 14.0, 13.0, 21.0, 30.0, 33.0, 42.0, 48.0, 71.0, 66.0, 72.0, 88.0, 78.0, 81.0, 63.0, 52.0, 40.0, 38.0, 27.0, 28.0, 18.0, 12.0, 13.0, 15.0, 12.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005078315734863281, -0.0004917308688163757, -0.00047563016414642334, -0.00045952945947647095, -0.00044342875480651855, -0.00042732805013656616, -0.00041122734546661377, -0.0003951266407966614, -0.000379025936126709, -0.0003629252314567566, -0.0003468245267868042, -0.0003307238221168518, -0.0003146231174468994, -0.000298522412776947, -0.00028242170810699463, -0.00026632100343704224, -0.00025022029876708984, -0.00023411959409713745, -0.00021801888942718506, -0.00020191818475723267, -0.00018581748008728027, -0.00016971677541732788, -0.0001536160707473755, -0.0001375153660774231, -0.0001214146614074707, -0.00010531395673751831, -8.921325206756592e-05, -7.311254739761353e-05, -5.701184272766113e-05, -4.091113805770874e-05, -2.4810433387756348e-05, -8.709728717803955e-06, 7.3909759521484375e-06, 2.349168062210083e-05, 3.959238529205322e-05, 5.5693089962005615e-05, 7.179379463195801e-05, 8.78944993019104e-05, 0.00010399520397186279, 0.00012009590864181519, 0.00013619661331176758, 0.00015229731798171997, 0.00016839802265167236, 0.00018449872732162476, 0.00020059943199157715, 0.00021670013666152954, 0.00023280084133148193, 0.0002489015460014343, 0.0002650022506713867, 0.0002811029553413391, 0.0002972036600112915, 0.0003133043646812439, 0.0003294050693511963, 0.0003455057740211487, 0.0003616064786911011, 0.00037770718336105347, 0.00039380788803100586, 0.00040990859270095825, 0.00042600929737091064, 0.00044211000204086304, 0.00045821070671081543, 0.0004743114113807678, 0.0004904121160507202, 0.0005065128207206726, 0.000522613525390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 6.0, 7.0, 11.0, 19.0, 34.0, 37.0, 59.0, 90.0, 125.0, 205.0, 301.0, 505.0, 788.0, 1337.0, 2250.0, 3718.0, 6802.0, 12131.0, 21179.0, 37650.0, 63485.0, 100856.0, 141363.0, 165700.0, 158629.0, 125390.0, 84926.0, 51733.0, 29826.0, 16844.0, 9354.0, 5256.0, 3138.0, 1847.0, 1106.0, 652.0, 412.0, 255.0, 167.0, 121.0, 69.0, 63.0, 39.0, 17.0, 11.0, 11.0, 5.0, 7.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.513671875, -3.403167724609375, -3.29266357421875, -3.182159423828125, -3.0716552734375, -2.961151123046875, -2.85064697265625, -2.740142822265625, -2.629638671875, -2.519134521484375, -2.40863037109375, -2.298126220703125, -2.1876220703125, -2.077117919921875, -1.96661376953125, -1.856109619140625, -1.74560546875, -1.635101318359375, -1.52459716796875, -1.414093017578125, -1.3035888671875, -1.193084716796875, -1.08258056640625, -0.972076416015625, -0.861572265625, -0.751068115234375, -0.64056396484375, -0.530059814453125, -0.4195556640625, -0.309051513671875, -0.19854736328125, -0.088043212890625, 0.0224609375, 0.132965087890625, 0.24346923828125, 0.353973388671875, 0.4644775390625, 0.574981689453125, 0.68548583984375, 0.795989990234375, 0.906494140625, 1.016998291015625, 1.12750244140625, 1.238006591796875, 1.3485107421875, 1.459014892578125, 1.56951904296875, 1.680023193359375, 1.79052734375, 1.901031494140625, 2.01153564453125, 2.122039794921875, 2.2325439453125, 2.343048095703125, 2.45355224609375, 2.564056396484375, 2.674560546875, 2.785064697265625, 2.89556884765625, 3.006072998046875, 3.1165771484375, 3.227081298828125, 3.33758544921875, 3.448089599609375, 3.55859375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 11.0, 8.0, 8.0, 16.0, 11.0, 19.0, 15.0, 31.0, 22.0, 38.0, 44.0, 48.0, 63.0, 50.0, 58.0, 44.0, 57.0, 59.0, 54.0, 49.0, 39.0, 38.0, 45.0, 26.0, 25.0, 24.0, 20.0, 17.0, 11.0, 9.0, 12.0, 9.0, 6.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0390625, -1.002166748046875, -0.96527099609375, -0.928375244140625, -0.8914794921875, -0.854583740234375, -0.81768798828125, -0.780792236328125, -0.743896484375, -0.707000732421875, -0.67010498046875, -0.633209228515625, -0.5963134765625, -0.559417724609375, -0.52252197265625, -0.485626220703125, -0.44873046875, -0.411834716796875, -0.37493896484375, -0.338043212890625, -0.3011474609375, -0.264251708984375, -0.22735595703125, -0.190460205078125, -0.153564453125, -0.116668701171875, -0.07977294921875, -0.042877197265625, -0.0059814453125, 0.030914306640625, 0.06781005859375, 0.104705810546875, 0.1416015625, 0.178497314453125, 0.21539306640625, 0.252288818359375, 0.2891845703125, 0.326080322265625, 0.36297607421875, 0.399871826171875, 0.436767578125, 0.473663330078125, 0.51055908203125, 0.547454833984375, 0.5843505859375, 0.621246337890625, 0.65814208984375, 0.695037841796875, 0.73193359375, 0.768829345703125, 0.80572509765625, 0.842620849609375, 0.8795166015625, 0.916412353515625, 0.95330810546875, 0.990203857421875, 1.027099609375, 1.063995361328125, 1.10089111328125, 1.137786865234375, 1.1746826171875, 1.211578369140625, 1.24847412109375, 1.285369873046875, 1.322265625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 9.0, 5.0, 7.0, 4.0, 8.0, 7.0, 23.0, 10.0, 15.0, 24.0, 32.0, 37.0, 39.0, 41.0, 45.0, 37.0, 62.0, 60.0, 45.0, 52.0, 54.0, 51.0, 42.0, 42.0, 47.0, 37.0, 30.0, 34.0, 19.0, 19.0, 9.0, 18.0, 10.0, 9.0, 4.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.6572184562683105, -6.447844505310059, -6.238470554351807, -6.029096603393555, -5.819723129272461, -5.610349178314209, -5.400975227355957, -5.191601276397705, -4.982227325439453, -4.772853374481201, -4.563479423522949, -4.3541059494018555, -4.1447319984436035, -3.9353580474853516, -3.7259840965270996, -3.5166101455688477, -3.307236671447754, -3.097862720489502, -2.888489007949829, -2.679115056991577, -2.4697413444519043, -2.2603673934936523, -2.0509934425354004, -1.841619610786438, -1.6322457790374756, -1.4228719472885132, -1.2134981155395508, -1.0041241645812988, -0.7947503328323364, -0.585376501083374, -0.37600255012512207, -0.16662871837615967, 0.04274463653564453, 0.2521184980869293, 0.4614923596382141, 0.6708662509918213, 0.8802400827407837, 1.089613914489746, 1.298987865447998, 1.5083616971969604, 1.7177355289459229, 1.9271093606948853, 2.1364831924438477, 2.3458571434020996, 2.5552310943603516, 2.7646048069000244, 2.9739787578582764, 3.183352470397949, 3.392726421356201, 3.602100372314453, 3.811474084854126, 4.020848274230957, 4.230221748352051, 4.439595699310303, 4.648969650268555, 4.858343601226807, 5.067717552185059, 5.2770915031433105, 5.4864654541015625, 5.695838928222656, 5.905212879180908, 6.11458683013916, 6.323960781097412, 6.533334732055664, 6.742708206176758]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 6.0, 3.0, 4.0, 6.0, 11.0, 7.0, 6.0, 17.0, 21.0, 22.0, 25.0, 27.0, 33.0, 30.0, 49.0, 40.0, 50.0, 42.0, 43.0, 46.0, 48.0, 45.0, 44.0, 41.0, 50.0, 41.0, 26.0, 32.0, 27.0, 33.0, 21.0, 16.0, 22.0, 10.0, 10.0, 25.0, 10.0, 1.0, 8.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.617056369781494, -6.405831813812256, -6.194606781005859, -5.983382225036621, -5.772157192230225, -5.560932636260986, -5.34970760345459, -5.138483047485352, -4.927258491516113, -4.716033935546875, -4.5048089027404785, -4.29358434677124, -4.082359313964844, -3.8711347579956055, -3.659909963607788, -3.4486851692199707, -3.237460136413574, -3.026235342025757, -2.8150105476379395, -2.603785991668701, -2.3925609588623047, -2.1813364028930664, -1.970111608505249, -1.7588868141174316, -1.5476620197296143, -1.3364372253417969, -1.1252124309539795, -0.9139877557754517, -0.7027629613876343, -0.4915381669998169, -0.28031349182128906, -0.06908869743347168, 0.1421365737915039, 0.3533613383769989, 0.5645861029624939, 0.7758108377456665, 0.9870356321334839, 1.1982604265213013, 1.409485101699829, 1.6207098960876465, 1.8319346904754639, 2.0431594848632812, 2.2543842792510986, 2.465609073638916, 2.6768336296081543, 2.888058662414551, 3.099283218383789, 3.3105080127716064, 3.521732807159424, 3.732957601547241, 3.9441823959350586, 4.155406951904297, 4.366631984710693, 4.577856540679932, 4.789081573486328, 5.000306129455566, 5.211530685424805, 5.422755241394043, 5.6339802742004395, 5.845204830169678, 6.056429862976074, 6.2676544189453125, 6.478878974914551, 6.690104007720947, 6.901329040527344]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 4.0, 16.0, 25.0, 41.0, 48.0, 69.0, 129.0, 172.0, 260.0, 345.0, 579.0, 886.0, 1393.0, 2044.0, 3044.0, 4730.0, 7387.0, 11689.0, 18059.0, 28125.0, 44387.0, 70878.0, 110240.0, 168093.0, 247590.0, 346142.0, 445778.0, 511872.0, 523101.0, 469206.0, 373396.0, 274298.0, 187197.0, 123571.0, 79647.0, 50256.0, 32102.0, 20531.0, 13044.0, 8193.0, 5482.0, 3556.0, 2216.0, 1556.0, 965.0, 691.0, 462.0, 297.0, 169.0, 124.0, 95.0, 44.0, 24.0, 26.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0], "bins": [-3.818359375, -3.699554443359375, -3.58074951171875, -3.461944580078125, -3.3431396484375, -3.224334716796875, -3.10552978515625, -2.986724853515625, -2.867919921875, -2.749114990234375, -2.63031005859375, -2.511505126953125, -2.3927001953125, -2.273895263671875, -2.15509033203125, -2.036285400390625, -1.91748046875, -1.798675537109375, -1.67987060546875, -1.561065673828125, -1.4422607421875, -1.323455810546875, -1.20465087890625, -1.085845947265625, -0.967041015625, -0.848236083984375, -0.72943115234375, -0.610626220703125, -0.4918212890625, -0.373016357421875, -0.25421142578125, -0.135406494140625, -0.0166015625, 0.102203369140625, 0.22100830078125, 0.339813232421875, 0.4586181640625, 0.577423095703125, 0.69622802734375, 0.815032958984375, 0.933837890625, 1.052642822265625, 1.17144775390625, 1.290252685546875, 1.4090576171875, 1.527862548828125, 1.64666748046875, 1.765472412109375, 1.88427734375, 2.003082275390625, 2.12188720703125, 2.240692138671875, 2.3594970703125, 2.478302001953125, 2.59710693359375, 2.715911865234375, 2.834716796875, 2.953521728515625, 3.07232666015625, 3.191131591796875, 3.3099365234375, 3.428741455078125, 3.54754638671875, 3.666351318359375, 3.78515625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 8.0, 7.0, 2.0, 5.0, 6.0, 13.0, 11.0, 17.0, 20.0, 27.0, 25.0, 30.0, 25.0, 35.0, 31.0, 52.0, 52.0, 43.0, 44.0, 42.0, 49.0, 51.0, 49.0, 39.0, 35.0, 34.0, 44.0, 30.0, 34.0, 21.0, 17.0, 28.0, 23.0, 10.0, 12.0, 9.0, 5.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.63671875, -5.4658203125, -5.294921875, -5.1240234375, -4.953125, -4.7822265625, -4.611328125, -4.4404296875, -4.26953125, -4.0986328125, -3.927734375, -3.7568359375, -3.5859375, -3.4150390625, -3.244140625, -3.0732421875, -2.90234375, -2.7314453125, -2.560546875, -2.3896484375, -2.21875, -2.0478515625, -1.876953125, -1.7060546875, -1.53515625, -1.3642578125, -1.193359375, -1.0224609375, -0.8515625, -0.6806640625, -0.509765625, -0.3388671875, -0.16796875, 0.0029296875, 0.173828125, 0.3447265625, 0.515625, 0.6865234375, 0.857421875, 1.0283203125, 1.19921875, 1.3701171875, 1.541015625, 1.7119140625, 1.8828125, 2.0537109375, 2.224609375, 2.3955078125, 2.56640625, 2.7373046875, 2.908203125, 3.0791015625, 3.25, 3.4208984375, 3.591796875, 3.7626953125, 3.93359375, 4.1044921875, 4.275390625, 4.4462890625, 4.6171875, 4.7880859375, 4.958984375, 5.1298828125, 5.30078125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 11.0, 13.0, 25.0, 36.0, 75.0, 108.0, 198.0, 352.0, 567.0, 867.0, 1540.0, 2917.0, 5238.0, 9590.0, 17592.0, 33331.0, 62705.0, 115601.0, 204601.0, 342946.0, 516868.0, 666751.0, 696084.0, 572132.0, 396524.0, 243358.0, 139093.0, 75955.0, 40909.0, 22228.0, 11691.0, 6371.0, 3432.0, 1841.0, 1121.0, 669.0, 371.0, 231.0, 135.0, 75.0, 43.0, 40.0, 23.0, 7.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.63671875, -5.4498291015625, -5.262939453125, -5.0760498046875, -4.88916015625, -4.7022705078125, -4.515380859375, -4.3284912109375, -4.1416015625, -3.9547119140625, -3.767822265625, -3.5809326171875, -3.39404296875, -3.2071533203125, -3.020263671875, -2.8333740234375, -2.646484375, -2.4595947265625, -2.272705078125, -2.0858154296875, -1.89892578125, -1.7120361328125, -1.525146484375, -1.3382568359375, -1.1513671875, -0.9644775390625, -0.777587890625, -0.5906982421875, -0.40380859375, -0.2169189453125, -0.030029296875, 0.1568603515625, 0.34375, 0.5306396484375, 0.717529296875, 0.9044189453125, 1.09130859375, 1.2781982421875, 1.465087890625, 1.6519775390625, 1.8388671875, 2.0257568359375, 2.212646484375, 2.3995361328125, 2.58642578125, 2.7733154296875, 2.960205078125, 3.1470947265625, 3.333984375, 3.5208740234375, 3.707763671875, 3.8946533203125, 4.08154296875, 4.2684326171875, 4.455322265625, 4.6422119140625, 4.8291015625, 5.0159912109375, 5.202880859375, 5.3897705078125, 5.57666015625, 5.7635498046875, 5.950439453125, 6.1373291015625, 6.32421875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 4.0, 4.0, 6.0, 9.0, 8.0, 10.0, 24.0, 16.0, 23.0, 27.0, 25.0, 47.0, 52.0, 68.0, 102.0, 61.0, 117.0, 124.0, 135.0, 179.0, 152.0, 164.0, 204.0, 194.0, 218.0, 222.0, 200.0, 195.0, 193.0, 194.0, 168.0, 140.0, 133.0, 99.0, 70.0, 75.0, 81.0, 63.0, 61.0, 43.0, 41.0, 27.0, 24.0, 24.0, 17.0, 13.0, 8.0, 5.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.857421875, -1.79510498046875, -1.7327880859375, -1.67047119140625, -1.608154296875, -1.54583740234375, -1.4835205078125, -1.42120361328125, -1.35888671875, -1.29656982421875, -1.2342529296875, -1.17193603515625, -1.109619140625, -1.04730224609375, -0.9849853515625, -0.92266845703125, -0.8603515625, -0.79803466796875, -0.7357177734375, -0.67340087890625, -0.611083984375, -0.54876708984375, -0.4864501953125, -0.42413330078125, -0.36181640625, -0.29949951171875, -0.2371826171875, -0.17486572265625, -0.112548828125, -0.05023193359375, 0.0120849609375, 0.07440185546875, 0.13671875, 0.19903564453125, 0.2613525390625, 0.32366943359375, 0.385986328125, 0.44830322265625, 0.5106201171875, 0.57293701171875, 0.63525390625, 0.69757080078125, 0.7598876953125, 0.82220458984375, 0.884521484375, 0.94683837890625, 1.0091552734375, 1.07147216796875, 1.1337890625, 1.19610595703125, 1.2584228515625, 1.32073974609375, 1.383056640625, 1.44537353515625, 1.5076904296875, 1.57000732421875, 1.63232421875, 1.69464111328125, 1.7569580078125, 1.81927490234375, 1.881591796875, 1.94390869140625, 2.0062255859375, 2.06854248046875, 2.130859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 6.0, 4.0, 15.0, 16.0, 19.0, 15.0, 22.0, 31.0, 44.0, 25.0, 29.0, 37.0, 41.0, 44.0, 53.0, 41.0, 43.0, 56.0, 59.0, 51.0, 43.0, 40.0, 43.0, 29.0, 27.0, 33.0, 19.0, 20.0, 25.0, 15.0, 15.0, 8.0, 4.0, 4.0, 6.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.944758892059326, -6.751553058624268, -6.558347225189209, -6.36514139175415, -6.171935081481934, -5.978729248046875, -5.785523414611816, -5.592317581176758, -5.399111747741699, -5.205905914306641, -5.012700080871582, -4.819494247436523, -4.626288414001465, -4.433082103729248, -4.2398762702941895, -4.046670436859131, -3.8534646034240723, -3.6602587699890137, -3.467052936553955, -3.2738468647003174, -3.080641031265259, -2.8874351978302, -2.6942291259765625, -2.501023292541504, -2.3078174591064453, -2.1146116256713867, -1.9214056730270386, -1.7281997203826904, -1.5349938869476318, -1.3417880535125732, -1.148582100868225, -0.955376148223877, -0.7621707916259766, -0.5689648985862732, -0.3757590055465698, -0.18255311250686646, 0.010652780532836914, 0.20385867357254028, 0.39706456661224365, 0.5902705192565918, 0.7834763526916504, 0.9766822457313538, 1.1698881387710571, 1.3630940914154053, 1.5562999248504639, 1.7495057582855225, 1.9427117109298706, 2.1359176635742188, 2.3291234970092773, 2.522329330444336, 2.7155351638793945, 2.9087412357330322, 3.101947069168091, 3.2951529026031494, 3.488358974456787, 3.6815648078918457, 3.8747706413269043, 4.067976474761963, 4.2611823081970215, 4.45438814163208, 4.647594451904297, 4.8408002853393555, 5.034006118774414, 5.227211952209473, 5.420417785644531]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 5.0, 9.0, 13.0, 19.0, 17.0, 19.0, 27.0, 26.0, 26.0, 24.0, 32.0, 36.0, 47.0, 38.0, 45.0, 44.0, 58.0, 45.0, 45.0, 57.0, 42.0, 30.0, 27.0, 42.0, 35.0, 33.0, 24.0, 26.0, 19.0, 11.0, 11.0, 19.0, 10.0, 7.0, 4.0, 9.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.331544876098633, -6.138935565948486, -5.946326732635498, -5.753717422485352, -5.561108112335205, -5.368499279022217, -5.17588996887207, -4.983281135559082, -4.7906718254089355, -4.598062515258789, -4.405453681945801, -4.212844371795654, -4.020235061645508, -3.8276262283325195, -3.635016918182373, -3.4424078464508057, -3.249798536300659, -3.057189464569092, -2.8645801544189453, -2.671971082687378, -2.4793620109558105, -2.286752700805664, -2.0941436290740967, -1.9015345573425293, -1.7089253664016724, -1.5163161754608154, -1.323707103729248, -1.1310979127883911, -0.938488781452179, -0.7458796501159668, -0.5532704591751099, -0.3606613874435425, -0.16805219650268555, 0.024556949734687805, 0.21716609597206116, 0.4097752571105957, 0.6023843884468079, 0.79499351978302, 0.987602710723877, 1.1802117824554443, 1.3728209733963013, 1.5654301643371582, 1.7580392360687256, 1.9506484270095825, 2.1432576179504395, 2.335866689682007, 2.528475761413574, 2.7210850715637207, 2.913694143295288, 3.1063032150268555, 3.298912525177002, 3.4915215969085693, 3.6841306686401367, 3.876739978790283, 4.06934928894043, 4.261958122253418, 4.4545674324035645, 4.647176742553711, 4.839785575866699, 5.032394886016846, 5.225004196166992, 5.4176130294799805, 5.610222339630127, 5.802831649780273, 5.995440483093262]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 7.0, 10.0, 8.0, 15.0, 27.0, 30.0, 58.0, 68.0, 80.0, 113.0, 180.0, 231.0, 320.0, 476.0, 734.0, 967.0, 1438.0, 2214.0, 3271.0, 5059.0, 8101.0, 13354.0, 23527.0, 45159.0, 97972.0, 212579.0, 286136.0, 176260.0, 79998.0, 37788.0, 19953.0, 11559.0, 7121.0, 4470.0, 2968.0, 1916.0, 1271.0, 925.0, 615.0, 437.0, 324.0, 224.0, 172.0, 125.0, 79.0, 60.0, 43.0, 29.0, 16.0, 14.0, 20.0, 12.0, 7.0, 9.0, 0.0, 4.0, 3.0, 4.0], "bins": [-10.28125, -9.963623046875, -9.64599609375, -9.328369140625, -9.0107421875, -8.693115234375, -8.37548828125, -8.057861328125, -7.740234375, -7.422607421875, -7.10498046875, -6.787353515625, -6.4697265625, -6.152099609375, -5.83447265625, -5.516845703125, -5.19921875, -4.881591796875, -4.56396484375, -4.246337890625, -3.9287109375, -3.611083984375, -3.29345703125, -2.975830078125, -2.658203125, -2.340576171875, -2.02294921875, -1.705322265625, -1.3876953125, -1.070068359375, -0.75244140625, -0.434814453125, -0.1171875, 0.200439453125, 0.51806640625, 0.835693359375, 1.1533203125, 1.470947265625, 1.78857421875, 2.106201171875, 2.423828125, 2.741455078125, 3.05908203125, 3.376708984375, 3.6943359375, 4.011962890625, 4.32958984375, 4.647216796875, 4.96484375, 5.282470703125, 5.60009765625, 5.917724609375, 6.2353515625, 6.552978515625, 6.87060546875, 7.188232421875, 7.505859375, 7.823486328125, 8.14111328125, 8.458740234375, 8.7763671875, 9.093994140625, 9.41162109375, 9.729248046875, 10.046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 5.0, 4.0, 10.0, 11.0, 11.0, 23.0, 15.0, 19.0, 23.0, 30.0, 27.0, 35.0, 29.0, 35.0, 30.0, 44.0, 42.0, 42.0, 40.0, 45.0, 53.0, 44.0, 56.0, 40.0, 40.0, 23.0, 36.0, 30.0, 28.0, 17.0, 24.0, 22.0, 16.0, 4.0, 9.0, 12.0, 7.0, 8.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.10546875, -5.921142578125, -5.73681640625, -5.552490234375, -5.3681640625, -5.183837890625, -4.99951171875, -4.815185546875, -4.630859375, -4.446533203125, -4.26220703125, -4.077880859375, -3.8935546875, -3.709228515625, -3.52490234375, -3.340576171875, -3.15625, -2.971923828125, -2.78759765625, -2.603271484375, -2.4189453125, -2.234619140625, -2.05029296875, -1.865966796875, -1.681640625, -1.497314453125, -1.31298828125, -1.128662109375, -0.9443359375, -0.760009765625, -0.57568359375, -0.391357421875, -0.20703125, -0.022705078125, 0.16162109375, 0.345947265625, 0.5302734375, 0.714599609375, 0.89892578125, 1.083251953125, 1.267578125, 1.451904296875, 1.63623046875, 1.820556640625, 2.0048828125, 2.189208984375, 2.37353515625, 2.557861328125, 2.7421875, 2.926513671875, 3.11083984375, 3.295166015625, 3.4794921875, 3.663818359375, 3.84814453125, 4.032470703125, 4.216796875, 4.401123046875, 4.58544921875, 4.769775390625, 4.9541015625, 5.138427734375, 5.32275390625, 5.507080078125, 5.69140625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 5.0, 13.0, 28.0, 34.0, 36.0, 58.0, 83.0, 121.0, 204.0, 273.0, 373.0, 541.0, 815.0, 1233.0, 1954.0, 3056.0, 4904.0, 7746.0, 12795.0, 22519.0, 41345.0, 84656.0, 185877.0, 297192.0, 193819.0, 87787.0, 42838.0, 23410.0, 13132.0, 7977.0, 4844.0, 3008.0, 1957.0, 1238.0, 859.0, 605.0, 379.0, 255.0, 170.0, 136.0, 100.0, 55.0, 38.0, 20.0, 25.0, 15.0, 12.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.9296875, -9.6043701171875, -9.279052734375, -8.9537353515625, -8.62841796875, -8.3031005859375, -7.977783203125, -7.6524658203125, -7.3271484375, -7.0018310546875, -6.676513671875, -6.3511962890625, -6.02587890625, -5.7005615234375, -5.375244140625, -5.0499267578125, -4.724609375, -4.3992919921875, -4.073974609375, -3.7486572265625, -3.42333984375, -3.0980224609375, -2.772705078125, -2.4473876953125, -2.1220703125, -1.7967529296875, -1.471435546875, -1.1461181640625, -0.82080078125, -0.4954833984375, -0.170166015625, 0.1551513671875, 0.48046875, 0.8057861328125, 1.131103515625, 1.4564208984375, 1.78173828125, 2.1070556640625, 2.432373046875, 2.7576904296875, 3.0830078125, 3.4083251953125, 3.733642578125, 4.0589599609375, 4.38427734375, 4.7095947265625, 5.034912109375, 5.3602294921875, 5.685546875, 6.0108642578125, 6.336181640625, 6.6614990234375, 6.98681640625, 7.3121337890625, 7.637451171875, 7.9627685546875, 8.2880859375, 8.6134033203125, 8.938720703125, 9.2640380859375, 9.58935546875, 9.9146728515625, 10.239990234375, 10.5653076171875, 10.890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 9.0, 8.0, 6.0, 5.0, 16.0, 20.0, 14.0, 26.0, 11.0, 23.0, 36.0, 23.0, 35.0, 25.0, 37.0, 32.0, 38.0, 41.0, 50.0, 34.0, 49.0, 41.0, 40.0, 33.0, 29.0, 38.0, 29.0, 30.0, 28.0, 28.0, 26.0, 23.0, 19.0, 18.0, 15.0, 10.0, 7.0, 9.0, 8.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.08984375, -2.97564697265625, -2.8614501953125, -2.74725341796875, -2.633056640625, -2.51885986328125, -2.4046630859375, -2.29046630859375, -2.17626953125, -2.06207275390625, -1.9478759765625, -1.83367919921875, -1.719482421875, -1.60528564453125, -1.4910888671875, -1.37689208984375, -1.2626953125, -1.14849853515625, -1.0343017578125, -0.92010498046875, -0.805908203125, -0.69171142578125, -0.5775146484375, -0.46331787109375, -0.34912109375, -0.23492431640625, -0.1207275390625, -0.00653076171875, 0.107666015625, 0.22186279296875, 0.3360595703125, 0.45025634765625, 0.564453125, 0.67864990234375, 0.7928466796875, 0.90704345703125, 1.021240234375, 1.13543701171875, 1.2496337890625, 1.36383056640625, 1.47802734375, 1.59222412109375, 1.7064208984375, 1.82061767578125, 1.934814453125, 2.04901123046875, 2.1632080078125, 2.27740478515625, 2.3916015625, 2.50579833984375, 2.6199951171875, 2.73419189453125, 2.848388671875, 2.96258544921875, 3.0767822265625, 3.19097900390625, 3.30517578125, 3.41937255859375, 3.5335693359375, 3.64776611328125, 3.761962890625, 3.87615966796875, 3.9903564453125, 4.10455322265625, 4.21875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 6.0, 11.0, 7.0, 14.0, 20.0, 23.0, 39.0, 42.0, 76.0, 85.0, 133.0, 199.0, 270.0, 415.0, 642.0, 975.0, 1452.0, 2727.0, 6210.0, 37075.0, 860317.0, 119363.0, 9935.0, 3386.0, 1797.0, 1136.0, 716.0, 459.0, 336.0, 194.0, 146.0, 93.0, 63.0, 57.0, 45.0, 27.0, 18.0, 17.0, 12.0, 6.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.484375, -24.65380859375, -23.8232421875, -22.99267578125, -22.162109375, -21.33154296875, -20.5009765625, -19.67041015625, -18.83984375, -18.00927734375, -17.1787109375, -16.34814453125, -15.517578125, -14.68701171875, -13.8564453125, -13.02587890625, -12.1953125, -11.36474609375, -10.5341796875, -9.70361328125, -8.873046875, -8.04248046875, -7.2119140625, -6.38134765625, -5.55078125, -4.72021484375, -3.8896484375, -3.05908203125, -2.228515625, -1.39794921875, -0.5673828125, 0.26318359375, 1.09375, 1.92431640625, 2.7548828125, 3.58544921875, 4.416015625, 5.24658203125, 6.0771484375, 6.90771484375, 7.73828125, 8.56884765625, 9.3994140625, 10.22998046875, 11.060546875, 11.89111328125, 12.7216796875, 13.55224609375, 14.3828125, 15.21337890625, 16.0439453125, 16.87451171875, 17.705078125, 18.53564453125, 19.3662109375, 20.19677734375, 21.02734375, 21.85791015625, 22.6884765625, 23.51904296875, 24.349609375, 25.18017578125, 26.0107421875, 26.84130859375, 27.671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 17.0, 31.0, 63.0, 244.0, 435.0, 127.0, 40.0, 17.0, 10.0, 6.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020503997802734375, -0.0019905567169189453, -0.0019307136535644531, -0.001870870590209961, -0.0018110275268554688, -0.0017511844635009766, -0.0016913414001464844, -0.0016314983367919922, -0.0015716552734375, -0.0015118122100830078, -0.0014519691467285156, -0.0013921260833740234, -0.0013322830200195312, -0.001272439956665039, -0.0012125968933105469, -0.0011527538299560547, -0.0010929107666015625, -0.0010330677032470703, -0.0009732246398925781, -0.0009133815765380859, -0.0008535385131835938, -0.0007936954498291016, -0.0007338523864746094, -0.0006740093231201172, -0.000614166259765625, -0.0005543231964111328, -0.0004944801330566406, -0.00043463706970214844, -0.00037479400634765625, -0.00031495094299316406, -0.0002551078796386719, -0.0001952648162841797, -0.0001354217529296875, -7.557868957519531e-05, -1.5735626220703125e-05, 4.410743713378906e-05, 0.00010395050048828125, 0.00016379356384277344, 0.00022363662719726562, 0.0002834796905517578, 0.00034332275390625, 0.0004031658172607422, 0.0004630088806152344, 0.0005228519439697266, 0.0005826950073242188, 0.0006425380706787109, 0.0007023811340332031, 0.0007622241973876953, 0.0008220672607421875, 0.0008819103240966797, 0.0009417533874511719, 0.001001596450805664, 0.0010614395141601562, 0.0011212825775146484, 0.0011811256408691406, 0.0012409687042236328, 0.001300811767578125, 0.0013606548309326172, 0.0014204978942871094, 0.0014803409576416016, 0.0015401840209960938, 0.001600027084350586, 0.0016598701477050781, 0.0017197132110595703, 0.0017795562744140625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 9.0, 11.0, 13.0, 19.0, 42.0, 29.0, 48.0, 71.0, 86.0, 148.0, 202.0, 276.0, 355.0, 467.0, 642.0, 920.0, 1345.0, 2048.0, 3376.0, 6857.0, 16759.0, 56526.0, 241358.0, 484426.0, 165141.0, 39664.0, 13018.0, 5614.0, 2961.0, 1836.0, 1190.0, 865.0, 623.0, 425.0, 326.0, 259.0, 178.0, 102.0, 90.0, 54.0, 42.0, 37.0, 30.0, 27.0, 16.0, 11.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.8984375, -8.62353515625, -8.3486328125, -8.07373046875, -7.798828125, -7.52392578125, -7.2490234375, -6.97412109375, -6.69921875, -6.42431640625, -6.1494140625, -5.87451171875, -5.599609375, -5.32470703125, -5.0498046875, -4.77490234375, -4.5, -4.22509765625, -3.9501953125, -3.67529296875, -3.400390625, -3.12548828125, -2.8505859375, -2.57568359375, -2.30078125, -2.02587890625, -1.7509765625, -1.47607421875, -1.201171875, -0.92626953125, -0.6513671875, -0.37646484375, -0.1015625, 0.17333984375, 0.4482421875, 0.72314453125, 0.998046875, 1.27294921875, 1.5478515625, 1.82275390625, 2.09765625, 2.37255859375, 2.6474609375, 2.92236328125, 3.197265625, 3.47216796875, 3.7470703125, 4.02197265625, 4.296875, 4.57177734375, 4.8466796875, 5.12158203125, 5.396484375, 5.67138671875, 5.9462890625, 6.22119140625, 6.49609375, 6.77099609375, 7.0458984375, 7.32080078125, 7.595703125, 7.87060546875, 8.1455078125, 8.42041015625, 8.6953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 6.0, 10.0, 14.0, 8.0, 31.0, 51.0, 67.0, 93.0, 150.0, 155.0, 147.0, 99.0, 66.0, 33.0, 19.0, 9.0, 8.0, 6.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.130859375, -3.044952392578125, -2.95904541015625, -2.873138427734375, -2.7872314453125, -2.701324462890625, -2.61541748046875, -2.529510498046875, -2.443603515625, -2.357696533203125, -2.27178955078125, -2.185882568359375, -2.0999755859375, -2.014068603515625, -1.92816162109375, -1.842254638671875, -1.75634765625, -1.670440673828125, -1.58453369140625, -1.498626708984375, -1.4127197265625, -1.326812744140625, -1.24090576171875, -1.154998779296875, -1.069091796875, -0.983184814453125, -0.89727783203125, -0.811370849609375, -0.7254638671875, -0.639556884765625, -0.55364990234375, -0.467742919921875, -0.3818359375, -0.295928955078125, -0.21002197265625, -0.124114990234375, -0.0382080078125, 0.047698974609375, 0.13360595703125, 0.219512939453125, 0.305419921875, 0.391326904296875, 0.47723388671875, 0.563140869140625, 0.6490478515625, 0.734954833984375, 0.82086181640625, 0.906768798828125, 0.99267578125, 1.078582763671875, 1.16448974609375, 1.250396728515625, 1.3363037109375, 1.422210693359375, 1.50811767578125, 1.594024658203125, 1.679931640625, 1.765838623046875, 1.85174560546875, 1.937652587890625, 2.0235595703125, 2.109466552734375, 2.19537353515625, 2.281280517578125, 2.3671875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 7.0, 7.0, 8.0, 20.0, 23.0, 19.0, 26.0, 29.0, 29.0, 33.0, 38.0, 42.0, 49.0, 64.0, 52.0, 37.0, 54.0, 56.0, 59.0, 48.0, 37.0, 44.0, 27.0, 33.0, 24.0, 27.0, 21.0, 13.0, 12.0, 14.0, 7.0, 7.0, 7.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.434037208557129, -6.23962926864624, -6.045221328735352, -5.850813388824463, -5.656405448913574, -5.461997032165527, -5.267589092254639, -5.07318115234375, -4.878773212432861, -4.684365272521973, -4.489957332611084, -4.295549392700195, -4.101140975952148, -3.906733274459839, -3.712325096130371, -3.5179171562194824, -3.3235092163085938, -3.129101276397705, -2.9346933364868164, -2.7402851581573486, -2.54587721824646, -2.3514692783355713, -2.1570611000061035, -1.9626531600952148, -1.7682452201843262, -1.5738372802734375, -1.3794292211532593, -1.185021162033081, -0.9906132221221924, -0.7962052226066589, -0.6017972230911255, -0.40738916397094727, -0.2129817008972168, -0.01857370138168335, 0.1758342981338501, 0.37024229764938354, 0.564650297164917, 0.7590582966804504, 0.9534662961959839, 1.147874355316162, 1.3422822952270508, 1.5366902351379395, 1.7310982942581177, 1.925506353378296, 2.1199142932891846, 2.3143222332000732, 2.508730411529541, 2.7031383514404297, 2.8975462913513184, 3.091954231262207, 3.2863621711730957, 3.4807703495025635, 3.675178289413452, 3.869586229324341, 4.063994407653809, 4.258402347564697, 4.452810287475586, 4.647218227386475, 4.841626167297363, 5.036034107208252, 5.230442047119141, 5.4248504638671875, 5.619258403778076, 5.813666343688965, 6.0080742835998535]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 7.0, 8.0, 11.0, 17.0, 15.0, 16.0, 19.0, 30.0, 25.0, 32.0, 23.0, 33.0, 38.0, 36.0, 45.0, 42.0, 38.0, 49.0, 58.0, 46.0, 39.0, 39.0, 38.0, 35.0, 39.0, 37.0, 21.0, 27.0, 24.0, 25.0, 13.0, 22.0, 8.0, 12.0, 8.0, 6.0, 4.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.0276007652282715, -5.844745635986328, -5.661890506744385, -5.479035377502441, -5.29617977142334, -5.1133246421813965, -4.930469512939453, -4.74761438369751, -4.564759254455566, -4.381904125213623, -4.19904899597168, -4.016193866729736, -3.833338499069214, -3.6504833698272705, -3.467628002166748, -3.2847728729248047, -3.1019177436828613, -2.919062614440918, -2.7362074851989746, -2.553352117538452, -2.370496988296509, -2.1876418590545654, -2.004786491394043, -1.8219313621520996, -1.6390762329101562, -1.456221103668213, -1.27336585521698, -1.090510606765747, -0.9076554775238037, -0.7248002886772156, -0.5419450998306274, -0.35908985137939453, -0.17623519897460938, 0.00661998987197876, 0.1894751787185669, 0.37233036756515503, 0.5551855564117432, 0.7380407452583313, 0.9208959341049194, 1.1037511825561523, 1.2866063117980957, 1.469461441040039, 1.652316689491272, 1.8351719379425049, 2.0180270671844482, 2.2008821964263916, 2.383737564086914, 2.5665926933288574, 2.749447822570801, 2.932302951812744, 3.1151580810546875, 3.29801344871521, 3.4808685779571533, 3.6637237071990967, 3.846579074859619, 4.0294342041015625, 4.212289333343506, 4.395144462585449, 4.577999591827393, 4.760854721069336, 4.9437103271484375, 5.126565456390381, 5.309420585632324, 5.492275714874268, 5.675130844116211]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 2.0, 6.0, 5.0, 3.0, 12.0, 17.0, 26.0, 42.0, 54.0, 93.0, 137.0, 220.0, 324.0, 439.0, 684.0, 1104.0, 1778.0, 2921.0, 4954.0, 8692.0, 15355.0, 27095.0, 47847.0, 81666.0, 124759.0, 162492.0, 172022.0, 145616.0, 102374.0, 63348.0, 36611.0, 19973.0, 11342.0, 6538.0, 3755.0, 2199.0, 1360.0, 963.0, 583.0, 402.0, 243.0, 147.0, 107.0, 83.0, 59.0, 31.0, 23.0, 17.0, 15.0, 8.0, 10.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-7.19921875, -6.989013671875, -6.77880859375, -6.568603515625, -6.3583984375, -6.148193359375, -5.93798828125, -5.727783203125, -5.517578125, -5.307373046875, -5.09716796875, -4.886962890625, -4.6767578125, -4.466552734375, -4.25634765625, -4.046142578125, -3.8359375, -3.625732421875, -3.41552734375, -3.205322265625, -2.9951171875, -2.784912109375, -2.57470703125, -2.364501953125, -2.154296875, -1.944091796875, -1.73388671875, -1.523681640625, -1.3134765625, -1.103271484375, -0.89306640625, -0.682861328125, -0.47265625, -0.262451171875, -0.05224609375, 0.157958984375, 0.3681640625, 0.578369140625, 0.78857421875, 0.998779296875, 1.208984375, 1.419189453125, 1.62939453125, 1.839599609375, 2.0498046875, 2.260009765625, 2.47021484375, 2.680419921875, 2.890625, 3.100830078125, 3.31103515625, 3.521240234375, 3.7314453125, 3.941650390625, 4.15185546875, 4.362060546875, 4.572265625, 4.782470703125, 4.99267578125, 5.202880859375, 5.4130859375, 5.623291015625, 5.83349609375, 6.043701171875, 6.25390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 9.0, 10.0, 12.0, 18.0, 17.0, 20.0, 21.0, 23.0, 25.0, 25.0, 39.0, 45.0, 43.0, 41.0, 41.0, 39.0, 43.0, 50.0, 55.0, 35.0, 48.0, 39.0, 40.0, 38.0, 41.0, 24.0, 25.0, 24.0, 20.0, 14.0, 15.0, 11.0, 12.0, 6.0, 4.0, 9.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.625, -5.4443359375, -5.263671875, -5.0830078125, -4.90234375, -4.7216796875, -4.541015625, -4.3603515625, -4.1796875, -3.9990234375, -3.818359375, -3.6376953125, -3.45703125, -3.2763671875, -3.095703125, -2.9150390625, -2.734375, -2.5537109375, -2.373046875, -2.1923828125, -2.01171875, -1.8310546875, -1.650390625, -1.4697265625, -1.2890625, -1.1083984375, -0.927734375, -0.7470703125, -0.56640625, -0.3857421875, -0.205078125, -0.0244140625, 0.15625, 0.3369140625, 0.517578125, 0.6982421875, 0.87890625, 1.0595703125, 1.240234375, 1.4208984375, 1.6015625, 1.7822265625, 1.962890625, 2.1435546875, 2.32421875, 2.5048828125, 2.685546875, 2.8662109375, 3.046875, 3.2275390625, 3.408203125, 3.5888671875, 3.76953125, 3.9501953125, 4.130859375, 4.3115234375, 4.4921875, 4.6728515625, 4.853515625, 5.0341796875, 5.21484375, 5.3955078125, 5.576171875, 5.7568359375, 5.9375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 6.0, 3.0, 3.0, 7.0, 13.0, 18.0, 25.0, 37.0, 57.0, 69.0, 113.0, 169.0, 249.0, 343.0, 480.0, 733.0, 1141.0, 1706.0, 2551.0, 4081.0, 6212.0, 9873.0, 15521.0, 24296.0, 37382.0, 55762.0, 79166.0, 105422.0, 125533.0, 132893.0, 123067.0, 100522.0, 73716.0, 51264.0, 34183.0, 22184.0, 14153.0, 9062.0, 5732.0, 3663.0, 2388.0, 1596.0, 1030.0, 665.0, 453.0, 293.0, 223.0, 159.0, 123.0, 66.0, 48.0, 33.0, 19.0, 25.0, 16.0, 4.0, 5.0, 7.0, 4.0, 0.0, 2.0], "bins": [-5.73828125, -5.5611572265625, -5.384033203125, -5.2069091796875, -5.02978515625, -4.8526611328125, -4.675537109375, -4.4984130859375, -4.3212890625, -4.1441650390625, -3.967041015625, -3.7899169921875, -3.61279296875, -3.4356689453125, -3.258544921875, -3.0814208984375, -2.904296875, -2.7271728515625, -2.550048828125, -2.3729248046875, -2.19580078125, -2.0186767578125, -1.841552734375, -1.6644287109375, -1.4873046875, -1.3101806640625, -1.133056640625, -0.9559326171875, -0.77880859375, -0.6016845703125, -0.424560546875, -0.2474365234375, -0.0703125, 0.1068115234375, 0.283935546875, 0.4610595703125, 0.63818359375, 0.8153076171875, 0.992431640625, 1.1695556640625, 1.3466796875, 1.5238037109375, 1.700927734375, 1.8780517578125, 2.05517578125, 2.2322998046875, 2.409423828125, 2.5865478515625, 2.763671875, 2.9407958984375, 3.117919921875, 3.2950439453125, 3.47216796875, 3.6492919921875, 3.826416015625, 4.0035400390625, 4.1806640625, 4.3577880859375, 4.534912109375, 4.7120361328125, 4.88916015625, 5.0662841796875, 5.243408203125, 5.4205322265625, 5.59765625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 10.0, 0.0, 6.0, 6.0, 11.0, 7.0, 10.0, 17.0, 16.0, 9.0, 16.0, 23.0, 25.0, 17.0, 23.0, 21.0, 35.0, 31.0, 46.0, 39.0, 47.0, 26.0, 32.0, 40.0, 40.0, 33.0, 27.0, 31.0, 35.0, 32.0, 27.0, 18.0, 29.0, 18.0, 29.0, 24.0, 10.0, 15.0, 17.0, 13.0, 24.0, 18.0, 10.0, 6.0, 10.0, 4.0, 4.0, 9.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-2.880859375, -2.78302001953125, -2.6851806640625, -2.58734130859375, -2.489501953125, -2.39166259765625, -2.2938232421875, -2.19598388671875, -2.09814453125, -2.00030517578125, -1.9024658203125, -1.80462646484375, -1.706787109375, -1.60894775390625, -1.5111083984375, -1.41326904296875, -1.3154296875, -1.21759033203125, -1.1197509765625, -1.02191162109375, -0.924072265625, -0.82623291015625, -0.7283935546875, -0.63055419921875, -0.53271484375, -0.43487548828125, -0.3370361328125, -0.23919677734375, -0.141357421875, -0.04351806640625, 0.0543212890625, 0.15216064453125, 0.25, 0.34783935546875, 0.4456787109375, 0.54351806640625, 0.641357421875, 0.73919677734375, 0.8370361328125, 0.93487548828125, 1.03271484375, 1.13055419921875, 1.2283935546875, 1.32623291015625, 1.424072265625, 1.52191162109375, 1.6197509765625, 1.71759033203125, 1.8154296875, 1.91326904296875, 2.0111083984375, 2.10894775390625, 2.206787109375, 2.30462646484375, 2.4024658203125, 2.50030517578125, 2.59814453125, 2.69598388671875, 2.7938232421875, 2.89166259765625, 2.989501953125, 3.08734130859375, 3.1851806640625, 3.28302001953125, 3.380859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 12.0, 23.0, 25.0, 30.0, 58.0, 108.0, 104.0, 182.0, 260.0, 356.0, 512.0, 715.0, 1056.0, 1539.0, 2535.0, 4010.0, 6432.0, 10534.0, 18245.0, 32099.0, 56521.0, 97346.0, 153518.0, 191573.0, 175283.0, 122160.0, 73006.0, 41126.0, 23498.0, 13708.0, 8093.0, 4831.0, 2976.0, 1994.0, 1292.0, 853.0, 552.0, 412.0, 278.0, 207.0, 160.0, 96.0, 80.0, 43.0, 35.0, 33.0, 15.0, 15.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.72265625, -3.60150146484375, -3.4803466796875, -3.35919189453125, -3.238037109375, -3.11688232421875, -2.9957275390625, -2.87457275390625, -2.75341796875, -2.63226318359375, -2.5111083984375, -2.38995361328125, -2.268798828125, -2.14764404296875, -2.0264892578125, -1.90533447265625, -1.7841796875, -1.66302490234375, -1.5418701171875, -1.42071533203125, -1.299560546875, -1.17840576171875, -1.0572509765625, -0.93609619140625, -0.81494140625, -0.69378662109375, -0.5726318359375, -0.45147705078125, -0.330322265625, -0.20916748046875, -0.0880126953125, 0.03314208984375, 0.154296875, 0.27545166015625, 0.3966064453125, 0.51776123046875, 0.638916015625, 0.76007080078125, 0.8812255859375, 1.00238037109375, 1.12353515625, 1.24468994140625, 1.3658447265625, 1.48699951171875, 1.608154296875, 1.72930908203125, 1.8504638671875, 1.97161865234375, 2.0927734375, 2.21392822265625, 2.3350830078125, 2.45623779296875, 2.577392578125, 2.69854736328125, 2.8197021484375, 2.94085693359375, 3.06201171875, 3.18316650390625, 3.3043212890625, 3.42547607421875, 3.546630859375, 3.66778564453125, 3.7889404296875, 3.91009521484375, 4.03125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 9.0, 7.0, 12.0, 12.0, 30.0, 28.0, 36.0, 50.0, 63.0, 64.0, 67.0, 62.0, 79.0, 76.0, 64.0, 56.0, 58.0, 47.0, 36.0, 33.0, 18.0, 20.0, 13.0, 8.0, 5.0, 9.0, 4.0, 9.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004787445068359375, -0.00046315044164657593, -0.00044755637645721436, -0.0004319623112678528, -0.0004163682460784912, -0.00040077418088912964, -0.00038518011569976807, -0.0003695860505104065, -0.0003539919853210449, -0.00033839792013168335, -0.0003228038549423218, -0.0003072097897529602, -0.00029161572456359863, -0.00027602165937423706, -0.0002604275941848755, -0.0002448335289955139, -0.00022923946380615234, -0.00021364539861679077, -0.0001980513334274292, -0.00018245726823806763, -0.00016686320304870605, -0.00015126913785934448, -0.0001356750726699829, -0.00012008100748062134, -0.00010448694229125977, -8.88928771018982e-05, -7.329881191253662e-05, -5.770474672317505e-05, -4.2110681533813477e-05, -2.6516616344451904e-05, -1.0922551155090332e-05, 4.67151403427124e-06, 2.0265579223632812e-05, 3.5859644412994385e-05, 5.145370960235596e-05, 6.704777479171753e-05, 8.26418399810791e-05, 9.823590517044067e-05, 0.00011382997035980225, 0.00012942403554916382, 0.0001450181007385254, 0.00016061216592788696, 0.00017620623111724854, 0.0001918002963066101, 0.00020739436149597168, 0.00022298842668533325, 0.00023858249187469482, 0.0002541765570640564, 0.00026977062225341797, 0.00028536468744277954, 0.0003009587526321411, 0.0003165528178215027, 0.00033214688301086426, 0.00034774094820022583, 0.0003633350133895874, 0.000378929078578949, 0.00039452314376831055, 0.0004101172089576721, 0.0004257112741470337, 0.00044130533933639526, 0.00045689940452575684, 0.0004724934697151184, 0.00048808753490448, 0.0005036816000938416, 0.0005192756652832031]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 9.0, 14.0, 16.0, 27.0, 47.0, 63.0, 117.0, 168.0, 227.0, 347.0, 511.0, 832.0, 1167.0, 1719.0, 2638.0, 3859.0, 6285.0, 9355.0, 14518.0, 22585.0, 35245.0, 54221.0, 79880.0, 111077.0, 137046.0, 143709.0, 127187.0, 98217.0, 68389.0, 45443.0, 29376.0, 18843.0, 12193.0, 7869.0, 5238.0, 3420.0, 2218.0, 1403.0, 1051.0, 688.0, 453.0, 292.0, 201.0, 134.0, 88.0, 58.0, 41.0, 24.0, 19.0, 12.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.67578125, -2.592926025390625, -2.51007080078125, -2.427215576171875, -2.3443603515625, -2.261505126953125, -2.17864990234375, -2.095794677734375, -2.012939453125, -1.930084228515625, -1.84722900390625, -1.764373779296875, -1.6815185546875, -1.598663330078125, -1.51580810546875, -1.432952880859375, -1.35009765625, -1.267242431640625, -1.18438720703125, -1.101531982421875, -1.0186767578125, -0.935821533203125, -0.85296630859375, -0.770111083984375, -0.687255859375, -0.604400634765625, -0.52154541015625, -0.438690185546875, -0.3558349609375, -0.272979736328125, -0.19012451171875, -0.107269287109375, -0.0244140625, 0.058441162109375, 0.14129638671875, 0.224151611328125, 0.3070068359375, 0.389862060546875, 0.47271728515625, 0.555572509765625, 0.638427734375, 0.721282958984375, 0.80413818359375, 0.886993408203125, 0.9698486328125, 1.052703857421875, 1.13555908203125, 1.218414306640625, 1.30126953125, 1.384124755859375, 1.46697998046875, 1.549835205078125, 1.6326904296875, 1.715545654296875, 1.79840087890625, 1.881256103515625, 1.964111328125, 2.046966552734375, 2.12982177734375, 2.212677001953125, 2.2955322265625, 2.378387451171875, 2.46124267578125, 2.544097900390625, 2.626953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 10.0, 7.0, 9.0, 12.0, 11.0, 15.0, 18.0, 34.0, 30.0, 33.0, 52.0, 52.0, 47.0, 45.0, 47.0, 55.0, 67.0, 62.0, 55.0, 41.0, 40.0, 38.0, 34.0, 32.0, 24.0, 21.0, 20.0, 20.0, 10.0, 13.0, 5.0, 8.0, 11.0, 6.0, 1.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.12109375, -1.08599853515625, -1.0509033203125, -1.01580810546875, -0.980712890625, -0.94561767578125, -0.9105224609375, -0.87542724609375, -0.84033203125, -0.80523681640625, -0.7701416015625, -0.73504638671875, -0.699951171875, -0.66485595703125, -0.6297607421875, -0.59466552734375, -0.5595703125, -0.52447509765625, -0.4893798828125, -0.45428466796875, -0.419189453125, -0.38409423828125, -0.3489990234375, -0.31390380859375, -0.27880859375, -0.24371337890625, -0.2086181640625, -0.17352294921875, -0.138427734375, -0.10333251953125, -0.0682373046875, -0.03314208984375, 0.001953125, 0.03704833984375, 0.0721435546875, 0.10723876953125, 0.142333984375, 0.17742919921875, 0.2125244140625, 0.24761962890625, 0.28271484375, 0.31781005859375, 0.3529052734375, 0.38800048828125, 0.423095703125, 0.45819091796875, 0.4932861328125, 0.52838134765625, 0.5634765625, 0.59857177734375, 0.6336669921875, 0.66876220703125, 0.703857421875, 0.73895263671875, 0.7740478515625, 0.80914306640625, 0.84423828125, 0.87933349609375, 0.9144287109375, 0.94952392578125, 0.984619140625, 1.01971435546875, 1.0548095703125, 1.08990478515625, 1.125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 8.0, 10.0, 12.0, 9.0, 12.0, 19.0, 18.0, 25.0, 23.0, 27.0, 29.0, 41.0, 54.0, 37.0, 43.0, 49.0, 56.0, 45.0, 39.0, 49.0, 40.0, 45.0, 39.0, 38.0, 25.0, 33.0, 28.0, 28.0, 17.0, 17.0, 19.0, 10.0, 8.0, 9.0, 5.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.244438648223877, -6.06928014755249, -5.8941216468811035, -5.718963146209717, -5.54380464553833, -5.368646621704102, -5.193488121032715, -5.018329620361328, -4.843171119689941, -4.668012619018555, -4.492854118347168, -4.317695617675781, -4.1425371170043945, -3.967378854751587, -3.7922203540802, -3.6170620918273926, -3.4419033527374268, -3.26674485206604, -3.0915863513946533, -2.9164280891418457, -2.741269588470459, -2.5661110877990723, -2.3909525871276855, -2.215794086456299, -2.040635585784912, -1.8654770851135254, -1.6903187036514282, -1.5151602029800415, -1.3400018215179443, -1.1648433208465576, -0.9896848201751709, -0.8145264387130737, -0.6393680572509766, -0.4642096161842346, -0.2890511453151703, -0.11389267444610596, 0.061265766620635986, 0.23642420768737793, 0.41158270835876465, 0.5867410898208618, 0.7618995904922485, 0.9370580315589905, 1.1122164726257324, 1.2873749732971191, 1.4625334739685059, 1.637691855430603, 1.8128503561019897, 1.988008737564087, 2.1631672382354736, 2.3383257389068604, 2.513484239578247, 2.6886425018310547, 2.8638010025024414, 3.038959503173828, 3.214118003845215, 3.3892765045166016, 3.5644350051879883, 3.739593505859375, 3.9147520065307617, 4.089910507202148, 4.265069007873535, 4.440227508544922, 4.615386009216309, 4.790544033050537, 4.965702533721924]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 6.0, 12.0, 8.0, 14.0, 22.0, 27.0, 10.0, 27.0, 32.0, 24.0, 31.0, 34.0, 33.0, 36.0, 37.0, 48.0, 50.0, 43.0, 59.0, 44.0, 43.0, 39.0, 47.0, 44.0, 33.0, 27.0, 24.0, 22.0, 16.0, 22.0, 14.0, 19.0, 14.0, 8.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.886569976806641, -5.693611145019531, -5.500651836395264, -5.307692527770996, -5.114733695983887, -4.921774864196777, -4.72881555557251, -4.535856246948242, -4.342897415161133, -4.149938583374023, -3.956979274749756, -3.7640202045440674, -3.571061134338379, -3.3781020641326904, -3.185142993927002, -2.9921839237213135, -2.799224853515625, -2.6062657833099365, -2.413306713104248, -2.2203476428985596, -2.027388572692871, -1.8344295024871826, -1.6414704322814941, -1.4485113620758057, -1.2555522918701172, -1.0625932216644287, -0.8696341514587402, -0.6766750812530518, -0.4837160110473633, -0.2907569408416748, -0.09779787063598633, 0.09516119956970215, 0.28812074661254883, 0.4810798168182373, 0.6740388870239258, 0.8669979572296143, 1.0599570274353027, 1.2529160976409912, 1.4458751678466797, 1.6388342380523682, 1.8317933082580566, 2.024752378463745, 2.2177114486694336, 2.410670518875122, 2.6036295890808105, 2.796588659286499, 2.9895477294921875, 3.182506799697876, 3.3754658699035645, 3.568424940109253, 3.7613840103149414, 3.95434308052063, 4.147302150726318, 4.340261459350586, 4.533220291137695, 4.726179122924805, 4.919138431549072, 5.11209774017334, 5.305056571960449, 5.498015403747559, 5.690974712371826, 5.883934020996094, 6.076892852783203, 6.2698516845703125, 6.46281099319458]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 6.0, 18.0, 14.0, 31.0, 47.0, 58.0, 90.0, 168.0, 197.0, 338.0, 536.0, 812.0, 1335.0, 2156.0, 3624.0, 6124.0, 10377.0, 17693.0, 32193.0, 56776.0, 101228.0, 175653.0, 293279.0, 446552.0, 596114.0, 664017.0, 603845.0, 456646.0, 301391.0, 180915.0, 104422.0, 57976.0, 33043.0, 19007.0, 10881.0, 6360.0, 3893.0, 2310.0, 1496.0, 903.0, 594.0, 384.0, 238.0, 186.0, 120.0, 79.0, 57.0, 41.0, 25.0, 13.0, 13.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-4.4765625, -4.3345947265625, -4.192626953125, -4.0506591796875, -3.90869140625, -3.7667236328125, -3.624755859375, -3.4827880859375, -3.3408203125, -3.1988525390625, -3.056884765625, -2.9149169921875, -2.77294921875, -2.6309814453125, -2.489013671875, -2.3470458984375, -2.205078125, -2.0631103515625, -1.921142578125, -1.7791748046875, -1.63720703125, -1.4952392578125, -1.353271484375, -1.2113037109375, -1.0693359375, -0.9273681640625, -0.785400390625, -0.6434326171875, -0.50146484375, -0.3594970703125, -0.217529296875, -0.0755615234375, 0.06640625, 0.2083740234375, 0.350341796875, 0.4923095703125, 0.63427734375, 0.7762451171875, 0.918212890625, 1.0601806640625, 1.2021484375, 1.3441162109375, 1.486083984375, 1.6280517578125, 1.77001953125, 1.9119873046875, 2.053955078125, 2.1959228515625, 2.337890625, 2.4798583984375, 2.621826171875, 2.7637939453125, 2.90576171875, 3.0477294921875, 3.189697265625, 3.3316650390625, 3.4736328125, 3.6156005859375, 3.757568359375, 3.8995361328125, 4.04150390625, 4.1834716796875, 4.325439453125, 4.4674072265625, 4.609375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 8.0, 4.0, 5.0, 9.0, 13.0, 11.0, 12.0, 13.0, 17.0, 15.0, 24.0, 28.0, 25.0, 29.0, 19.0, 31.0, 33.0, 40.0, 41.0, 36.0, 37.0, 36.0, 32.0, 48.0, 53.0, 32.0, 39.0, 25.0, 33.0, 33.0, 33.0, 27.0, 27.0, 16.0, 17.0, 24.0, 12.0, 12.0, 9.0, 10.0, 8.0, 8.0, 5.0, 4.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.44921875, -4.31085205078125, -4.1724853515625, -4.03411865234375, -3.895751953125, -3.75738525390625, -3.6190185546875, -3.48065185546875, -3.34228515625, -3.20391845703125, -3.0655517578125, -2.92718505859375, -2.788818359375, -2.65045166015625, -2.5120849609375, -2.37371826171875, -2.2353515625, -2.09698486328125, -1.9586181640625, -1.82025146484375, -1.681884765625, -1.54351806640625, -1.4051513671875, -1.26678466796875, -1.12841796875, -0.99005126953125, -0.8516845703125, -0.71331787109375, -0.574951171875, -0.43658447265625, -0.2982177734375, -0.15985107421875, -0.021484375, 0.11688232421875, 0.2552490234375, 0.39361572265625, 0.531982421875, 0.67034912109375, 0.8087158203125, 0.94708251953125, 1.08544921875, 1.22381591796875, 1.3621826171875, 1.50054931640625, 1.638916015625, 1.77728271484375, 1.9156494140625, 2.05401611328125, 2.1923828125, 2.33074951171875, 2.4691162109375, 2.60748291015625, 2.745849609375, 2.88421630859375, 3.0225830078125, 3.16094970703125, 3.29931640625, 3.43768310546875, 3.5760498046875, 3.71441650390625, 3.852783203125, 3.99114990234375, 4.1295166015625, 4.26788330078125, 4.40625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 6.0, 8.0, 7.0, 9.0, 14.0, 28.0, 39.0, 56.0, 91.0, 157.0, 232.0, 391.0, 697.0, 1066.0, 1911.0, 3358.0, 5669.0, 10184.0, 18077.0, 32065.0, 56394.0, 98827.0, 167830.0, 273063.0, 409480.0, 551340.0, 630967.0, 602585.0, 480681.0, 335709.0, 214298.0, 128008.0, 74068.0, 42032.0, 23622.0, 13400.0, 7596.0, 4298.0, 2491.0, 1436.0, 764.0, 514.0, 323.0, 156.0, 126.0, 73.0, 51.0, 34.0, 17.0, 14.0, 12.0, 11.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.91015625, -4.75042724609375, -4.5906982421875, -4.43096923828125, -4.271240234375, -4.11151123046875, -3.9517822265625, -3.79205322265625, -3.63232421875, -3.47259521484375, -3.3128662109375, -3.15313720703125, -2.993408203125, -2.83367919921875, -2.6739501953125, -2.51422119140625, -2.3544921875, -2.19476318359375, -2.0350341796875, -1.87530517578125, -1.715576171875, -1.55584716796875, -1.3961181640625, -1.23638916015625, -1.07666015625, -0.91693115234375, -0.7572021484375, -0.59747314453125, -0.437744140625, -0.27801513671875, -0.1182861328125, 0.04144287109375, 0.201171875, 0.36090087890625, 0.5206298828125, 0.68035888671875, 0.840087890625, 0.99981689453125, 1.1595458984375, 1.31927490234375, 1.47900390625, 1.63873291015625, 1.7984619140625, 1.95819091796875, 2.117919921875, 2.27764892578125, 2.4373779296875, 2.59710693359375, 2.7568359375, 2.91656494140625, 3.0762939453125, 3.23602294921875, 3.395751953125, 3.55548095703125, 3.7152099609375, 3.87493896484375, 4.03466796875, 4.19439697265625, 4.3541259765625, 4.51385498046875, 4.673583984375, 4.83331298828125, 4.9930419921875, 5.15277099609375, 5.3125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 10.0, 21.0, 12.0, 27.0, 33.0, 28.0, 36.0, 48.0, 80.0, 72.0, 84.0, 115.0, 138.0, 158.0, 176.0, 197.0, 178.0, 224.0, 213.0, 200.0, 242.0, 210.0, 211.0, 209.0, 178.0, 142.0, 165.0, 115.0, 100.0, 86.0, 66.0, 59.0, 50.0, 42.0, 27.0, 31.0, 20.0, 11.0, 9.0, 11.0, 6.0, 3.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-2.224609375, -2.1610870361328125, -2.097564697265625, -2.0340423583984375, -1.97052001953125, -1.9069976806640625, -1.843475341796875, -1.7799530029296875, -1.7164306640625, -1.6529083251953125, -1.589385986328125, -1.5258636474609375, -1.46234130859375, -1.3988189697265625, -1.335296630859375, -1.2717742919921875, -1.208251953125, -1.1447296142578125, -1.081207275390625, -1.0176849365234375, -0.95416259765625, -0.8906402587890625, -0.827117919921875, -0.7635955810546875, -0.7000732421875, -0.6365509033203125, -0.573028564453125, -0.5095062255859375, -0.44598388671875, -0.3824615478515625, -0.318939208984375, -0.2554168701171875, -0.19189453125, -0.1283721923828125, -0.064849853515625, -0.0013275146484375, 0.06219482421875, 0.1257171630859375, 0.189239501953125, 0.2527618408203125, 0.3162841796875, 0.3798065185546875, 0.443328857421875, 0.5068511962890625, 0.57037353515625, 0.6338958740234375, 0.697418212890625, 0.7609405517578125, 0.824462890625, 0.8879852294921875, 0.951507568359375, 1.0150299072265625, 1.07855224609375, 1.1420745849609375, 1.205596923828125, 1.2691192626953125, 1.3326416015625, 1.3961639404296875, 1.459686279296875, 1.5232086181640625, 1.58673095703125, 1.6502532958984375, 1.713775634765625, 1.7772979736328125, 1.8408203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 3.0, 4.0, 7.0, 7.0, 10.0, 14.0, 16.0, 19.0, 16.0, 13.0, 22.0, 22.0, 27.0, 44.0, 45.0, 45.0, 37.0, 53.0, 36.0, 49.0, 42.0, 44.0, 35.0, 45.0, 32.0, 37.0, 33.0, 40.0, 21.0, 24.0, 21.0, 21.0, 19.0, 21.0, 16.0, 4.0, 6.0, 9.0, 17.0, 2.0, 5.0, 4.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.722733020782471, -4.564280986785889, -4.405828475952148, -4.247376441955566, -4.088924407958984, -3.9304721355438232, -3.772019863128662, -3.61356782913208, -3.455115556716919, -3.296663284301758, -3.138211250305176, -2.9797589778900146, -2.8213067054748535, -2.6628546714782715, -2.5044023990631104, -2.345950126647949, -2.187498092651367, -2.029045820236206, -1.870593786239624, -1.712141513824463, -1.5536893606185913, -1.3952372074127197, -1.2367849349975586, -1.078332781791687, -0.9198806285858154, -0.7614284753799438, -0.6029762625694275, -0.4445240795612335, -0.28607189655303955, -0.12761974334716797, 0.03083246946334839, 0.18928468227386475, 0.34773731231689453, 0.5061894655227661, 0.6646416783332825, 0.8230938911437988, 0.9815460443496704, 1.139998197555542, 1.2984504699707031, 1.4569026231765747, 1.6153547763824463, 1.7738069295883179, 1.9322590827941895, 2.0907113552093506, 2.2491636276245117, 2.4076156616210938, 2.566067934036255, 2.724520206451416, 2.882972240447998, 3.041424512863159, 3.199876546859741, 3.3583288192749023, 3.5167808532714844, 3.6752331256866455, 3.8336853981018066, 3.9921374320983887, 4.150589942932129, 4.309041976928711, 4.467494487762451, 4.625946521759033, 4.784398555755615, 4.9428510665893555, 5.1013031005859375, 5.2597551345825195, 5.418207168579102]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 0.0, 3.0, 8.0, 8.0, 9.0, 15.0, 9.0, 8.0, 16.0, 14.0, 24.0, 27.0, 24.0, 25.0, 17.0, 36.0, 35.0, 31.0, 39.0, 34.0, 40.0, 43.0, 43.0, 43.0, 32.0, 35.0, 43.0, 28.0, 31.0, 44.0, 32.0, 34.0, 20.0, 21.0, 22.0, 9.0, 18.0, 18.0, 9.0, 12.0, 15.0, 8.0, 8.0, 6.0, 0.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.94888162612915, -4.793622970581055, -4.638364791870117, -4.4831061363220215, -4.327847480773926, -4.172589302062988, -4.017330646514893, -3.862071990966797, -3.7068135738372803, -3.5515551567077637, -3.396296501159668, -3.2410380840301514, -3.0857796669006348, -2.930521011352539, -2.7752625942230225, -2.620004177093506, -2.46474552154541, -2.3094871044158936, -2.154228448867798, -1.9989700317382812, -1.843711495399475, -1.688452959060669, -1.5331945419311523, -1.3779360055923462, -1.22267746925354, -1.0674189329147339, -0.9121604561805725, -0.7569019794464111, -0.601643443107605, -0.44638490676879883, -0.29112643003463745, -0.13586795330047607, 0.01939105987548828, 0.17464956641197205, 0.3299080729484558, 0.4851665794849396, 0.6404250860214233, 0.7956836223602295, 0.9509420990943909, 1.1062005758285522, 1.2614591121673584, 1.4167176485061646, 1.5719761848449707, 1.7272346019744873, 1.8824931383132935, 2.0377516746520996, 2.193010091781616, 2.348268508911133, 2.5035271644592285, 2.658785581588745, 2.814044237136841, 2.9693026542663574, 3.124561309814453, 3.2798197269439697, 3.4350781440734863, 3.590336799621582, 3.7455952167510986, 3.9008536338806152, 4.056112289428711, 4.211370944976807, 4.366629123687744, 4.52188777923584, 4.6771464347839355, 4.832404613494873, 4.987663269042969]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 8.0, 9.0, 19.0, 23.0, 24.0, 49.0, 62.0, 116.0, 137.0, 221.0, 325.0, 489.0, 707.0, 1052.0, 1510.0, 2324.0, 3426.0, 5198.0, 7846.0, 12447.0, 21384.0, 39623.0, 79994.0, 172806.0, 274175.0, 209037.0, 100701.0, 48225.0, 25172.0, 14752.0, 8920.0, 5796.0, 3838.0, 2668.0, 1830.0, 1189.0, 777.0, 516.0, 385.0, 259.0, 147.0, 113.0, 86.0, 59.0, 29.0, 25.0, 16.0, 11.0, 7.0, 2.0, 6.0, 4.0, 3.0, 1.0, 3.0], "bins": [-8.296875, -8.05029296875, -7.8037109375, -7.55712890625, -7.310546875, -7.06396484375, -6.8173828125, -6.57080078125, -6.32421875, -6.07763671875, -5.8310546875, -5.58447265625, -5.337890625, -5.09130859375, -4.8447265625, -4.59814453125, -4.3515625, -4.10498046875, -3.8583984375, -3.61181640625, -3.365234375, -3.11865234375, -2.8720703125, -2.62548828125, -2.37890625, -2.13232421875, -1.8857421875, -1.63916015625, -1.392578125, -1.14599609375, -0.8994140625, -0.65283203125, -0.40625, -0.15966796875, 0.0869140625, 0.33349609375, 0.580078125, 0.82666015625, 1.0732421875, 1.31982421875, 1.56640625, 1.81298828125, 2.0595703125, 2.30615234375, 2.552734375, 2.79931640625, 3.0458984375, 3.29248046875, 3.5390625, 3.78564453125, 4.0322265625, 4.27880859375, 4.525390625, 4.77197265625, 5.0185546875, 5.26513671875, 5.51171875, 5.75830078125, 6.0048828125, 6.25146484375, 6.498046875, 6.74462890625, 6.9912109375, 7.23779296875, 7.484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 7.0, 6.0, 7.0, 20.0, 15.0, 20.0, 18.0, 24.0, 28.0, 26.0, 20.0, 27.0, 35.0, 43.0, 50.0, 40.0, 45.0, 48.0, 34.0, 38.0, 50.0, 50.0, 38.0, 40.0, 21.0, 29.0, 39.0, 28.0, 22.0, 26.0, 18.0, 21.0, 11.0, 7.0, 15.0, 4.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37890625, -5.21234130859375, -5.0457763671875, -4.87921142578125, -4.712646484375, -4.54608154296875, -4.3795166015625, -4.21295166015625, -4.04638671875, -3.87982177734375, -3.7132568359375, -3.54669189453125, -3.380126953125, -3.21356201171875, -3.0469970703125, -2.88043212890625, -2.7138671875, -2.54730224609375, -2.3807373046875, -2.21417236328125, -2.047607421875, -1.88104248046875, -1.7144775390625, -1.54791259765625, -1.38134765625, -1.21478271484375, -1.0482177734375, -0.88165283203125, -0.715087890625, -0.54852294921875, -0.3819580078125, -0.21539306640625, -0.048828125, 0.11773681640625, 0.2843017578125, 0.45086669921875, 0.617431640625, 0.78399658203125, 0.9505615234375, 1.11712646484375, 1.28369140625, 1.45025634765625, 1.6168212890625, 1.78338623046875, 1.949951171875, 2.11651611328125, 2.2830810546875, 2.44964599609375, 2.6162109375, 2.78277587890625, 2.9493408203125, 3.11590576171875, 3.282470703125, 3.44903564453125, 3.6156005859375, 3.78216552734375, 3.94873046875, 4.11529541015625, 4.2818603515625, 4.44842529296875, 4.614990234375, 4.78155517578125, 4.9481201171875, 5.11468505859375, 5.28125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 13.0, 14.0, 14.0, 24.0, 29.0, 64.0, 77.0, 122.0, 172.0, 239.0, 397.0, 609.0, 846.0, 1283.0, 2001.0, 3176.0, 5118.0, 8183.0, 13334.0, 22909.0, 41660.0, 83434.0, 182658.0, 288451.0, 197270.0, 90491.0, 44429.0, 24419.0, 13791.0, 8574.0, 5147.0, 3414.0, 2143.0, 1380.0, 848.0, 581.0, 382.0, 286.0, 168.0, 124.0, 75.0, 54.0, 46.0, 37.0, 27.0, 6.0, 7.0, 10.0, 8.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.5390625, -8.2767333984375, -8.014404296875, -7.7520751953125, -7.48974609375, -7.2274169921875, -6.965087890625, -6.7027587890625, -6.4404296875, -6.1781005859375, -5.915771484375, -5.6534423828125, -5.39111328125, -5.1287841796875, -4.866455078125, -4.6041259765625, -4.341796875, -4.0794677734375, -3.817138671875, -3.5548095703125, -3.29248046875, -3.0301513671875, -2.767822265625, -2.5054931640625, -2.2431640625, -1.9808349609375, -1.718505859375, -1.4561767578125, -1.19384765625, -0.9315185546875, -0.669189453125, -0.4068603515625, -0.14453125, 0.1177978515625, 0.380126953125, 0.6424560546875, 0.90478515625, 1.1671142578125, 1.429443359375, 1.6917724609375, 1.9541015625, 2.2164306640625, 2.478759765625, 2.7410888671875, 3.00341796875, 3.2657470703125, 3.528076171875, 3.7904052734375, 4.052734375, 4.3150634765625, 4.577392578125, 4.8397216796875, 5.10205078125, 5.3643798828125, 5.626708984375, 5.8890380859375, 6.1513671875, 6.4136962890625, 6.676025390625, 6.9383544921875, 7.20068359375, 7.4630126953125, 7.725341796875, 7.9876708984375, 8.25]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 1.0, 2.0, 5.0, 8.0, 8.0, 9.0, 16.0, 24.0, 14.0, 25.0, 26.0, 25.0, 34.0, 37.0, 38.0, 29.0, 43.0, 35.0, 31.0, 41.0, 45.0, 37.0, 61.0, 54.0, 46.0, 30.0, 36.0, 36.0, 30.0, 27.0, 41.0, 20.0, 15.0, 19.0, 12.0, 10.0, 6.0, 9.0, 7.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.927734375, -3.808135986328125, -3.68853759765625, -3.568939208984375, -3.4493408203125, -3.329742431640625, -3.21014404296875, -3.090545654296875, -2.970947265625, -2.851348876953125, -2.73175048828125, -2.612152099609375, -2.4925537109375, -2.372955322265625, -2.25335693359375, -2.133758544921875, -2.01416015625, -1.894561767578125, -1.77496337890625, -1.655364990234375, -1.5357666015625, -1.416168212890625, -1.29656982421875, -1.176971435546875, -1.057373046875, -0.937774658203125, -0.81817626953125, -0.698577880859375, -0.5789794921875, -0.459381103515625, -0.33978271484375, -0.220184326171875, -0.1005859375, 0.019012451171875, 0.13861083984375, 0.258209228515625, 0.3778076171875, 0.497406005859375, 0.61700439453125, 0.736602783203125, 0.856201171875, 0.975799560546875, 1.09539794921875, 1.214996337890625, 1.3345947265625, 1.454193115234375, 1.57379150390625, 1.693389892578125, 1.81298828125, 1.932586669921875, 2.05218505859375, 2.171783447265625, 2.2913818359375, 2.410980224609375, 2.53057861328125, 2.650177001953125, 2.769775390625, 2.889373779296875, 3.00897216796875, 3.128570556640625, 3.2481689453125, 3.367767333984375, 3.48736572265625, 3.606964111328125, 3.7265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 4.0, 1.0, 7.0, 11.0, 12.0, 19.0, 24.0, 34.0, 57.0, 77.0, 88.0, 184.0, 273.0, 367.0, 523.0, 933.0, 1604.0, 2518.0, 4360.0, 8161.0, 17665.0, 49799.0, 274782.0, 540180.0, 95422.0, 26266.0, 11369.0, 5641.0, 3082.0, 1880.0, 1166.0, 695.0, 438.0, 300.0, 195.0, 135.0, 74.0, 51.0, 47.0, 36.0, 18.0, 15.0, 17.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 0.0, 3.0], "bins": [-10.15625, -9.8758544921875, -9.595458984375, -9.3150634765625, -9.03466796875, -8.7542724609375, -8.473876953125, -8.1934814453125, -7.9130859375, -7.6326904296875, -7.352294921875, -7.0718994140625, -6.79150390625, -6.5111083984375, -6.230712890625, -5.9503173828125, -5.669921875, -5.3895263671875, -5.109130859375, -4.8287353515625, -4.54833984375, -4.2679443359375, -3.987548828125, -3.7071533203125, -3.4267578125, -3.1463623046875, -2.865966796875, -2.5855712890625, -2.30517578125, -2.0247802734375, -1.744384765625, -1.4639892578125, -1.18359375, -0.9031982421875, -0.622802734375, -0.3424072265625, -0.06201171875, 0.2183837890625, 0.498779296875, 0.7791748046875, 1.0595703125, 1.3399658203125, 1.620361328125, 1.9007568359375, 2.18115234375, 2.4615478515625, 2.741943359375, 3.0223388671875, 3.302734375, 3.5831298828125, 3.863525390625, 4.1439208984375, 4.42431640625, 4.7047119140625, 4.985107421875, 5.2655029296875, 5.5458984375, 5.8262939453125, 6.106689453125, 6.3870849609375, 6.66748046875, 6.9478759765625, 7.228271484375, 7.5086669921875, 7.7890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 3.0, 5.0, 14.0, 29.0, 32.0, 52.0, 124.0, 276.0, 203.0, 106.0, 46.0, 20.0, 19.0, 8.0, 9.0, 3.0, 8.0, 6.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007257461547851562, -0.0007022172212600708, -0.0006786882877349854, -0.0006551593542098999, -0.0006316304206848145, -0.000608101487159729, -0.0005845725536346436, -0.0005610436201095581, -0.0005375146865844727, -0.0005139857530593872, -0.0004904568195343018, -0.0004669278860092163, -0.00044339895248413086, -0.0004198700189590454, -0.00039634108543395996, -0.0003728121519088745, -0.00034928321838378906, -0.0003257542848587036, -0.00030222535133361816, -0.0002786964178085327, -0.00025516748428344727, -0.00023163855075836182, -0.00020810961723327637, -0.00018458068370819092, -0.00016105175018310547, -0.00013752281665802002, -0.00011399388313293457, -9.046494960784912e-05, -6.693601608276367e-05, -4.340708255767822e-05, -1.9878149032592773e-05, 3.6507844924926758e-06, 2.7179718017578125e-05, 5.0708651542663574e-05, 7.423758506774902e-05, 9.776651859283447e-05, 0.00012129545211791992, 0.00014482438564300537, 0.00016835331916809082, 0.00019188225269317627, 0.00021541118621826172, 0.00023894011974334717, 0.0002624690532684326, 0.00028599798679351807, 0.0003095269203186035, 0.00033305585384368896, 0.0003565847873687744, 0.00038011372089385986, 0.0004036426544189453, 0.00042717158794403076, 0.0004507005214691162, 0.00047422945499420166, 0.0004977583885192871, 0.0005212873220443726, 0.000544816255569458, 0.0005683451890945435, 0.0005918741226196289, 0.0006154030561447144, 0.0006389319896697998, 0.0006624609231948853, 0.0006859898567199707, 0.0007095187902450562, 0.0007330477237701416, 0.000756576657295227, 0.0007801055908203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 12.0, 7.0, 13.0, 21.0, 27.0, 36.0, 54.0, 87.0, 116.0, 142.0, 216.0, 284.0, 429.0, 614.0, 868.0, 1315.0, 2131.0, 3684.0, 6275.0, 11623.0, 24288.0, 62583.0, 202996.0, 409724.0, 204709.0, 63415.0, 24634.0, 11931.0, 6266.0, 3584.0, 2163.0, 1353.0, 904.0, 629.0, 423.0, 292.0, 214.0, 141.0, 99.0, 75.0, 60.0, 26.0, 24.0, 20.0, 11.0, 10.0, 6.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-6.21484375, -6.017578125, -5.8203125, -5.623046875, -5.42578125, -5.228515625, -5.03125, -4.833984375, -4.63671875, -4.439453125, -4.2421875, -4.044921875, -3.84765625, -3.650390625, -3.453125, -3.255859375, -3.05859375, -2.861328125, -2.6640625, -2.466796875, -2.26953125, -2.072265625, -1.875, -1.677734375, -1.48046875, -1.283203125, -1.0859375, -0.888671875, -0.69140625, -0.494140625, -0.296875, -0.099609375, 0.09765625, 0.294921875, 0.4921875, 0.689453125, 0.88671875, 1.083984375, 1.28125, 1.478515625, 1.67578125, 1.873046875, 2.0703125, 2.267578125, 2.46484375, 2.662109375, 2.859375, 3.056640625, 3.25390625, 3.451171875, 3.6484375, 3.845703125, 4.04296875, 4.240234375, 4.4375, 4.634765625, 4.83203125, 5.029296875, 5.2265625, 5.423828125, 5.62109375, 5.818359375, 6.015625, 6.212890625, 6.41015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 10.0, 6.0, 5.0, 16.0, 18.0, 22.0, 24.0, 34.0, 47.0, 61.0, 76.0, 91.0, 102.0, 80.0, 83.0, 77.0, 42.0, 38.0, 29.0, 20.0, 21.0, 15.0, 11.0, 15.0, 5.0, 8.0, 2.0, 8.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7314453125, -1.6818084716796875, -1.632171630859375, -1.5825347900390625, -1.53289794921875, -1.4832611083984375, -1.433624267578125, -1.3839874267578125, -1.3343505859375, -1.2847137451171875, -1.235076904296875, -1.1854400634765625, -1.13580322265625, -1.0861663818359375, -1.036529541015625, -0.9868927001953125, -0.937255859375, -0.8876190185546875, -0.837982177734375, -0.7883453369140625, -0.73870849609375, -0.6890716552734375, -0.639434814453125, -0.5897979736328125, -0.5401611328125, -0.4905242919921875, -0.440887451171875, -0.3912506103515625, -0.34161376953125, -0.2919769287109375, -0.242340087890625, -0.1927032470703125, -0.14306640625, -0.0934295654296875, -0.043792724609375, 0.0058441162109375, 0.05548095703125, 0.1051177978515625, 0.154754638671875, 0.2043914794921875, 0.2540283203125, 0.3036651611328125, 0.353302001953125, 0.4029388427734375, 0.45257568359375, 0.5022125244140625, 0.551849365234375, 0.6014862060546875, 0.651123046875, 0.7007598876953125, 0.750396728515625, 0.8000335693359375, 0.84967041015625, 0.8993072509765625, 0.948944091796875, 0.9985809326171875, 1.0482177734375, 1.0978546142578125, 1.147491455078125, 1.1971282958984375, 1.24676513671875, 1.2964019775390625, 1.346038818359375, 1.3956756591796875, 1.4453125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 6.0, 5.0, 10.0, 3.0, 11.0, 8.0, 17.0, 18.0, 16.0, 28.0, 23.0, 29.0, 25.0, 33.0, 35.0, 39.0, 43.0, 41.0, 39.0, 35.0, 43.0, 52.0, 48.0, 51.0, 40.0, 39.0, 31.0, 25.0, 19.0, 24.0, 26.0, 26.0, 21.0, 13.0, 15.0, 9.0, 16.0, 7.0, 10.0, 5.0, 0.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.3656439781188965, -4.21091365814209, -4.056183815002441, -3.9014534950256348, -3.7467234134674072, -3.5919933319091797, -3.437263011932373, -3.2825329303741455, -3.127802848815918, -2.9730727672576904, -2.818342447280884, -2.6636123657226562, -2.5088822841644287, -2.354152202606201, -2.1994218826293945, -2.044691801071167, -1.8899614810943604, -1.7352312803268433, -1.5805011987686157, -1.4257709980010986, -1.271040916442871, -1.116310715675354, -0.9615805149078369, -0.8068504333496094, -0.6521202325820923, -0.49739009141921997, -0.34265992045402527, -0.18792974948883057, -0.03319960832595825, 0.12153053283691406, 0.27626073360443115, 0.4309908151626587, 0.5857210159301758, 0.7404511570930481, 0.8951812982559204, 1.0499114990234375, 1.204641580581665, 1.3593717813491821, 1.5141019821166992, 1.6688320636749268, 1.8235622644424438, 1.978292465209961, 2.1330225467681885, 2.287752628326416, 2.4424829483032227, 2.59721302986145, 2.7519431114196777, 2.9066734313964844, 3.061403512954712, 3.2161335945129395, 3.370863914489746, 3.5255939960479736, 3.680324077606201, 3.835054397583008, 3.9897844791412354, 4.144514560699463, 4.2992448806762695, 4.453975200653076, 4.608705043792725, 4.763435363769531, 4.918165683746338, 5.072895526885986, 5.227625846862793, 5.382355690002441, 5.537086009979248]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 8.0, 9.0, 13.0, 12.0, 9.0, 12.0, 21.0, 25.0, 18.0, 21.0, 28.0, 31.0, 26.0, 35.0, 31.0, 42.0, 36.0, 29.0, 43.0, 53.0, 40.0, 32.0, 36.0, 40.0, 41.0, 26.0, 31.0, 30.0, 40.0, 18.0, 29.0, 13.0, 16.0, 13.0, 18.0, 13.0, 12.0, 8.0, 7.0, 6.0, 10.0, 5.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.02628231048584, -4.877121448516846, -4.727960586547852, -4.578800201416016, -4.4296393394470215, -4.280478477478027, -4.131317615509033, -3.982156753540039, -3.832996129989624, -3.68383526802063, -3.534674644470215, -3.3855137825012207, -3.2363529205322266, -3.0871922969818115, -2.9380314350128174, -2.7888708114624023, -2.639709949493408, -2.490549087524414, -2.341388463973999, -2.192227602005005, -2.04306697845459, -1.8939061164855957, -1.7447452545166016, -1.595584511756897, -1.4464237689971924, -1.2972630262374878, -1.1481022834777832, -0.9989414215087891, -0.8497806787490845, -0.7006199359893799, -0.5514591336250305, -0.40229833126068115, -0.25313758850097656, -0.10397681593894958, 0.04518395662307739, 0.19434472918510437, 0.34350550174713135, 0.49266624450683594, 0.6418270468711853, 0.7909878492355347, 0.9401485919952393, 1.0893093347549438, 1.2384700775146484, 1.3876309394836426, 1.5367916822433472, 1.6859524250030518, 1.835113286972046, 1.9842740297317505, 2.133434772491455, 2.282595634460449, 2.4317562580108643, 2.5809171199798584, 2.7300777435302734, 2.8792386054992676, 3.0283994674682617, 3.177560329437256, 3.326720952987671, 3.475881814956665, 3.62504243850708, 3.774203300476074, 3.9233641624450684, 4.0725250244140625, 4.221685409545898, 4.370846271514893, 4.520007133483887]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 5.0, 7.0, 17.0, 21.0, 34.0, 39.0, 49.0, 82.0, 147.0, 241.0, 351.0, 573.0, 861.0, 1448.0, 2321.0, 3530.0, 5649.0, 8529.0, 12998.0, 19439.0, 28419.0, 39838.0, 54770.0, 71022.0, 87586.0, 100544.0, 107886.0, 105490.0, 96427.0, 81215.0, 64933.0, 48340.0, 34709.0, 24197.0, 16294.0, 10831.0, 7078.0, 4614.0, 3011.0, 1836.0, 1146.0, 712.0, 505.0, 309.0, 173.0, 119.0, 93.0, 41.0, 26.0, 20.0, 13.0, 13.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.13671875, -3.03143310546875, -2.9261474609375, -2.82086181640625, -2.715576171875, -2.61029052734375, -2.5050048828125, -2.39971923828125, -2.29443359375, -2.18914794921875, -2.0838623046875, -1.97857666015625, -1.873291015625, -1.76800537109375, -1.6627197265625, -1.55743408203125, -1.4521484375, -1.34686279296875, -1.2415771484375, -1.13629150390625, -1.031005859375, -0.92572021484375, -0.8204345703125, -0.71514892578125, -0.60986328125, -0.50457763671875, -0.3992919921875, -0.29400634765625, -0.188720703125, -0.08343505859375, 0.0218505859375, 0.12713623046875, 0.232421875, 0.33770751953125, 0.4429931640625, 0.54827880859375, 0.653564453125, 0.75885009765625, 0.8641357421875, 0.96942138671875, 1.07470703125, 1.17999267578125, 1.2852783203125, 1.39056396484375, 1.495849609375, 1.60113525390625, 1.7064208984375, 1.81170654296875, 1.9169921875, 2.02227783203125, 2.1275634765625, 2.23284912109375, 2.338134765625, 2.44342041015625, 2.5487060546875, 2.65399169921875, 2.75927734375, 2.86456298828125, 2.9698486328125, 3.07513427734375, 3.180419921875, 3.28570556640625, 3.3909912109375, 3.49627685546875, 3.6015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 5.0, 10.0, 8.0, 12.0, 10.0, 23.0, 18.0, 21.0, 20.0, 18.0, 24.0, 28.0, 29.0, 37.0, 26.0, 32.0, 42.0, 30.0, 40.0, 33.0, 45.0, 31.0, 31.0, 45.0, 34.0, 37.0, 32.0, 38.0, 33.0, 27.0, 28.0, 33.0, 14.0, 16.0, 15.0, 13.0, 11.0, 4.0, 12.0, 5.0, 8.0, 3.0, 3.0, 10.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.91796875, -4.7716064453125, -4.625244140625, -4.4788818359375, -4.33251953125, -4.1861572265625, -4.039794921875, -3.8934326171875, -3.7470703125, -3.6007080078125, -3.454345703125, -3.3079833984375, -3.16162109375, -3.0152587890625, -2.868896484375, -2.7225341796875, -2.576171875, -2.4298095703125, -2.283447265625, -2.1370849609375, -1.99072265625, -1.8443603515625, -1.697998046875, -1.5516357421875, -1.4052734375, -1.2589111328125, -1.112548828125, -0.9661865234375, -0.81982421875, -0.6734619140625, -0.527099609375, -0.3807373046875, -0.234375, -0.0880126953125, 0.058349609375, 0.2047119140625, 0.35107421875, 0.4974365234375, 0.643798828125, 0.7901611328125, 0.9365234375, 1.0828857421875, 1.229248046875, 1.3756103515625, 1.52197265625, 1.6683349609375, 1.814697265625, 1.9610595703125, 2.107421875, 2.2537841796875, 2.400146484375, 2.5465087890625, 2.69287109375, 2.8392333984375, 2.985595703125, 3.1319580078125, 3.2783203125, 3.4246826171875, 3.571044921875, 3.7174072265625, 3.86376953125, 4.0101318359375, 4.156494140625, 4.3028564453125, 4.44921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 8.0, 17.0, 18.0, 26.0, 42.0, 68.0, 129.0, 203.0, 328.0, 551.0, 966.0, 1693.0, 3011.0, 5359.0, 9531.0, 16741.0, 29001.0, 47934.0, 74772.0, 107171.0, 133977.0, 148504.0, 139922.0, 114496.0, 82204.0, 54183.0, 32712.0, 19312.0, 11318.0, 6168.0, 3483.0, 1960.0, 1161.0, 646.0, 383.0, 236.0, 129.0, 71.0, 44.0, 28.0, 27.0, 5.0, 7.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.462646484375, -4.31201171875, -4.161376953125, -4.0107421875, -3.860107421875, -3.70947265625, -3.558837890625, -3.408203125, -3.257568359375, -3.10693359375, -2.956298828125, -2.8056640625, -2.655029296875, -2.50439453125, -2.353759765625, -2.203125, -2.052490234375, -1.90185546875, -1.751220703125, -1.6005859375, -1.449951171875, -1.29931640625, -1.148681640625, -0.998046875, -0.847412109375, -0.69677734375, -0.546142578125, -0.3955078125, -0.244873046875, -0.09423828125, 0.056396484375, 0.20703125, 0.357666015625, 0.50830078125, 0.658935546875, 0.8095703125, 0.960205078125, 1.11083984375, 1.261474609375, 1.412109375, 1.562744140625, 1.71337890625, 1.864013671875, 2.0146484375, 2.165283203125, 2.31591796875, 2.466552734375, 2.6171875, 2.767822265625, 2.91845703125, 3.069091796875, 3.2197265625, 3.370361328125, 3.52099609375, 3.671630859375, 3.822265625, 3.972900390625, 4.12353515625, 4.274169921875, 4.4248046875, 4.575439453125, 4.72607421875, 4.876708984375, 5.02734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 4.0, 9.0, 10.0, 12.0, 16.0, 17.0, 18.0, 34.0, 19.0, 31.0, 23.0, 24.0, 31.0, 33.0, 30.0, 41.0, 37.0, 37.0, 38.0, 40.0, 38.0, 46.0, 36.0, 41.0, 45.0, 33.0, 41.0, 25.0, 31.0, 23.0, 17.0, 15.0, 14.0, 13.0, 10.0, 14.0, 12.0, 12.0, 7.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-3.484375, -3.385711669921875, -3.28704833984375, -3.188385009765625, -3.0897216796875, -2.991058349609375, -2.89239501953125, -2.793731689453125, -2.695068359375, -2.596405029296875, -2.49774169921875, -2.399078369140625, -2.3004150390625, -2.201751708984375, -2.10308837890625, -2.004425048828125, -1.90576171875, -1.807098388671875, -1.70843505859375, -1.609771728515625, -1.5111083984375, -1.412445068359375, -1.31378173828125, -1.215118408203125, -1.116455078125, -1.017791748046875, -0.91912841796875, -0.820465087890625, -0.7218017578125, -0.623138427734375, -0.52447509765625, -0.425811767578125, -0.3271484375, -0.228485107421875, -0.12982177734375, -0.031158447265625, 0.0675048828125, 0.166168212890625, 0.26483154296875, 0.363494873046875, 0.462158203125, 0.560821533203125, 0.65948486328125, 0.758148193359375, 0.8568115234375, 0.955474853515625, 1.05413818359375, 1.152801513671875, 1.25146484375, 1.350128173828125, 1.44879150390625, 1.547454833984375, 1.6461181640625, 1.744781494140625, 1.84344482421875, 1.942108154296875, 2.040771484375, 2.139434814453125, 2.23809814453125, 2.336761474609375, 2.4354248046875, 2.534088134765625, 2.63275146484375, 2.731414794921875, 2.830078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 7.0, 3.0, 5.0, 9.0, 16.0, 26.0, 36.0, 40.0, 76.0, 97.0, 145.0, 201.0, 284.0, 432.0, 609.0, 904.0, 1503.0, 2446.0, 3930.0, 6663.0, 11305.0, 19354.0, 33355.0, 54812.0, 86617.0, 123320.0, 152525.0, 157618.0, 134966.0, 97457.0, 63825.0, 39005.0, 23054.0, 13442.0, 7819.0, 4697.0, 2805.0, 1793.0, 1151.0, 695.0, 452.0, 379.0, 206.0, 154.0, 85.0, 72.0, 58.0, 34.0, 21.0, 22.0, 14.0, 6.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.421875, -2.344146728515625, -2.26641845703125, -2.188690185546875, -2.1109619140625, -2.033233642578125, -1.95550537109375, -1.877777099609375, -1.800048828125, -1.722320556640625, -1.64459228515625, -1.566864013671875, -1.4891357421875, -1.411407470703125, -1.33367919921875, -1.255950927734375, -1.17822265625, -1.100494384765625, -1.02276611328125, -0.945037841796875, -0.8673095703125, -0.789581298828125, -0.71185302734375, -0.634124755859375, -0.556396484375, -0.478668212890625, -0.40093994140625, -0.323211669921875, -0.2454833984375, -0.167755126953125, -0.09002685546875, -0.012298583984375, 0.0654296875, 0.143157958984375, 0.22088623046875, 0.298614501953125, 0.3763427734375, 0.454071044921875, 0.53179931640625, 0.609527587890625, 0.687255859375, 0.764984130859375, 0.84271240234375, 0.920440673828125, 0.9981689453125, 1.075897216796875, 1.15362548828125, 1.231353759765625, 1.30908203125, 1.386810302734375, 1.46453857421875, 1.542266845703125, 1.6199951171875, 1.697723388671875, 1.77545166015625, 1.853179931640625, 1.930908203125, 2.008636474609375, 2.08636474609375, 2.164093017578125, 2.2418212890625, 2.319549560546875, 2.39727783203125, 2.475006103515625, 2.552734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 11.0, 16.0, 10.0, 15.0, 22.0, 37.0, 35.0, 36.0, 47.0, 49.0, 74.0, 67.0, 74.0, 70.0, 75.0, 70.0, 60.0, 45.0, 35.0, 37.0, 27.0, 23.0, 18.0, 11.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00042819976806640625, -0.00041722506284713745, -0.00040625035762786865, -0.00039527565240859985, -0.00038430094718933105, -0.00037332624197006226, -0.00036235153675079346, -0.00035137683153152466, -0.00034040212631225586, -0.00032942742109298706, -0.00031845271587371826, -0.00030747801065444946, -0.00029650330543518066, -0.00028552860021591187, -0.00027455389499664307, -0.00026357918977737427, -0.00025260448455810547, -0.00024162977933883667, -0.00023065507411956787, -0.00021968036890029907, -0.00020870566368103027, -0.00019773095846176147, -0.00018675625324249268, -0.00017578154802322388, -0.00016480684280395508, -0.00015383213758468628, -0.00014285743236541748, -0.00013188272714614868, -0.00012090802192687988, -0.00010993331670761108, -9.895861148834229e-05, -8.798390626907349e-05, -7.700920104980469e-05, -6.603449583053589e-05, -5.505979061126709e-05, -4.408508539199829e-05, -3.311038017272949e-05, -2.2135674953460693e-05, -1.1160969734191895e-05, -1.862645149230957e-07, 1.0788440704345703e-05, 2.1763145923614502e-05, 3.27378511428833e-05, 4.37125563621521e-05, 5.46872615814209e-05, 6.56619668006897e-05, 7.66366720199585e-05, 8.76113772392273e-05, 9.85860824584961e-05, 0.00010956078767776489, 0.00012053549289703369, 0.0001315101981163025, 0.0001424849033355713, 0.0001534596085548401, 0.0001644343137741089, 0.00017540901899337769, 0.00018638372421264648, 0.00019735842943191528, 0.00020833313465118408, 0.00021930783987045288, 0.00023028254508972168, 0.00024125725030899048, 0.0002522319555282593, 0.0002632066607475281, 0.0002741813659667969]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 3.0, 9.0, 11.0, 12.0, 22.0, 29.0, 50.0, 71.0, 120.0, 180.0, 248.0, 417.0, 604.0, 919.0, 1397.0, 2142.0, 3183.0, 4790.0, 7530.0, 11168.0, 16766.0, 25368.0, 36721.0, 51947.0, 71029.0, 90855.0, 107273.0, 116229.0, 113721.0, 101400.0, 82506.0, 62376.0, 45023.0, 31441.0, 21291.0, 14296.0, 9398.0, 6088.0, 4112.0, 2632.0, 1696.0, 1184.0, 735.0, 530.0, 333.0, 227.0, 170.0, 92.0, 83.0, 49.0, 36.0, 20.0, 9.0, 12.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.818359375, -1.7611541748046875, -1.703948974609375, -1.6467437744140625, -1.58953857421875, -1.5323333740234375, -1.475128173828125, -1.4179229736328125, -1.3607177734375, -1.3035125732421875, -1.246307373046875, -1.1891021728515625, -1.13189697265625, -1.0746917724609375, -1.017486572265625, -0.9602813720703125, -0.903076171875, -0.8458709716796875, -0.788665771484375, -0.7314605712890625, -0.67425537109375, -0.6170501708984375, -0.559844970703125, -0.5026397705078125, -0.4454345703125, -0.3882293701171875, -0.331024169921875, -0.2738189697265625, -0.21661376953125, -0.1594085693359375, -0.102203369140625, -0.0449981689453125, 0.01220703125, 0.0694122314453125, 0.126617431640625, 0.1838226318359375, 0.24102783203125, 0.2982330322265625, 0.355438232421875, 0.4126434326171875, 0.4698486328125, 0.5270538330078125, 0.584259033203125, 0.6414642333984375, 0.69866943359375, 0.7558746337890625, 0.813079833984375, 0.8702850341796875, 0.927490234375, 0.9846954345703125, 1.041900634765625, 1.0991058349609375, 1.15631103515625, 1.2135162353515625, 1.270721435546875, 1.3279266357421875, 1.3851318359375, 1.4423370361328125, 1.499542236328125, 1.5567474365234375, 1.61395263671875, 1.6711578369140625, 1.728363037109375, 1.7855682373046875, 1.8427734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 4.0, 10.0, 10.0, 10.0, 11.0, 20.0, 20.0, 24.0, 27.0, 35.0, 27.0, 36.0, 29.0, 32.0, 48.0, 38.0, 46.0, 49.0, 58.0, 41.0, 47.0, 41.0, 43.0, 49.0, 25.0, 29.0, 33.0, 13.0, 16.0, 24.0, 15.0, 14.0, 10.0, 11.0, 5.0, 9.0, 10.0, 4.0, 10.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.845703125, -0.8206939697265625, -0.795684814453125, -0.7706756591796875, -0.74566650390625, -0.7206573486328125, -0.695648193359375, -0.6706390380859375, -0.6456298828125, -0.6206207275390625, -0.595611572265625, -0.5706024169921875, -0.54559326171875, -0.5205841064453125, -0.495574951171875, -0.4705657958984375, -0.445556640625, -0.4205474853515625, -0.395538330078125, -0.3705291748046875, -0.34552001953125, -0.3205108642578125, -0.295501708984375, -0.2704925537109375, -0.2454833984375, -0.2204742431640625, -0.195465087890625, -0.1704559326171875, -0.14544677734375, -0.1204376220703125, -0.095428466796875, -0.0704193115234375, -0.04541015625, -0.0204010009765625, 0.004608154296875, 0.0296173095703125, 0.05462646484375, 0.0796356201171875, 0.104644775390625, 0.1296539306640625, 0.1546630859375, 0.1796722412109375, 0.204681396484375, 0.2296905517578125, 0.25469970703125, 0.2797088623046875, 0.304718017578125, 0.3297271728515625, 0.354736328125, 0.3797454833984375, 0.404754638671875, 0.4297637939453125, 0.45477294921875, 0.4797821044921875, 0.504791259765625, 0.5298004150390625, 0.5548095703125, 0.5798187255859375, 0.604827880859375, 0.6298370361328125, 0.65484619140625, 0.6798553466796875, 0.704864501953125, 0.7298736572265625, 0.7548828125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 10.0, 5.0, 8.0, 6.0, 9.0, 16.0, 11.0, 25.0, 17.0, 21.0, 19.0, 26.0, 27.0, 33.0, 33.0, 47.0, 39.0, 41.0, 35.0, 39.0, 45.0, 41.0, 38.0, 33.0, 38.0, 37.0, 32.0, 33.0, 20.0, 28.0, 28.0, 21.0, 17.0, 19.0, 18.0, 12.0, 13.0, 6.0, 13.0, 5.0, 11.0, 2.0, 2.0, 4.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.208166122436523, -4.067146301269531, -3.926126480102539, -3.785106658935547, -3.6440868377685547, -3.5030670166015625, -3.3620471954345703, -3.221027374267578, -3.080007553100586, -2.9389877319335938, -2.7979679107666016, -2.6569480895996094, -2.515928268432617, -2.374908447265625, -2.233888626098633, -2.0928688049316406, -1.9518489837646484, -1.8108291625976562, -1.669809341430664, -1.5287895202636719, -1.3877696990966797, -1.2467498779296875, -1.1057300567626953, -0.9647102355957031, -0.8236904144287109, -0.6826705932617188, -0.5416507720947266, -0.4006309509277344, -0.2596111297607422, -0.11859130859375, 0.022428512573242188, 0.16344833374023438, 0.30446815490722656, 0.44548797607421875, 0.5865077972412109, 0.7275276184082031, 0.8685474395751953, 1.0095672607421875, 1.1505870819091797, 1.2916069030761719, 1.432626724243164, 1.5736465454101562, 1.7146663665771484, 1.8556861877441406, 1.9967060089111328, 2.137725830078125, 2.278745651245117, 2.4197654724121094, 2.5607852935791016, 2.7018051147460938, 2.842824935913086, 2.983844757080078, 3.1248645782470703, 3.2658843994140625, 3.4069042205810547, 3.547924041748047, 3.688943862915039, 3.8299636840820312, 3.9709835052490234, 4.112003326416016, 4.253023147583008, 4.39404296875, 4.535062789916992, 4.676082611083984, 4.817102432250977]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 9.0, 13.0, 13.0, 21.0, 12.0, 14.0, 24.0, 23.0, 25.0, 32.0, 40.0, 26.0, 39.0, 45.0, 36.0, 32.0, 42.0, 38.0, 48.0, 45.0, 49.0, 35.0, 34.0, 35.0, 34.0, 29.0, 33.0, 20.0, 28.0, 18.0, 16.0, 13.0, 14.0, 8.0, 6.0, 8.0, 7.0, 4.0, 11.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.225409507751465, -5.069153785705566, -4.912898540496826, -4.756642818450928, -4.600387096405029, -4.444131374359131, -4.287876129150391, -4.131620407104492, -3.9753646850585938, -3.8191092014312744, -3.662853479385376, -3.5065979957580566, -3.350342273712158, -3.194086790084839, -3.0378313064575195, -2.881575584411621, -2.7253201007843018, -2.5690646171569824, -2.412808895111084, -2.2565534114837646, -2.100297689437866, -1.9440422058105469, -1.787786602973938, -1.631531000137329, -1.4752753973007202, -1.3190197944641113, -1.1627641916275024, -1.0065085887908936, -0.8502530455589294, -0.6939974427223206, -0.5377418994903564, -0.38148629665374756, -0.22523069381713867, -0.06897510588169098, 0.08728048205375671, 0.2435360550880432, 0.3997916579246521, 0.556047260761261, 0.7123028039932251, 0.868558406829834, 1.0248140096664429, 1.1810696125030518, 1.3373252153396606, 1.4935808181762695, 1.6498363018035889, 1.8060920238494873, 1.9623475074768066, 2.118603229522705, 2.2748587131500244, 2.4311141967773438, 2.587369918823242, 2.7436254024505615, 2.89988112449646, 3.0561366081237793, 3.2123923301696777, 3.368647813796997, 3.5249032974243164, 3.6811587810516357, 3.837414503097534, 3.9936699867248535, 4.149925708770752, 4.30618143081665, 4.462436676025391, 4.618692398071289, 4.7749481201171875]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 4.0, 7.0, 7.0, 14.0, 30.0, 52.0, 78.0, 107.0, 194.0, 318.0, 483.0, 746.0, 1198.0, 1924.0, 3332.0, 5399.0, 9243.0, 15439.0, 27321.0, 47224.0, 82410.0, 141939.0, 239183.0, 372571.0, 526423.0, 632674.0, 632057.0, 522028.0, 367902.0, 232897.0, 138560.0, 80402.0, 46132.0, 26244.0, 15606.0, 9143.0, 5453.0, 3360.0, 2112.0, 1424.0, 922.0, 591.0, 410.0, 260.0, 166.0, 96.0, 68.0, 47.0, 29.0, 31.0, 15.0, 11.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8203125, -3.69293212890625, -3.5655517578125, -3.43817138671875, -3.310791015625, -3.18341064453125, -3.0560302734375, -2.92864990234375, -2.80126953125, -2.67388916015625, -2.5465087890625, -2.41912841796875, -2.291748046875, -2.16436767578125, -2.0369873046875, -1.90960693359375, -1.7822265625, -1.65484619140625, -1.5274658203125, -1.40008544921875, -1.272705078125, -1.14532470703125, -1.0179443359375, -0.89056396484375, -0.76318359375, -0.63580322265625, -0.5084228515625, -0.38104248046875, -0.253662109375, -0.12628173828125, 0.0010986328125, 0.12847900390625, 0.255859375, 0.38323974609375, 0.5106201171875, 0.63800048828125, 0.765380859375, 0.89276123046875, 1.0201416015625, 1.14752197265625, 1.27490234375, 1.40228271484375, 1.5296630859375, 1.65704345703125, 1.784423828125, 1.91180419921875, 2.0391845703125, 2.16656494140625, 2.2939453125, 2.42132568359375, 2.5487060546875, 2.67608642578125, 2.803466796875, 2.93084716796875, 3.0582275390625, 3.18560791015625, 3.31298828125, 3.44036865234375, 3.5677490234375, 3.69512939453125, 3.822509765625, 3.94989013671875, 4.0772705078125, 4.20465087890625, 4.33203125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 10.0, 6.0, 8.0, 8.0, 11.0, 19.0, 13.0, 14.0, 14.0, 11.0, 22.0, 26.0, 27.0, 23.0, 28.0, 37.0, 24.0, 39.0, 32.0, 30.0, 33.0, 47.0, 32.0, 42.0, 38.0, 31.0, 44.0, 41.0, 29.0, 33.0, 32.0, 25.0, 22.0, 22.0, 17.0, 21.0, 15.0, 14.0, 8.0, 8.0, 7.0, 9.0, 9.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.595703125, -3.4844970703125, -3.373291015625, -3.2620849609375, -3.15087890625, -3.0396728515625, -2.928466796875, -2.8172607421875, -2.7060546875, -2.5948486328125, -2.483642578125, -2.3724365234375, -2.26123046875, -2.1500244140625, -2.038818359375, -1.9276123046875, -1.81640625, -1.7052001953125, -1.593994140625, -1.4827880859375, -1.37158203125, -1.2603759765625, -1.149169921875, -1.0379638671875, -0.9267578125, -0.8155517578125, -0.704345703125, -0.5931396484375, -0.48193359375, -0.3707275390625, -0.259521484375, -0.1483154296875, -0.037109375, 0.0740966796875, 0.185302734375, 0.2965087890625, 0.40771484375, 0.5189208984375, 0.630126953125, 0.7413330078125, 0.8525390625, 0.9637451171875, 1.074951171875, 1.1861572265625, 1.29736328125, 1.4085693359375, 1.519775390625, 1.6309814453125, 1.7421875, 1.8533935546875, 1.964599609375, 2.0758056640625, 2.18701171875, 2.2982177734375, 2.409423828125, 2.5206298828125, 2.6318359375, 2.7430419921875, 2.854248046875, 2.9654541015625, 3.07666015625, 3.1878662109375, 3.299072265625, 3.4102783203125, 3.521484375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 15.0, 27.0, 33.0, 54.0, 104.0, 158.0, 264.0, 436.0, 775.0, 1197.0, 2047.0, 3340.0, 5734.0, 9616.0, 16898.0, 27776.0, 47354.0, 78541.0, 125982.0, 199733.0, 299357.0, 416667.0, 523780.0, 571148.0, 536805.0, 437912.0, 319580.0, 216233.0, 138925.0, 86170.0, 52014.0, 30863.0, 18348.0, 10788.0, 6342.0, 3730.0, 2244.0, 1313.0, 811.0, 473.0, 261.0, 169.0, 99.0, 60.0, 35.0, 19.0, 20.0, 11.0, 11.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.09765625, -3.96795654296875, -3.8382568359375, -3.70855712890625, -3.578857421875, -3.44915771484375, -3.3194580078125, -3.18975830078125, -3.06005859375, -2.93035888671875, -2.8006591796875, -2.67095947265625, -2.541259765625, -2.41156005859375, -2.2818603515625, -2.15216064453125, -2.0224609375, -1.89276123046875, -1.7630615234375, -1.63336181640625, -1.503662109375, -1.37396240234375, -1.2442626953125, -1.11456298828125, -0.98486328125, -0.85516357421875, -0.7254638671875, -0.59576416015625, -0.466064453125, -0.33636474609375, -0.2066650390625, -0.07696533203125, 0.052734375, 0.18243408203125, 0.3121337890625, 0.44183349609375, 0.571533203125, 0.70123291015625, 0.8309326171875, 0.96063232421875, 1.09033203125, 1.22003173828125, 1.3497314453125, 1.47943115234375, 1.609130859375, 1.73883056640625, 1.8685302734375, 1.99822998046875, 2.1279296875, 2.25762939453125, 2.3873291015625, 2.51702880859375, 2.646728515625, 2.77642822265625, 2.9061279296875, 3.03582763671875, 3.16552734375, 3.29522705078125, 3.4249267578125, 3.55462646484375, 3.684326171875, 3.81402587890625, 3.9437255859375, 4.07342529296875, 4.203125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 8.0, 4.0, 10.0, 10.0, 13.0, 18.0, 18.0, 28.0, 25.0, 39.0, 29.0, 58.0, 69.0, 70.0, 92.0, 102.0, 116.0, 164.0, 166.0, 182.0, 172.0, 217.0, 219.0, 215.0, 213.0, 181.0, 194.0, 186.0, 158.0, 186.0, 153.0, 107.0, 126.0, 90.0, 72.0, 76.0, 59.0, 48.0, 39.0, 32.0, 23.0, 27.0, 21.0, 7.0, 8.0, 7.0, 4.0, 2.0, 5.0, 0.0, 4.0, 3.0, 2.0, 1.0], "bins": [-1.8408203125, -1.7875518798828125, -1.734283447265625, -1.6810150146484375, -1.62774658203125, -1.5744781494140625, -1.521209716796875, -1.4679412841796875, -1.4146728515625, -1.3614044189453125, -1.308135986328125, -1.2548675537109375, -1.20159912109375, -1.1483306884765625, -1.095062255859375, -1.0417938232421875, -0.988525390625, -0.9352569580078125, -0.881988525390625, -0.8287200927734375, -0.77545166015625, -0.7221832275390625, -0.668914794921875, -0.6156463623046875, -0.5623779296875, -0.5091094970703125, -0.455841064453125, -0.4025726318359375, -0.34930419921875, -0.2960357666015625, -0.242767333984375, -0.1894989013671875, -0.13623046875, -0.0829620361328125, -0.029693603515625, 0.0235748291015625, 0.07684326171875, 0.1301116943359375, 0.183380126953125, 0.2366485595703125, 0.2899169921875, 0.3431854248046875, 0.396453857421875, 0.4497222900390625, 0.50299072265625, 0.5562591552734375, 0.609527587890625, 0.6627960205078125, 0.716064453125, 0.7693328857421875, 0.822601318359375, 0.8758697509765625, 0.92913818359375, 0.9824066162109375, 1.035675048828125, 1.0889434814453125, 1.1422119140625, 1.1954803466796875, 1.248748779296875, 1.3020172119140625, 1.35528564453125, 1.4085540771484375, 1.461822509765625, 1.5150909423828125, 1.568359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 3.0, 4.0, 9.0, 4.0, 6.0, 17.0, 12.0, 20.0, 22.0, 27.0, 24.0, 27.0, 37.0, 36.0, 38.0, 34.0, 44.0, 45.0, 43.0, 50.0, 48.0, 32.0, 41.0, 45.0, 35.0, 35.0, 33.0, 23.0, 24.0, 40.0, 22.0, 21.0, 29.0, 14.0, 6.0, 9.0, 12.0, 4.0, 5.0, 7.0, 6.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.987844467163086, -3.8380789756774902, -3.6883134841918945, -3.538548231124878, -3.3887827396392822, -3.2390172481536865, -3.08925199508667, -2.939486503601074, -2.7897210121154785, -2.639955520629883, -2.490190029144287, -2.3404247760772705, -2.190659284591675, -2.040893793106079, -1.891128420829773, -1.7413630485534668, -1.591597557067871, -1.4418320655822754, -1.2920666933059692, -1.142301321029663, -0.9925358295440674, -0.8427703976631165, -0.6930049657821655, -0.5432395935058594, -0.39347410202026367, -0.24370867013931274, -0.09394323825836182, 0.05582219362258911, 0.20558762550354004, 0.35535305738449097, 0.5051184892654419, 0.654883861541748, 0.8046488761901855, 0.9544143080711365, 1.1041797399520874, 1.2539451122283936, 1.4037106037139893, 1.553476095199585, 1.7032414674758911, 1.8530068397521973, 2.002772331237793, 2.1525378227233887, 2.3023033142089844, 2.452068567276001, 2.6018340587615967, 2.7515995502471924, 2.901364803314209, 3.0511302947998047, 3.2008957862854004, 3.350661277770996, 3.500426769256592, 3.6501920223236084, 3.799957513809204, 3.9497230052948, 4.099488258361816, 4.249253749847412, 4.399019241333008, 4.5487847328186035, 4.698550224304199, 4.848315715789795, 4.998081207275391, 5.147846221923828, 5.297611713409424, 5.4473772048950195, 5.597142696380615]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 6.0, 13.0, 8.0, 11.0, 12.0, 17.0, 16.0, 18.0, 20.0, 21.0, 20.0, 23.0, 34.0, 30.0, 29.0, 47.0, 31.0, 36.0, 38.0, 37.0, 39.0, 57.0, 49.0, 46.0, 41.0, 44.0, 33.0, 28.0, 23.0, 26.0, 17.0, 26.0, 17.0, 15.0, 11.0, 9.0, 8.0, 5.0, 6.0, 10.0, 5.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.606178283691406, -4.466039657592773, -4.325901508331299, -4.185763359069824, -4.045624732971191, -3.9054863452911377, -3.765347957611084, -3.6252095699310303, -3.4850711822509766, -3.344932794570923, -3.204794406890869, -3.0646560192108154, -2.9245176315307617, -2.784379243850708, -2.6442408561706543, -2.5041024684906006, -2.363964080810547, -2.223825693130493, -2.0836873054504395, -1.9435489177703857, -1.803410530090332, -1.6632721424102783, -1.5231337547302246, -1.382995367050171, -1.2428569793701172, -1.1027185916900635, -0.9625802040100098, -0.822441816329956, -0.6823034286499023, -0.5421650409698486, -0.4020266532897949, -0.2618882656097412, -0.1217503547668457, 0.018388032913208008, 0.15852642059326172, 0.29866480827331543, 0.43880319595336914, 0.5789415836334229, 0.7190799713134766, 0.8592183589935303, 0.999356746673584, 1.1394951343536377, 1.2796335220336914, 1.4197719097137451, 1.5599102973937988, 1.7000486850738525, 1.8401870727539062, 1.98032546043396, 2.1204638481140137, 2.2606022357940674, 2.400740623474121, 2.540879011154175, 2.6810173988342285, 2.8211557865142822, 2.961294174194336, 3.1014325618743896, 3.2415709495544434, 3.381709337234497, 3.521847724914551, 3.6619861125946045, 3.802124500274658, 3.942262887954712, 4.082401275634766, 4.222539901733398, 4.362678050994873]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 9.0, 13.0, 16.0, 26.0, 54.0, 67.0, 103.0, 117.0, 199.0, 303.0, 414.0, 568.0, 885.0, 1286.0, 2013.0, 3088.0, 4571.0, 7164.0, 11508.0, 18394.0, 29188.0, 46955.0, 73001.0, 107186.0, 139515.0, 153943.0, 140115.0, 107054.0, 73157.0, 47137.0, 29541.0, 18387.0, 11420.0, 7266.0, 4792.0, 3093.0, 2011.0, 1270.0, 871.0, 589.0, 380.0, 280.0, 192.0, 124.0, 83.0, 69.0, 38.0, 32.0, 30.0, 9.0, 11.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0], "bins": [-2.7890625, -2.7032470703125, -2.617431640625, -2.5316162109375, -2.44580078125, -2.3599853515625, -2.274169921875, -2.1883544921875, -2.1025390625, -2.0167236328125, -1.930908203125, -1.8450927734375, -1.75927734375, -1.6734619140625, -1.587646484375, -1.5018310546875, -1.416015625, -1.3302001953125, -1.244384765625, -1.1585693359375, -1.07275390625, -0.9869384765625, -0.901123046875, -0.8153076171875, -0.7294921875, -0.6436767578125, -0.557861328125, -0.4720458984375, -0.38623046875, -0.3004150390625, -0.214599609375, -0.1287841796875, -0.04296875, 0.0428466796875, 0.128662109375, 0.2144775390625, 0.30029296875, 0.3861083984375, 0.471923828125, 0.5577392578125, 0.6435546875, 0.7293701171875, 0.815185546875, 0.9010009765625, 0.98681640625, 1.0726318359375, 1.158447265625, 1.2442626953125, 1.330078125, 1.4158935546875, 1.501708984375, 1.5875244140625, 1.67333984375, 1.7591552734375, 1.844970703125, 1.9307861328125, 2.0166015625, 2.1024169921875, 2.188232421875, 2.2740478515625, 2.35986328125, 2.4456787109375, 2.531494140625, 2.6173095703125, 2.703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 7.0, 10.0, 5.0, 10.0, 14.0, 14.0, 23.0, 18.0, 26.0, 22.0, 24.0, 21.0, 42.0, 33.0, 35.0, 45.0, 31.0, 41.0, 31.0, 55.0, 49.0, 49.0, 37.0, 46.0, 52.0, 34.0, 39.0, 19.0, 31.0, 21.0, 15.0, 17.0, 16.0, 13.0, 12.0, 9.0, 10.0, 5.0, 6.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.33984375, -5.18365478515625, -5.0274658203125, -4.87127685546875, -4.715087890625, -4.55889892578125, -4.4027099609375, -4.24652099609375, -4.09033203125, -3.93414306640625, -3.7779541015625, -3.62176513671875, -3.465576171875, -3.30938720703125, -3.1531982421875, -2.99700927734375, -2.8408203125, -2.68463134765625, -2.5284423828125, -2.37225341796875, -2.216064453125, -2.05987548828125, -1.9036865234375, -1.74749755859375, -1.59130859375, -1.43511962890625, -1.2789306640625, -1.12274169921875, -0.966552734375, -0.81036376953125, -0.6541748046875, -0.49798583984375, -0.341796875, -0.18560791015625, -0.0294189453125, 0.12677001953125, 0.282958984375, 0.43914794921875, 0.5953369140625, 0.75152587890625, 0.90771484375, 1.06390380859375, 1.2200927734375, 1.37628173828125, 1.532470703125, 1.68865966796875, 1.8448486328125, 2.00103759765625, 2.1572265625, 2.31341552734375, 2.4696044921875, 2.62579345703125, 2.781982421875, 2.93817138671875, 3.0943603515625, 3.25054931640625, 3.40673828125, 3.56292724609375, 3.7191162109375, 3.87530517578125, 4.031494140625, 4.18768310546875, 4.3438720703125, 4.50006103515625, 4.65625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 7.0, 10.0, 13.0, 30.0, 48.0, 57.0, 95.0, 132.0, 190.0, 236.0, 379.0, 590.0, 936.0, 1516.0, 2570.0, 4421.0, 8073.0, 15978.0, 33697.0, 72325.0, 152408.0, 253736.0, 240370.0, 135980.0, 63097.0, 29730.0, 14281.0, 7236.0, 4017.0, 2416.0, 1429.0, 888.0, 518.0, 390.0, 253.0, 164.0, 96.0, 75.0, 45.0, 28.0, 25.0, 19.0, 17.0, 7.0, 4.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.46875, -5.3026123046875, -5.136474609375, -4.9703369140625, -4.80419921875, -4.6380615234375, -4.471923828125, -4.3057861328125, -4.1396484375, -3.9735107421875, -3.807373046875, -3.6412353515625, -3.47509765625, -3.3089599609375, -3.142822265625, -2.9766845703125, -2.810546875, -2.6444091796875, -2.478271484375, -2.3121337890625, -2.14599609375, -1.9798583984375, -1.813720703125, -1.6475830078125, -1.4814453125, -1.3153076171875, -1.149169921875, -0.9830322265625, -0.81689453125, -0.6507568359375, -0.484619140625, -0.3184814453125, -0.15234375, 0.0137939453125, 0.179931640625, 0.3460693359375, 0.51220703125, 0.6783447265625, 0.844482421875, 1.0106201171875, 1.1767578125, 1.3428955078125, 1.509033203125, 1.6751708984375, 1.84130859375, 2.0074462890625, 2.173583984375, 2.3397216796875, 2.505859375, 2.6719970703125, 2.838134765625, 3.0042724609375, 3.17041015625, 3.3365478515625, 3.502685546875, 3.6688232421875, 3.8349609375, 4.0010986328125, 4.167236328125, 4.3333740234375, 4.49951171875, 4.6656494140625, 4.831787109375, 4.9979248046875, 5.1640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 4.0, 4.0, 12.0, 9.0, 9.0, 18.0, 20.0, 18.0, 22.0, 26.0, 27.0, 30.0, 32.0, 42.0, 42.0, 42.0, 36.0, 51.0, 44.0, 54.0, 44.0, 36.0, 51.0, 36.0, 37.0, 41.0, 37.0, 20.0, 26.0, 29.0, 22.0, 17.0, 12.0, 13.0, 13.0, 9.0, 3.0, 6.0, 7.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.455078125, -3.351348876953125, -3.24761962890625, -3.143890380859375, -3.0401611328125, -2.936431884765625, -2.83270263671875, -2.728973388671875, -2.625244140625, -2.521514892578125, -2.41778564453125, -2.314056396484375, -2.2103271484375, -2.106597900390625, -2.00286865234375, -1.899139404296875, -1.79541015625, -1.691680908203125, -1.58795166015625, -1.484222412109375, -1.3804931640625, -1.276763916015625, -1.17303466796875, -1.069305419921875, -0.965576171875, -0.861846923828125, -0.75811767578125, -0.654388427734375, -0.5506591796875, -0.446929931640625, -0.34320068359375, -0.239471435546875, -0.1357421875, -0.032012939453125, 0.07171630859375, 0.175445556640625, 0.2791748046875, 0.382904052734375, 0.48663330078125, 0.590362548828125, 0.694091796875, 0.797821044921875, 0.90155029296875, 1.005279541015625, 1.1090087890625, 1.212738037109375, 1.31646728515625, 1.420196533203125, 1.52392578125, 1.627655029296875, 1.73138427734375, 1.835113525390625, 1.9388427734375, 2.042572021484375, 2.14630126953125, 2.250030517578125, 2.353759765625, 2.457489013671875, 2.56121826171875, 2.664947509765625, 2.7686767578125, 2.872406005859375, 2.97613525390625, 3.079864501953125, 3.18359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 10.0, 13.0, 8.0, 28.0, 38.0, 56.0, 62.0, 113.0, 147.0, 238.0, 362.0, 517.0, 768.0, 1327.0, 2216.0, 4035.0, 8319.0, 20704.0, 62961.0, 212315.0, 418183.0, 213671.0, 63284.0, 20815.0, 8335.0, 4133.0, 2224.0, 1301.0, 784.0, 526.0, 337.0, 209.0, 166.0, 102.0, 74.0, 46.0, 38.0, 28.0, 15.0, 17.0, 10.0, 8.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.10546875, -3.000213623046875, -2.89495849609375, -2.789703369140625, -2.6844482421875, -2.579193115234375, -2.47393798828125, -2.368682861328125, -2.263427734375, -2.158172607421875, -2.05291748046875, -1.947662353515625, -1.8424072265625, -1.737152099609375, -1.63189697265625, -1.526641845703125, -1.42138671875, -1.316131591796875, -1.21087646484375, -1.105621337890625, -1.0003662109375, -0.895111083984375, -0.78985595703125, -0.684600830078125, -0.579345703125, -0.474090576171875, -0.36883544921875, -0.263580322265625, -0.1583251953125, -0.053070068359375, 0.05218505859375, 0.157440185546875, 0.2626953125, 0.367950439453125, 0.47320556640625, 0.578460693359375, 0.6837158203125, 0.788970947265625, 0.89422607421875, 0.999481201171875, 1.104736328125, 1.209991455078125, 1.31524658203125, 1.420501708984375, 1.5257568359375, 1.631011962890625, 1.73626708984375, 1.841522216796875, 1.94677734375, 2.052032470703125, 2.15728759765625, 2.262542724609375, 2.3677978515625, 2.473052978515625, 2.57830810546875, 2.683563232421875, 2.788818359375, 2.894073486328125, 2.99932861328125, 3.104583740234375, 3.2098388671875, 3.315093994140625, 3.42034912109375, 3.525604248046875, 3.630859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 5.0, 17.0, 19.0, 27.0, 49.0, 68.0, 109.0, 135.0, 167.0, 125.0, 109.0, 70.0, 40.0, 19.0, 12.0, 12.0, 4.0, 8.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020360946655273438, -0.0001955777406692505, -0.0001875460147857666, -0.00017951428890228271, -0.00017148256301879883, -0.00016345083713531494, -0.00015541911125183105, -0.00014738738536834717, -0.00013935565948486328, -0.0001313239336013794, -0.0001232922077178955, -0.00011526048183441162, -0.00010722875595092773, -9.919703006744385e-05, -9.116530418395996e-05, -8.313357830047607e-05, -7.510185241699219e-05, -6.70701265335083e-05, -5.9038400650024414e-05, -5.100667476654053e-05, -4.297494888305664e-05, -3.4943222999572754e-05, -2.6911497116088867e-05, -1.887977123260498e-05, -1.0848045349121094e-05, -2.816319465637207e-06, 5.21540641784668e-06, 1.3247132301330566e-05, 2.1278858184814453e-05, 2.931058406829834e-05, 3.7342309951782227e-05, 4.537403583526611e-05, 5.340576171875e-05, 6.143748760223389e-05, 6.946921348571777e-05, 7.750093936920166e-05, 8.553266525268555e-05, 9.356439113616943e-05, 0.00010159611701965332, 0.00010962784290313721, 0.0001176595687866211, 0.00012569129467010498, 0.00013372302055358887, 0.00014175474643707275, 0.00014978647232055664, 0.00015781819820404053, 0.00016584992408752441, 0.0001738816499710083, 0.0001819133758544922, 0.00018994510173797607, 0.00019797682762145996, 0.00020600855350494385, 0.00021404027938842773, 0.00022207200527191162, 0.0002301037311553955, 0.0002381354570388794, 0.0002461671829223633, 0.00025419890880584717, 0.00026223063468933105, 0.00027026236057281494, 0.00027829408645629883, 0.0002863258123397827, 0.0002943575382232666, 0.0003023892641067505, 0.0003104209899902344]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 10.0, 13.0, 13.0, 20.0, 24.0, 29.0, 45.0, 69.0, 105.0, 167.0, 244.0, 383.0, 594.0, 1030.0, 1811.0, 3160.0, 6218.0, 13268.0, 29432.0, 72097.0, 168417.0, 283058.0, 248279.0, 125496.0, 51843.0, 21548.0, 9917.0, 4942.0, 2568.0, 1459.0, 841.0, 495.0, 319.0, 214.0, 129.0, 91.0, 73.0, 48.0, 30.0, 20.0, 7.0, 11.0, 6.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.666015625, -2.57659912109375, -2.4871826171875, -2.39776611328125, -2.308349609375, -2.21893310546875, -2.1295166015625, -2.04010009765625, -1.95068359375, -1.86126708984375, -1.7718505859375, -1.68243408203125, -1.593017578125, -1.50360107421875, -1.4141845703125, -1.32476806640625, -1.2353515625, -1.14593505859375, -1.0565185546875, -0.96710205078125, -0.877685546875, -0.78826904296875, -0.6988525390625, -0.60943603515625, -0.52001953125, -0.43060302734375, -0.3411865234375, -0.25177001953125, -0.162353515625, -0.07293701171875, 0.0164794921875, 0.10589599609375, 0.1953125, 0.28472900390625, 0.3741455078125, 0.46356201171875, 0.552978515625, 0.64239501953125, 0.7318115234375, 0.82122802734375, 0.91064453125, 1.00006103515625, 1.0894775390625, 1.17889404296875, 1.268310546875, 1.35772705078125, 1.4471435546875, 1.53656005859375, 1.6259765625, 1.71539306640625, 1.8048095703125, 1.89422607421875, 1.983642578125, 2.07305908203125, 2.1624755859375, 2.25189208984375, 2.34130859375, 2.43072509765625, 2.5201416015625, 2.60955810546875, 2.698974609375, 2.78839111328125, 2.8778076171875, 2.96722412109375, 3.056640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 8.0, 2.0, 2.0, 5.0, 4.0, 7.0, 9.0, 13.0, 18.0, 16.0, 26.0, 39.0, 54.0, 61.0, 60.0, 63.0, 65.0, 55.0, 77.0, 63.0, 66.0, 54.0, 55.0, 37.0, 33.0, 24.0, 22.0, 16.0, 14.0, 12.0, 8.0, 6.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.85400390625, -0.8295440673828125, -0.805084228515625, -0.7806243896484375, -0.75616455078125, -0.7317047119140625, -0.707244873046875, -0.6827850341796875, -0.6583251953125, -0.6338653564453125, -0.609405517578125, -0.5849456787109375, -0.56048583984375, -0.5360260009765625, -0.511566162109375, -0.4871063232421875, -0.462646484375, -0.4381866455078125, -0.413726806640625, -0.3892669677734375, -0.36480712890625, -0.3403472900390625, -0.315887451171875, -0.2914276123046875, -0.2669677734375, -0.2425079345703125, -0.218048095703125, -0.1935882568359375, -0.16912841796875, -0.1446685791015625, -0.120208740234375, -0.0957489013671875, -0.0712890625, -0.0468292236328125, -0.022369384765625, 0.0020904541015625, 0.02655029296875, 0.0510101318359375, 0.075469970703125, 0.0999298095703125, 0.1243896484375, 0.1488494873046875, 0.173309326171875, 0.1977691650390625, 0.22222900390625, 0.2466888427734375, 0.271148681640625, 0.2956085205078125, 0.320068359375, 0.3445281982421875, 0.368988037109375, 0.3934478759765625, 0.41790771484375, 0.4423675537109375, 0.466827392578125, 0.4912872314453125, 0.5157470703125, 0.5402069091796875, 0.564666748046875, 0.5891265869140625, 0.61358642578125, 0.6380462646484375, 0.662506103515625, 0.6869659423828125, 0.71142578125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 11.0, 8.0, 4.0, 10.0, 9.0, 12.0, 23.0, 25.0, 16.0, 31.0, 29.0, 34.0, 22.0, 31.0, 30.0, 36.0, 49.0, 38.0, 38.0, 45.0, 43.0, 38.0, 36.0, 41.0, 44.0, 29.0, 28.0, 28.0, 27.0, 26.0, 38.0, 24.0, 18.0, 16.0, 10.0, 12.0, 5.0, 12.0, 3.0, 4.0, 8.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.637547492980957, -3.4985151290893555, -3.359483003616333, -3.2204508781433105, -3.081418514251709, -2.9423861503601074, -2.803354024887085, -2.6643218994140625, -2.525289535522461, -2.3862571716308594, -2.247225046157837, -2.1081929206848145, -1.969160556793213, -1.8301283121109009, -1.6910960674285889, -1.5520638227462769, -1.4130315780639648, -1.2739993333816528, -1.1349670886993408, -0.9959348440170288, -0.8569025993347168, -0.7178703546524048, -0.5788381099700928, -0.43980586528778076, -0.30077362060546875, -0.16174137592315674, -0.022709131240844727, 0.11632311344146729, 0.2553553581237793, 0.3943876028060913, 0.5334198474884033, 0.6724520921707153, 0.8114848136901855, 0.9505170583724976, 1.0895493030548096, 1.2285815477371216, 1.3676137924194336, 1.5066460371017456, 1.6456782817840576, 1.7847105264663696, 1.9237427711486816, 2.062775135040283, 2.2018072605133057, 2.340839385986328, 2.4798717498779297, 2.6189041137695312, 2.7579362392425537, 2.896968364715576, 3.0360007286071777, 3.1750330924987793, 3.3140652179718018, 3.453097343444824, 3.592129707336426, 3.7311620712280273, 3.87019419670105, 4.009226322174072, 4.148258686065674, 4.287291049957275, 4.426322937011719, 4.56535530090332, 4.704387664794922, 4.843420028686523, 4.982452392578125, 5.121484279632568, 5.26051664352417]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 12.0, 10.0, 11.0, 10.0, 11.0, 15.0, 25.0, 19.0, 16.0, 16.0, 36.0, 25.0, 33.0, 23.0, 44.0, 42.0, 28.0, 35.0, 31.0, 46.0, 49.0, 51.0, 55.0, 37.0, 39.0, 41.0, 35.0, 18.0, 19.0, 27.0, 19.0, 31.0, 16.0, 8.0, 8.0, 9.0, 8.0, 6.0, 8.0, 8.0, 6.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.497466564178467, -4.358645439147949, -4.219824314117432, -4.081003189086914, -3.9421818256378174, -3.8033607006073, -3.664539337158203, -3.5257182121276855, -3.386897087097168, -3.2480759620666504, -3.109254837036133, -2.970433473587036, -2.8316123485565186, -2.692791223526001, -2.5539698600769043, -2.4151487350463867, -2.276327610015869, -2.1375064849853516, -1.9986852407455444, -1.8598639965057373, -1.7210428714752197, -1.5822217464447021, -1.443400502204895, -1.304579257965088, -1.1657581329345703, -1.0269370079040527, -0.8881157636642456, -0.7492945790290833, -0.6104733943939209, -0.47165220975875854, -0.3328310251235962, -0.19400984048843384, -0.05518913269042969, 0.08363205194473267, 0.22245323657989502, 0.3612744212150574, 0.5000956058502197, 0.6389167904853821, 0.7777379751205444, 0.9165591597557068, 1.0553803443908691, 1.1942014694213867, 1.3330227136611938, 1.471843957901001, 1.6106650829315186, 1.7494862079620361, 1.8883074522018433, 2.0271286964416504, 2.165949821472168, 2.3047709465026855, 2.443592071533203, 2.5824134349823, 2.7212345600128174, 2.860055685043335, 2.9988770484924316, 3.137698173522949, 3.276519298553467, 3.4153404235839844, 3.554161548614502, 3.6929829120635986, 3.831804037094116, 3.970625162124634, 4.1094465255737305, 4.248267650604248, 4.387088775634766]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 5.0, 15.0, 31.0, 27.0, 48.0, 81.0, 124.0, 146.0, 287.0, 447.0, 708.0, 991.0, 1466.0, 2303.0, 3398.0, 5013.0, 7208.0, 10531.0, 15047.0, 21106.0, 28726.0, 38081.0, 49406.0, 61058.0, 72446.0, 82299.0, 88428.0, 90483.0, 88041.0, 80185.0, 70193.0, 58425.0, 46068.0, 35758.0, 26629.0, 19433.0, 14109.0, 9510.0, 6715.0, 4567.0, 3106.0, 2025.0, 1406.0, 891.0, 553.0, 378.0, 210.0, 176.0, 94.0, 62.0, 45.0, 26.0, 13.0, 15.0, 12.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-2.251953125, -2.177825927734375, -2.10369873046875, -2.029571533203125, -1.9554443359375, -1.881317138671875, -1.80718994140625, -1.733062744140625, -1.658935546875, -1.584808349609375, -1.51068115234375, -1.436553955078125, -1.3624267578125, -1.288299560546875, -1.21417236328125, -1.140045166015625, -1.06591796875, -0.991790771484375, -0.91766357421875, -0.843536376953125, -0.7694091796875, -0.695281982421875, -0.62115478515625, -0.547027587890625, -0.472900390625, -0.398773193359375, -0.32464599609375, -0.250518798828125, -0.1763916015625, -0.102264404296875, -0.02813720703125, 0.045989990234375, 0.1201171875, 0.194244384765625, 0.26837158203125, 0.342498779296875, 0.4166259765625, 0.490753173828125, 0.56488037109375, 0.639007568359375, 0.713134765625, 0.787261962890625, 0.86138916015625, 0.935516357421875, 1.0096435546875, 1.083770751953125, 1.15789794921875, 1.232025146484375, 1.30615234375, 1.380279541015625, 1.45440673828125, 1.528533935546875, 1.6026611328125, 1.676788330078125, 1.75091552734375, 1.825042724609375, 1.899169921875, 1.973297119140625, 2.04742431640625, 2.121551513671875, 2.1956787109375, 2.269805908203125, 2.34393310546875, 2.418060302734375, 2.4921875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 8.0, 6.0, 12.0, 6.0, 17.0, 9.0, 13.0, 17.0, 20.0, 15.0, 22.0, 34.0, 26.0, 23.0, 32.0, 33.0, 29.0, 36.0, 46.0, 40.0, 46.0, 45.0, 40.0, 45.0, 38.0, 46.0, 39.0, 31.0, 30.0, 23.0, 28.0, 19.0, 16.0, 21.0, 16.0, 15.0, 14.0, 12.0, 11.0, 2.0, 5.0, 3.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0], "bins": [-4.98828125, -4.8460693359375, -4.703857421875, -4.5616455078125, -4.41943359375, -4.2772216796875, -4.135009765625, -3.9927978515625, -3.8505859375, -3.7083740234375, -3.566162109375, -3.4239501953125, -3.28173828125, -3.1395263671875, -2.997314453125, -2.8551025390625, -2.712890625, -2.5706787109375, -2.428466796875, -2.2862548828125, -2.14404296875, -2.0018310546875, -1.859619140625, -1.7174072265625, -1.5751953125, -1.4329833984375, -1.290771484375, -1.1485595703125, -1.00634765625, -0.8641357421875, -0.721923828125, -0.5797119140625, -0.4375, -0.2952880859375, -0.153076171875, -0.0108642578125, 0.13134765625, 0.2735595703125, 0.415771484375, 0.5579833984375, 0.7001953125, 0.8424072265625, 0.984619140625, 1.1268310546875, 1.26904296875, 1.4112548828125, 1.553466796875, 1.6956787109375, 1.837890625, 1.9801025390625, 2.122314453125, 2.2645263671875, 2.40673828125, 2.5489501953125, 2.691162109375, 2.8333740234375, 2.9755859375, 3.1177978515625, 3.260009765625, 3.4022216796875, 3.54443359375, 3.6866455078125, 3.828857421875, 3.9710693359375, 4.11328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 11.0, 7.0, 17.0, 19.0, 33.0, 60.0, 83.0, 121.0, 179.0, 237.0, 346.0, 555.0, 839.0, 1278.0, 1904.0, 2843.0, 4128.0, 6101.0, 8739.0, 12733.0, 18175.0, 25155.0, 34115.0, 44907.0, 57229.0, 70031.0, 80860.0, 88370.0, 92115.0, 90248.0, 84385.0, 74578.0, 62686.0, 50674.0, 38354.0, 28565.0, 20673.0, 14737.0, 10314.0, 7174.0, 4920.0, 3323.0, 2184.0, 1486.0, 1058.0, 664.0, 451.0, 288.0, 211.0, 149.0, 82.0, 67.0, 34.0, 29.0, 18.0, 13.0, 6.0, 3.0, 3.0], "bins": [-2.580078125, -2.5035400390625, -2.427001953125, -2.3504638671875, -2.27392578125, -2.1973876953125, -2.120849609375, -2.0443115234375, -1.9677734375, -1.8912353515625, -1.814697265625, -1.7381591796875, -1.66162109375, -1.5850830078125, -1.508544921875, -1.4320068359375, -1.35546875, -1.2789306640625, -1.202392578125, -1.1258544921875, -1.04931640625, -0.9727783203125, -0.896240234375, -0.8197021484375, -0.7431640625, -0.6666259765625, -0.590087890625, -0.5135498046875, -0.43701171875, -0.3604736328125, -0.283935546875, -0.2073974609375, -0.130859375, -0.0543212890625, 0.022216796875, 0.0987548828125, 0.17529296875, 0.2518310546875, 0.328369140625, 0.4049072265625, 0.4814453125, 0.5579833984375, 0.634521484375, 0.7110595703125, 0.78759765625, 0.8641357421875, 0.940673828125, 1.0172119140625, 1.09375, 1.1702880859375, 1.246826171875, 1.3233642578125, 1.39990234375, 1.4764404296875, 1.552978515625, 1.6295166015625, 1.7060546875, 1.7825927734375, 1.859130859375, 1.9356689453125, 2.01220703125, 2.0887451171875, 2.165283203125, 2.2418212890625, 2.318359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 1.0, 7.0, 3.0, 7.0, 8.0, 8.0, 12.0, 7.0, 8.0, 13.0, 14.0, 19.0, 25.0, 24.0, 31.0, 32.0, 28.0, 38.0, 41.0, 33.0, 47.0, 40.0, 39.0, 41.0, 38.0, 44.0, 34.0, 43.0, 39.0, 41.0, 29.0, 29.0, 22.0, 21.0, 25.0, 26.0, 11.0, 21.0, 12.0, 10.0, 14.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 5.0], "bins": [-3.41015625, -3.315185546875, -3.22021484375, -3.125244140625, -3.0302734375, -2.935302734375, -2.84033203125, -2.745361328125, -2.650390625, -2.555419921875, -2.46044921875, -2.365478515625, -2.2705078125, -2.175537109375, -2.08056640625, -1.985595703125, -1.890625, -1.795654296875, -1.70068359375, -1.605712890625, -1.5107421875, -1.415771484375, -1.32080078125, -1.225830078125, -1.130859375, -1.035888671875, -0.94091796875, -0.845947265625, -0.7509765625, -0.656005859375, -0.56103515625, -0.466064453125, -0.37109375, -0.276123046875, -0.18115234375, -0.086181640625, 0.0087890625, 0.103759765625, 0.19873046875, 0.293701171875, 0.388671875, 0.483642578125, 0.57861328125, 0.673583984375, 0.7685546875, 0.863525390625, 0.95849609375, 1.053466796875, 1.1484375, 1.243408203125, 1.33837890625, 1.433349609375, 1.5283203125, 1.623291015625, 1.71826171875, 1.813232421875, 1.908203125, 2.003173828125, 2.09814453125, 2.193115234375, 2.2880859375, 2.383056640625, 2.47802734375, 2.572998046875, 2.66796875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 6.0, 5.0, 3.0, 5.0, 10.0, 15.0, 22.0, 39.0, 51.0, 66.0, 107.0, 166.0, 247.0, 356.0, 636.0, 951.0, 1473.0, 2477.0, 4085.0, 6846.0, 11106.0, 18385.0, 29065.0, 44862.0, 66551.0, 91714.0, 115704.0, 130785.0, 130163.0, 115177.0, 91217.0, 66431.0, 44764.0, 28815.0, 17961.0, 10793.0, 6739.0, 4148.0, 2474.0, 1464.0, 934.0, 602.0, 392.0, 245.0, 177.0, 112.0, 74.0, 52.0, 22.0, 23.0, 18.0, 11.0, 5.0, 4.0, 3.0, 6.0, 2.0, 3.0, 0.0, 2.0], "bins": [-1.552734375, -1.5041961669921875, -1.455657958984375, -1.4071197509765625, -1.35858154296875, -1.3100433349609375, -1.261505126953125, -1.2129669189453125, -1.1644287109375, -1.1158905029296875, -1.067352294921875, -1.0188140869140625, -0.97027587890625, -0.9217376708984375, -0.873199462890625, -0.8246612548828125, -0.776123046875, -0.7275848388671875, -0.679046630859375, -0.6305084228515625, -0.58197021484375, -0.5334320068359375, -0.484893798828125, -0.4363555908203125, -0.3878173828125, -0.3392791748046875, -0.290740966796875, -0.2422027587890625, -0.19366455078125, -0.1451263427734375, -0.096588134765625, -0.0480499267578125, 0.00048828125, 0.0490264892578125, 0.097564697265625, 0.1461029052734375, 0.19464111328125, 0.2431793212890625, 0.291717529296875, 0.3402557373046875, 0.3887939453125, 0.4373321533203125, 0.485870361328125, 0.5344085693359375, 0.58294677734375, 0.6314849853515625, 0.680023193359375, 0.7285614013671875, 0.777099609375, 0.8256378173828125, 0.874176025390625, 0.9227142333984375, 0.97125244140625, 1.0197906494140625, 1.068328857421875, 1.1168670654296875, 1.1654052734375, 1.2139434814453125, 1.262481689453125, 1.3110198974609375, 1.35955810546875, 1.4080963134765625, 1.456634521484375, 1.5051727294921875, 1.5537109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 12.0, 10.0, 12.0, 20.0, 19.0, 16.0, 24.0, 36.0, 40.0, 43.0, 37.0, 45.0, 52.0, 53.0, 41.0, 58.0, 50.0, 46.0, 39.0, 40.0, 40.0, 47.0, 35.0, 28.0, 21.0, 20.0, 15.0, 24.0, 11.0, 10.0, 13.0, 4.0, 8.0, 5.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00017261505126953125, -0.00016721338033676147, -0.0001618117094039917, -0.00015641003847122192, -0.00015100836753845215, -0.00014560669660568237, -0.0001402050256729126, -0.00013480335474014282, -0.00012940168380737305, -0.00012400001287460327, -0.0001185983419418335, -0.00011319667100906372, -0.00010779500007629395, -0.00010239332914352417, -9.69916582107544e-05, -9.158998727798462e-05, -8.618831634521484e-05, -8.078664541244507e-05, -7.538497447967529e-05, -6.998330354690552e-05, -6.458163261413574e-05, -5.917996168136597e-05, -5.377829074859619e-05, -4.8376619815826416e-05, -4.297494888305664e-05, -3.7573277950286865e-05, -3.217160701751709e-05, -2.6769936084747314e-05, -2.136826515197754e-05, -1.5966594219207764e-05, -1.0564923286437988e-05, -5.163252353668213e-06, 2.384185791015625e-07, 5.640089511871338e-06, 1.1041760444641113e-05, 1.644343137741089e-05, 2.1845102310180664e-05, 2.724677324295044e-05, 3.2648444175720215e-05, 3.805011510848999e-05, 4.3451786041259766e-05, 4.885345697402954e-05, 5.4255127906799316e-05, 5.965679883956909e-05, 6.505846977233887e-05, 7.046014070510864e-05, 7.586181163787842e-05, 8.12634825706482e-05, 8.666515350341797e-05, 9.206682443618774e-05, 9.746849536895752e-05, 0.0001028701663017273, 0.00010827183723449707, 0.00011367350816726685, 0.00011907517910003662, 0.0001244768500328064, 0.00012987852096557617, 0.00013528019189834595, 0.00014068186283111572, 0.0001460835337638855, 0.00015148520469665527, 0.00015688687562942505, 0.00016228854656219482, 0.0001676902174949646, 0.00017309188842773438]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 11.0, 16.0, 22.0, 40.0, 54.0, 84.0, 150.0, 219.0, 295.0, 463.0, 787.0, 1256.0, 1890.0, 3014.0, 4735.0, 7443.0, 11592.0, 17661.0, 26602.0, 38680.0, 54194.0, 72956.0, 91910.0, 106545.0, 115089.0, 111945.0, 99306.0, 81675.0, 62530.0, 45296.0, 31204.0, 21340.0, 14084.0, 9098.0, 5891.0, 3738.0, 2439.0, 1583.0, 912.0, 639.0, 412.0, 244.0, 170.0, 115.0, 73.0, 52.0, 32.0, 20.0, 15.0, 13.0, 4.0, 3.0, 2.0, 3.0, 4.0], "bins": [-1.4482421875, -1.405303955078125, -1.36236572265625, -1.319427490234375, -1.2764892578125, -1.233551025390625, -1.19061279296875, -1.147674560546875, -1.104736328125, -1.061798095703125, -1.01885986328125, -0.975921630859375, -0.9329833984375, -0.890045166015625, -0.84710693359375, -0.804168701171875, -0.76123046875, -0.718292236328125, -0.67535400390625, -0.632415771484375, -0.5894775390625, -0.546539306640625, -0.50360107421875, -0.460662841796875, -0.417724609375, -0.374786376953125, -0.33184814453125, -0.288909912109375, -0.2459716796875, -0.203033447265625, -0.16009521484375, -0.117156982421875, -0.07421875, -0.031280517578125, 0.01165771484375, 0.054595947265625, 0.0975341796875, 0.140472412109375, 0.18341064453125, 0.226348876953125, 0.269287109375, 0.312225341796875, 0.35516357421875, 0.398101806640625, 0.4410400390625, 0.483978271484375, 0.52691650390625, 0.569854736328125, 0.61279296875, 0.655731201171875, 0.69866943359375, 0.741607666015625, 0.7845458984375, 0.827484130859375, 0.87042236328125, 0.913360595703125, 0.956298828125, 0.999237060546875, 1.04217529296875, 1.085113525390625, 1.1280517578125, 1.170989990234375, 1.21392822265625, 1.256866455078125, 1.2998046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 7.0, 4.0, 2.0, 8.0, 10.0, 9.0, 11.0, 20.0, 19.0, 23.0, 17.0, 27.0, 24.0, 30.0, 41.0, 36.0, 36.0, 40.0, 45.0, 41.0, 51.0, 42.0, 42.0, 45.0, 49.0, 37.0, 42.0, 38.0, 37.0, 28.0, 24.0, 25.0, 21.0, 11.0, 15.0, 10.0, 5.0, 8.0, 2.0, 8.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.55224609375, -0.5341567993164062, -0.5160675048828125, -0.49797821044921875, -0.479888916015625, -0.46179962158203125, -0.4437103271484375, -0.42562103271484375, -0.40753173828125, -0.38944244384765625, -0.3713531494140625, -0.35326385498046875, -0.335174560546875, -0.31708526611328125, -0.2989959716796875, -0.28090667724609375, -0.2628173828125, -0.24472808837890625, -0.2266387939453125, -0.20854949951171875, -0.190460205078125, -0.17237091064453125, -0.1542816162109375, -0.13619232177734375, -0.11810302734375, -0.10001373291015625, -0.0819244384765625, -0.06383514404296875, -0.045745849609375, -0.02765655517578125, -0.0095672607421875, 0.00852203369140625, 0.026611328125, 0.04470062255859375, 0.0627899169921875, 0.08087921142578125, 0.098968505859375, 0.11705780029296875, 0.1351470947265625, 0.15323638916015625, 0.17132568359375, 0.18941497802734375, 0.2075042724609375, 0.22559356689453125, 0.243682861328125, 0.26177215576171875, 0.2798614501953125, 0.29795074462890625, 0.3160400390625, 0.33412933349609375, 0.3522186279296875, 0.37030792236328125, 0.388397216796875, 0.40648651123046875, 0.4245758056640625, 0.44266510009765625, 0.46075439453125, 0.47884368896484375, 0.4969329833984375, 0.5150222778320312, 0.533111572265625, 0.5512008666992188, 0.5692901611328125, 0.5873794555664062, 0.60546875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 8.0, 3.0, 12.0, 9.0, 13.0, 13.0, 15.0, 13.0, 19.0, 21.0, 29.0, 23.0, 38.0, 29.0, 34.0, 32.0, 37.0, 31.0, 35.0, 39.0, 42.0, 47.0, 42.0, 28.0, 40.0, 35.0, 30.0, 37.0, 34.0, 33.0, 21.0, 23.0, 19.0, 11.0, 16.0, 18.0, 8.0, 11.0, 14.0, 6.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-3.732205629348755, -3.602726697921753, -3.47324800491333, -3.343769073486328, -3.214290142059326, -3.084811210632324, -2.9553322792053223, -2.8258535861968994, -2.6963746547698975, -2.5668957233428955, -2.4374170303344727, -2.3079380989074707, -2.1784591674804688, -2.048980236053467, -1.9195014238357544, -1.790022611618042, -1.66054368019104, -1.531064748764038, -1.4015859365463257, -1.2721071243286133, -1.1426281929016113, -1.0131492614746094, -0.883670449256897, -0.7541915774345398, -0.6247127056121826, -0.49523383378982544, -0.36575496196746826, -0.23627609014511108, -0.1067972183227539, 0.02268165349960327, 0.15216052532196045, 0.2816393971443176, 0.4111180305480957, 0.5405969023704529, 0.6700757741928101, 0.7995546460151672, 0.9290335178375244, 1.0585124492645264, 1.1879912614822388, 1.3174700736999512, 1.4469490051269531, 1.576427936553955, 1.7059067487716675, 1.8353855609893799, 1.9648644924163818, 2.094343423843384, 2.2238221168518066, 2.3533010482788086, 2.4827799797058105, 2.6122589111328125, 2.7417378425598145, 2.8712165355682373, 3.0006954669952393, 3.130174398422241, 3.259653091430664, 3.389132022857666, 3.518610954284668, 3.64808988571167, 3.777568817138672, 3.9070475101470947, 4.036526679992676, 4.1660051345825195, 4.2954840660095215, 4.424962997436523, 4.554441928863525]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 8.0, 12.0, 8.0, 15.0, 9.0, 8.0, 18.0, 19.0, 15.0, 28.0, 19.0, 35.0, 25.0, 20.0, 36.0, 32.0, 37.0, 46.0, 37.0, 34.0, 40.0, 57.0, 49.0, 35.0, 42.0, 30.0, 27.0, 32.0, 29.0, 26.0, 25.0, 24.0, 11.0, 18.0, 11.0, 16.0, 14.0, 7.0, 7.0, 8.0, 10.0, 7.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.524530410766602, -4.389077663421631, -4.25362491607666, -4.118171691894531, -3.9827189445495605, -3.84726619720459, -3.71181321144104, -3.5763602256774902, -3.4409074783325195, -3.305454730987549, -3.170001745223999, -3.034548759460449, -2.8990960121154785, -2.763643264770508, -2.628190279006958, -2.492737293243408, -2.3572845458984375, -2.221831798553467, -2.086378812789917, -1.9509259462356567, -1.8154730796813965, -1.6800202131271362, -1.544567346572876, -1.4091144800186157, -1.2736616134643555, -1.1382087469100952, -1.002755880355835, -0.8673030138015747, -0.7318501472473145, -0.5963972806930542, -0.46094441413879395, -0.3254915475845337, -0.19003820419311523, -0.05458533763885498, 0.08086752891540527, 0.21632039546966553, 0.3517732620239258, 0.48722612857818604, 0.6226789951324463, 0.7581318616867065, 0.8935847282409668, 1.029037594795227, 1.1644904613494873, 1.2999433279037476, 1.4353961944580078, 1.570849061012268, 1.7063019275665283, 1.8417547941207886, 1.9772076606750488, 2.1126604080200195, 2.2481133937835693, 2.383566379547119, 2.51901912689209, 2.6544718742370605, 2.7899248600006104, 2.92537784576416, 3.060830593109131, 3.1962833404541016, 3.3317363262176514, 3.467189311981201, 3.602642059326172, 3.7380948066711426, 3.8735477924346924, 4.009000778198242, 4.144453525543213]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 6.0, 21.0, 24.0, 33.0, 56.0, 93.0, 138.0, 210.0, 326.0, 533.0, 888.0, 1497.0, 2391.0, 3966.0, 6727.0, 11668.0, 19611.0, 35101.0, 61735.0, 106885.0, 183045.0, 298578.0, 445509.0, 584223.0, 643693.0, 586537.0, 450065.0, 301344.0, 186367.0, 110105.0, 63576.0, 36956.0, 21438.0, 12405.0, 7354.0, 4413.0, 2644.0, 1492.0, 992.0, 613.0, 372.0, 248.0, 147.0, 101.0, 67.0, 35.0, 23.0, 9.0, 14.0, 7.0, 10.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.671875, -3.55157470703125, -3.4312744140625, -3.31097412109375, -3.190673828125, -3.07037353515625, -2.9500732421875, -2.82977294921875, -2.70947265625, -2.58917236328125, -2.4688720703125, -2.34857177734375, -2.228271484375, -2.10797119140625, -1.9876708984375, -1.86737060546875, -1.7470703125, -1.62677001953125, -1.5064697265625, -1.38616943359375, -1.265869140625, -1.14556884765625, -1.0252685546875, -0.90496826171875, -0.78466796875, -0.66436767578125, -0.5440673828125, -0.42376708984375, -0.303466796875, -0.18316650390625, -0.0628662109375, 0.05743408203125, 0.177734375, 0.29803466796875, 0.4183349609375, 0.53863525390625, 0.658935546875, 0.77923583984375, 0.8995361328125, 1.01983642578125, 1.14013671875, 1.26043701171875, 1.3807373046875, 1.50103759765625, 1.621337890625, 1.74163818359375, 1.8619384765625, 1.98223876953125, 2.1025390625, 2.22283935546875, 2.3431396484375, 2.46343994140625, 2.583740234375, 2.70404052734375, 2.8243408203125, 2.94464111328125, 3.06494140625, 3.18524169921875, 3.3055419921875, 3.42584228515625, 3.546142578125, 3.66644287109375, 3.7867431640625, 3.90704345703125, 4.02734375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 11.0, 6.0, 6.0, 13.0, 6.0, 15.0, 24.0, 17.0, 20.0, 25.0, 27.0, 32.0, 27.0, 28.0, 25.0, 37.0, 32.0, 43.0, 40.0, 53.0, 43.0, 52.0, 47.0, 34.0, 44.0, 24.0, 35.0, 25.0, 32.0, 27.0, 19.0, 22.0, 10.0, 17.0, 15.0, 13.0, 14.0, 6.0, 7.0, 6.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-4.18359375, -4.066131591796875, -3.94866943359375, -3.831207275390625, -3.7137451171875, -3.596282958984375, -3.47882080078125, -3.361358642578125, -3.243896484375, -3.126434326171875, -3.00897216796875, -2.891510009765625, -2.7740478515625, -2.656585693359375, -2.53912353515625, -2.421661376953125, -2.30419921875, -2.186737060546875, -2.06927490234375, -1.951812744140625, -1.8343505859375, -1.716888427734375, -1.59942626953125, -1.481964111328125, -1.364501953125, -1.247039794921875, -1.12957763671875, -1.012115478515625, -0.8946533203125, -0.777191162109375, -0.65972900390625, -0.542266845703125, -0.4248046875, -0.307342529296875, -0.18988037109375, -0.072418212890625, 0.0450439453125, 0.162506103515625, 0.27996826171875, 0.397430419921875, 0.514892578125, 0.632354736328125, 0.74981689453125, 0.867279052734375, 0.9847412109375, 1.102203369140625, 1.21966552734375, 1.337127685546875, 1.45458984375, 1.572052001953125, 1.68951416015625, 1.806976318359375, 1.9244384765625, 2.041900634765625, 2.15936279296875, 2.276824951171875, 2.394287109375, 2.511749267578125, 2.62921142578125, 2.746673583984375, 2.8641357421875, 2.981597900390625, 3.09906005859375, 3.216522216796875, 3.333984375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 5.0, 6.0, 11.0, 19.0, 41.0, 65.0, 84.0, 136.0, 242.0, 474.0, 878.0, 1607.0, 3001.0, 5676.0, 10636.0, 20011.0, 37686.0, 69814.0, 125545.0, 217356.0, 351700.0, 514227.0, 645264.0, 663240.0, 556642.0, 395176.0, 250532.0, 146386.0, 81859.0, 44735.0, 23909.0, 12749.0, 6656.0, 3636.0, 1942.0, 1093.0, 546.0, 307.0, 175.0, 99.0, 51.0, 29.0, 23.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.421875, -4.275146484375, -4.12841796875, -3.981689453125, -3.8349609375, -3.688232421875, -3.54150390625, -3.394775390625, -3.248046875, -3.101318359375, -2.95458984375, -2.807861328125, -2.6611328125, -2.514404296875, -2.36767578125, -2.220947265625, -2.07421875, -1.927490234375, -1.78076171875, -1.634033203125, -1.4873046875, -1.340576171875, -1.19384765625, -1.047119140625, -0.900390625, -0.753662109375, -0.60693359375, -0.460205078125, -0.3134765625, -0.166748046875, -0.02001953125, 0.126708984375, 0.2734375, 0.420166015625, 0.56689453125, 0.713623046875, 0.8603515625, 1.007080078125, 1.15380859375, 1.300537109375, 1.447265625, 1.593994140625, 1.74072265625, 1.887451171875, 2.0341796875, 2.180908203125, 2.32763671875, 2.474365234375, 2.62109375, 2.767822265625, 2.91455078125, 3.061279296875, 3.2080078125, 3.354736328125, 3.50146484375, 3.648193359375, 3.794921875, 3.941650390625, 4.08837890625, 4.235107421875, 4.3818359375, 4.528564453125, 4.67529296875, 4.822021484375, 4.96875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 5.0, 11.0, 7.0, 17.0, 15.0, 17.0, 26.0, 33.0, 41.0, 45.0, 65.0, 72.0, 82.0, 103.0, 131.0, 139.0, 164.0, 158.0, 202.0, 206.0, 187.0, 212.0, 212.0, 200.0, 242.0, 183.0, 173.0, 160.0, 143.0, 130.0, 127.0, 105.0, 80.0, 68.0, 60.0, 56.0, 49.0, 35.0, 25.0, 21.0, 19.0, 14.0, 12.0, 5.0, 2.0, 4.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.705078125, -1.653900146484375, -1.60272216796875, -1.551544189453125, -1.5003662109375, -1.449188232421875, -1.39801025390625, -1.346832275390625, -1.295654296875, -1.244476318359375, -1.19329833984375, -1.142120361328125, -1.0909423828125, -1.039764404296875, -0.98858642578125, -0.937408447265625, -0.88623046875, -0.835052490234375, -0.78387451171875, -0.732696533203125, -0.6815185546875, -0.630340576171875, -0.57916259765625, -0.527984619140625, -0.476806640625, -0.425628662109375, -0.37445068359375, -0.323272705078125, -0.2720947265625, -0.220916748046875, -0.16973876953125, -0.118560791015625, -0.0673828125, -0.016204833984375, 0.03497314453125, 0.086151123046875, 0.1373291015625, 0.188507080078125, 0.23968505859375, 0.290863037109375, 0.342041015625, 0.393218994140625, 0.44439697265625, 0.495574951171875, 0.5467529296875, 0.597930908203125, 0.64910888671875, 0.700286865234375, 0.75146484375, 0.802642822265625, 0.85382080078125, 0.904998779296875, 0.9561767578125, 1.007354736328125, 1.05853271484375, 1.109710693359375, 1.160888671875, 1.212066650390625, 1.26324462890625, 1.314422607421875, 1.3656005859375, 1.416778564453125, 1.46795654296875, 1.519134521484375, 1.5703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 1.0, 11.0, 2.0, 6.0, 16.0, 9.0, 18.0, 32.0, 26.0, 27.0, 39.0, 43.0, 38.0, 46.0, 35.0, 53.0, 59.0, 51.0, 57.0, 51.0, 49.0, 42.0, 42.0, 37.0, 42.0, 20.0, 21.0, 28.0, 16.0, 20.0, 9.0, 8.0, 15.0, 14.0, 3.0, 4.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.146299362182617, -3.979362964630127, -3.8124263286590576, -3.6454899311065674, -3.478553533554077, -3.311616897583008, -3.1446805000305176, -2.9777441024780273, -2.810807704925537, -2.643871307373047, -2.4769346714019775, -2.3099982738494873, -2.143061876296997, -1.9761253595352173, -1.8091888427734375, -1.6422524452209473, -1.475315809249878, -1.3083792924880981, -1.141442894935608, -0.9745063781738281, -0.8075699210166931, -0.6406334638595581, -0.4736969470977783, -0.3067605495452881, -0.1398240327835083, 0.027112439274787903, 0.1940489113330841, 0.3609853982925415, 0.5279218554496765, 0.6948583126068115, 0.8617948293685913, 1.0287312269210815, 1.1956677436828613, 1.3626042604446411, 1.5295406579971313, 1.6964771747589111, 1.8634135723114014, 2.0303502082824707, 2.197286605834961, 2.364223003387451, 2.5311594009399414, 2.6980957984924316, 2.865032434463501, 3.031968832015991, 3.1989052295684814, 3.365841865539551, 3.532778263092041, 3.6997146606445312, 3.8666512966156006, 4.03358793258667, 4.20052433013916, 4.36746072769165, 4.534397125244141, 4.701333522796631, 4.868269920349121, 5.0352067947387695, 5.20214319229126, 5.36907958984375, 5.53601598739624, 5.7029523849487305, 5.869889259338379, 6.036825656890869, 6.203762054443359, 6.37069845199585, 6.53763484954834]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 13.0, 6.0, 12.0, 12.0, 18.0, 21.0, 27.0, 23.0, 25.0, 26.0, 37.0, 32.0, 34.0, 39.0, 48.0, 45.0, 45.0, 55.0, 43.0, 47.0, 49.0, 24.0, 36.0, 41.0, 30.0, 28.0, 27.0, 25.0, 23.0, 15.0, 18.0, 15.0, 8.0, 8.0, 9.0, 11.0, 8.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.74122428894043, -4.5979461669921875, -4.4546685218811035, -4.311390399932861, -4.168112754821777, -4.024834632873535, -3.881556749343872, -3.738278865814209, -3.595000982284546, -3.451723098754883, -3.3084452152252197, -3.1651673316955566, -3.0218892097473145, -2.8786115646362305, -2.7353334426879883, -2.592055559158325, -2.448777675628662, -2.305499792098999, -2.162221908569336, -2.018944025039673, -1.8756660223007202, -1.7323881387710571, -1.5891101360321045, -1.4458322525024414, -1.3025543689727783, -1.1592764854431152, -1.0159986019134521, -0.8727205991744995, -0.7294427156448364, -0.5861648321151733, -0.4428868889808655, -0.2996089458465576, -0.15633106231689453, -0.013053148984909058, 0.13022476434707642, 0.2735026776790619, 0.41678059101104736, 0.5600584745407104, 0.7033364176750183, 0.8466143608093262, 0.9898922443389893, 1.1331701278686523, 1.2764480113983154, 1.419726014137268, 1.5630038976669312, 1.7062817811965942, 1.8495597839355469, 1.99283766746521, 2.136115550994873, 2.279393434524536, 2.422671318054199, 2.5659492015838623, 2.7092270851135254, 2.8525052070617676, 2.9957830905914307, 3.1390609741210938, 3.282338857650757, 3.42561674118042, 3.568894624710083, 3.712172508239746, 3.8554506301879883, 3.9987282752990723, 4.1420063972473145, 4.285284042358398, 4.428562164306641]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 8.0, 9.0, 10.0, 18.0, 24.0, 29.0, 33.0, 59.0, 82.0, 127.0, 165.0, 286.0, 448.0, 748.0, 1329.0, 2338.0, 4356.0, 8289.0, 15784.0, 31024.0, 57973.0, 102537.0, 156630.0, 191943.0, 178579.0, 128594.0, 78066.0, 42204.0, 22265.0, 11258.0, 5905.0, 3130.0, 1728.0, 906.0, 579.0, 354.0, 238.0, 153.0, 98.0, 62.0, 62.0, 41.0, 27.0, 12.0, 15.0, 8.0, 6.0, 3.0, 1.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.4453125, -2.36309814453125, -2.2808837890625, -2.19866943359375, -2.116455078125, -2.03424072265625, -1.9520263671875, -1.86981201171875, -1.78759765625, -1.70538330078125, -1.6231689453125, -1.54095458984375, -1.458740234375, -1.37652587890625, -1.2943115234375, -1.21209716796875, -1.1298828125, -1.04766845703125, -0.9654541015625, -0.88323974609375, -0.801025390625, -0.71881103515625, -0.6365966796875, -0.55438232421875, -0.47216796875, -0.38995361328125, -0.3077392578125, -0.22552490234375, -0.143310546875, -0.06109619140625, 0.0211181640625, 0.10333251953125, 0.185546875, 0.26776123046875, 0.3499755859375, 0.43218994140625, 0.514404296875, 0.59661865234375, 0.6788330078125, 0.76104736328125, 0.84326171875, 0.92547607421875, 1.0076904296875, 1.08990478515625, 1.172119140625, 1.25433349609375, 1.3365478515625, 1.41876220703125, 1.5009765625, 1.58319091796875, 1.6654052734375, 1.74761962890625, 1.829833984375, 1.91204833984375, 1.9942626953125, 2.07647705078125, 2.15869140625, 2.24090576171875, 2.3231201171875, 2.40533447265625, 2.487548828125, 2.56976318359375, 2.6519775390625, 2.73419189453125, 2.81640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 8.0, 8.0, 5.0, 16.0, 14.0, 18.0, 19.0, 17.0, 30.0, 25.0, 25.0, 38.0, 30.0, 30.0, 48.0, 41.0, 36.0, 41.0, 51.0, 48.0, 43.0, 43.0, 47.0, 32.0, 44.0, 36.0, 33.0, 22.0, 22.0, 24.0, 16.0, 10.0, 17.0, 10.0, 6.0, 10.0, 7.0, 9.0, 8.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.765625, -4.61920166015625, -4.4727783203125, -4.32635498046875, -4.179931640625, -4.03350830078125, -3.8870849609375, -3.74066162109375, -3.59423828125, -3.44781494140625, -3.3013916015625, -3.15496826171875, -3.008544921875, -2.86212158203125, -2.7156982421875, -2.56927490234375, -2.4228515625, -2.27642822265625, -2.1300048828125, -1.98358154296875, -1.837158203125, -1.69073486328125, -1.5443115234375, -1.39788818359375, -1.25146484375, -1.10504150390625, -0.9586181640625, -0.81219482421875, -0.665771484375, -0.51934814453125, -0.3729248046875, -0.22650146484375, -0.080078125, 0.06634521484375, 0.2127685546875, 0.35919189453125, 0.505615234375, 0.65203857421875, 0.7984619140625, 0.94488525390625, 1.09130859375, 1.23773193359375, 1.3841552734375, 1.53057861328125, 1.677001953125, 1.82342529296875, 1.9698486328125, 2.11627197265625, 2.2626953125, 2.40911865234375, 2.5555419921875, 2.70196533203125, 2.848388671875, 2.99481201171875, 3.1412353515625, 3.28765869140625, 3.43408203125, 3.58050537109375, 3.7269287109375, 3.87335205078125, 4.019775390625, 4.16619873046875, 4.3126220703125, 4.45904541015625, 4.60546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 7.0, 6.0, 5.0, 11.0, 21.0, 31.0, 45.0, 62.0, 98.0, 148.0, 260.0, 455.0, 846.0, 1459.0, 2838.0, 5803.0, 12097.0, 26637.0, 60450.0, 130281.0, 231810.0, 258742.0, 167127.0, 81047.0, 36119.0, 16440.0, 7597.0, 3718.0, 1935.0, 971.0, 607.0, 349.0, 190.0, 121.0, 92.0, 49.0, 24.0, 13.0, 14.0, 12.0, 7.0, 5.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0390625, -3.91357421875, -3.7880859375, -3.66259765625, -3.537109375, -3.41162109375, -3.2861328125, -3.16064453125, -3.03515625, -2.90966796875, -2.7841796875, -2.65869140625, -2.533203125, -2.40771484375, -2.2822265625, -2.15673828125, -2.03125, -1.90576171875, -1.7802734375, -1.65478515625, -1.529296875, -1.40380859375, -1.2783203125, -1.15283203125, -1.02734375, -0.90185546875, -0.7763671875, -0.65087890625, -0.525390625, -0.39990234375, -0.2744140625, -0.14892578125, -0.0234375, 0.10205078125, 0.2275390625, 0.35302734375, 0.478515625, 0.60400390625, 0.7294921875, 0.85498046875, 0.98046875, 1.10595703125, 1.2314453125, 1.35693359375, 1.482421875, 1.60791015625, 1.7333984375, 1.85888671875, 1.984375, 2.10986328125, 2.2353515625, 2.36083984375, 2.486328125, 2.61181640625, 2.7373046875, 2.86279296875, 2.98828125, 3.11376953125, 3.2392578125, 3.36474609375, 3.490234375, 3.61572265625, 3.7412109375, 3.86669921875, 3.9921875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 9.0, 11.0, 10.0, 11.0, 13.0, 17.0, 22.0, 26.0, 26.0, 26.0, 32.0, 39.0, 30.0, 39.0, 58.0, 38.0, 49.0, 36.0, 47.0, 39.0, 46.0, 52.0, 51.0, 46.0, 29.0, 35.0, 27.0, 16.0, 25.0, 11.0, 13.0, 19.0, 13.0, 8.0, 6.0, 7.0, 8.0, 9.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.099609375, -3.003448486328125, -2.90728759765625, -2.811126708984375, -2.7149658203125, -2.618804931640625, -2.52264404296875, -2.426483154296875, -2.330322265625, -2.234161376953125, -2.13800048828125, -2.041839599609375, -1.9456787109375, -1.849517822265625, -1.75335693359375, -1.657196044921875, -1.56103515625, -1.464874267578125, -1.36871337890625, -1.272552490234375, -1.1763916015625, -1.080230712890625, -0.98406982421875, -0.887908935546875, -0.791748046875, -0.695587158203125, -0.59942626953125, -0.503265380859375, -0.4071044921875, -0.310943603515625, -0.21478271484375, -0.118621826171875, -0.0224609375, 0.073699951171875, 0.16986083984375, 0.266021728515625, 0.3621826171875, 0.458343505859375, 0.55450439453125, 0.650665283203125, 0.746826171875, 0.842987060546875, 0.93914794921875, 1.035308837890625, 1.1314697265625, 1.227630615234375, 1.32379150390625, 1.419952392578125, 1.51611328125, 1.612274169921875, 1.70843505859375, 1.804595947265625, 1.9007568359375, 1.996917724609375, 2.09307861328125, 2.189239501953125, 2.285400390625, 2.381561279296875, 2.47772216796875, 2.573883056640625, 2.6700439453125, 2.766204833984375, 2.86236572265625, 2.958526611328125, 3.0546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 7.0, 7.0, 17.0, 20.0, 25.0, 25.0, 38.0, 59.0, 62.0, 97.0, 130.0, 172.0, 223.0, 329.0, 461.0, 679.0, 1096.0, 1761.0, 2862.0, 5243.0, 10108.0, 20823.0, 47771.0, 116364.0, 253075.0, 299561.0, 162290.0, 67100.0, 28887.0, 13026.0, 6604.0, 3596.0, 1997.0, 1287.0, 887.0, 528.0, 412.0, 225.0, 185.0, 127.0, 110.0, 72.0, 65.0, 50.0, 23.0, 17.0, 14.0, 18.0, 10.0, 7.0, 3.0, 1.0, 0.0, 3.0, 3.0], "bins": [-2.080078125, -2.0192413330078125, -1.958404541015625, -1.8975677490234375, -1.83673095703125, -1.7758941650390625, -1.715057373046875, -1.6542205810546875, -1.5933837890625, -1.5325469970703125, -1.471710205078125, -1.4108734130859375, -1.35003662109375, -1.2891998291015625, -1.228363037109375, -1.1675262451171875, -1.106689453125, -1.0458526611328125, -0.985015869140625, -0.9241790771484375, -0.86334228515625, -0.8025054931640625, -0.741668701171875, -0.6808319091796875, -0.6199951171875, -0.5591583251953125, -0.498321533203125, -0.4374847412109375, -0.37664794921875, -0.3158111572265625, -0.254974365234375, -0.1941375732421875, -0.13330078125, -0.0724639892578125, -0.011627197265625, 0.0492095947265625, 0.11004638671875, 0.1708831787109375, 0.231719970703125, 0.2925567626953125, 0.3533935546875, 0.4142303466796875, 0.475067138671875, 0.5359039306640625, 0.59674072265625, 0.6575775146484375, 0.718414306640625, 0.7792510986328125, 0.840087890625, 0.9009246826171875, 0.961761474609375, 1.0225982666015625, 1.08343505859375, 1.1442718505859375, 1.205108642578125, 1.2659454345703125, 1.3267822265625, 1.3876190185546875, 1.448455810546875, 1.5092926025390625, 1.57012939453125, 1.6309661865234375, 1.691802978515625, 1.7526397705078125, 1.8134765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 1.0, 5.0, 7.0, 8.0, 18.0, 25.0, 31.0, 45.0, 58.0, 85.0, 92.0, 98.0, 118.0, 113.0, 96.0, 60.0, 41.0, 32.0, 28.0, 14.0, 14.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00018095970153808594, -0.0001767752692103386, -0.00017259083688259125, -0.0001684064045548439, -0.00016422197222709656, -0.0001600375398993492, -0.00015585310757160187, -0.00015166867524385452, -0.00014748424291610718, -0.00014329981058835983, -0.0001391153782606125, -0.00013493094593286514, -0.0001307465136051178, -0.00012656208127737045, -0.0001223776489496231, -0.00011819321662187576, -0.00011400878429412842, -0.00010982435196638107, -0.00010563991963863373, -0.00010145548731088638, -9.727105498313904e-05, -9.308662265539169e-05, -8.890219032764435e-05, -8.4717757999897e-05, -8.053332567214966e-05, -7.634889334440231e-05, -7.216446101665497e-05, -6.798002868890762e-05, -6.379559636116028e-05, -5.961116403341293e-05, -5.542673170566559e-05, -5.1242299377918243e-05, -4.70578670501709e-05, -4.2873434722423553e-05, -3.868900239467621e-05, -3.4504570066928864e-05, -3.032013773918152e-05, -2.6135705411434174e-05, -2.195127308368683e-05, -1.7766840755939484e-05, -1.3582408428192139e-05, -9.397976100444794e-06, -5.213543772697449e-06, -1.0291114449501038e-06, 3.155320882797241e-06, 7.339753210544586e-06, 1.1524185538291931e-05, 1.5708617866039276e-05, 1.989305019378662e-05, 2.4077482521533966e-05, 2.826191484928131e-05, 3.2446347177028656e-05, 3.6630779504776e-05, 4.0815211832523346e-05, 4.499964416027069e-05, 4.9184076488018036e-05, 5.336850881576538e-05, 5.7552941143512726e-05, 6.173737347126007e-05, 6.592180579900742e-05, 7.010623812675476e-05, 7.42906704545021e-05, 7.847510278224945e-05, 8.26595351099968e-05, 8.684396743774414e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 8.0, 2.0, 10.0, 12.0, 31.0, 38.0, 59.0, 79.0, 112.0, 147.0, 228.0, 298.0, 487.0, 678.0, 1021.0, 1657.0, 2753.0, 4229.0, 7544.0, 12894.0, 23362.0, 43411.0, 81384.0, 144010.0, 206311.0, 203765.0, 139745.0, 78638.0, 41625.0, 22726.0, 12453.0, 7147.0, 4251.0, 2687.0, 1595.0, 1041.0, 637.0, 441.0, 331.0, 224.0, 146.0, 113.0, 62.0, 54.0, 34.0, 21.0, 21.0, 16.0, 4.0, 8.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0], "bins": [-1.607421875, -1.5586700439453125, -1.509918212890625, -1.4611663818359375, -1.41241455078125, -1.3636627197265625, -1.314910888671875, -1.2661590576171875, -1.2174072265625, -1.1686553955078125, -1.119903564453125, -1.0711517333984375, -1.02239990234375, -0.9736480712890625, -0.924896240234375, -0.8761444091796875, -0.827392578125, -0.7786407470703125, -0.729888916015625, -0.6811370849609375, -0.63238525390625, -0.5836334228515625, -0.534881591796875, -0.4861297607421875, -0.4373779296875, -0.3886260986328125, -0.339874267578125, -0.2911224365234375, -0.24237060546875, -0.1936187744140625, -0.144866943359375, -0.0961151123046875, -0.04736328125, 0.0013885498046875, 0.050140380859375, 0.0988922119140625, 0.14764404296875, 0.1963958740234375, 0.245147705078125, 0.2938995361328125, 0.3426513671875, 0.3914031982421875, 0.440155029296875, 0.4889068603515625, 0.53765869140625, 0.5864105224609375, 0.635162353515625, 0.6839141845703125, 0.732666015625, 0.7814178466796875, 0.830169677734375, 0.8789215087890625, 0.92767333984375, 0.9764251708984375, 1.025177001953125, 1.0739288330078125, 1.1226806640625, 1.1714324951171875, 1.220184326171875, 1.2689361572265625, 1.31768798828125, 1.3664398193359375, 1.415191650390625, 1.4639434814453125, 1.5126953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 9.0, 4.0, 12.0, 7.0, 13.0, 17.0, 26.0, 31.0, 32.0, 38.0, 37.0, 57.0, 51.0, 57.0, 69.0, 66.0, 59.0, 43.0, 65.0, 36.0, 41.0, 28.0, 27.0, 26.0, 22.0, 16.0, 13.0, 18.0, 18.0, 6.0, 12.0, 4.0, 2.0, 4.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.439453125, -0.424072265625, -0.40869140625, -0.393310546875, -0.3779296875, -0.362548828125, -0.34716796875, -0.331787109375, -0.31640625, -0.301025390625, -0.28564453125, -0.270263671875, -0.2548828125, -0.239501953125, -0.22412109375, -0.208740234375, -0.193359375, -0.177978515625, -0.16259765625, -0.147216796875, -0.1318359375, -0.116455078125, -0.10107421875, -0.085693359375, -0.0703125, -0.054931640625, -0.03955078125, -0.024169921875, -0.0087890625, 0.006591796875, 0.02197265625, 0.037353515625, 0.052734375, 0.068115234375, 0.08349609375, 0.098876953125, 0.1142578125, 0.129638671875, 0.14501953125, 0.160400390625, 0.17578125, 0.191162109375, 0.20654296875, 0.221923828125, 0.2373046875, 0.252685546875, 0.26806640625, 0.283447265625, 0.298828125, 0.314208984375, 0.32958984375, 0.344970703125, 0.3603515625, 0.375732421875, 0.39111328125, 0.406494140625, 0.421875, 0.437255859375, 0.45263671875, 0.468017578125, 0.4833984375, 0.498779296875, 0.51416015625, 0.529541015625, 0.544921875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 4.0, 8.0, 4.0, 8.0, 9.0, 14.0, 17.0, 23.0, 22.0, 37.0, 44.0, 39.0, 39.0, 35.0, 53.0, 43.0, 48.0, 65.0, 52.0, 60.0, 52.0, 48.0, 33.0, 36.0, 32.0, 35.0, 29.0, 19.0, 20.0, 15.0, 10.0, 10.0, 13.0, 11.0, 3.0, 8.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5323567390441895, -4.363328456878662, -4.194299697875977, -4.025271415710449, -3.8562428951263428, -3.6872143745422363, -3.518186092376709, -3.3491575717926025, -3.180129051208496, -3.0111005306243896, -2.842072010040283, -2.673043727874756, -2.5040152072906494, -2.334986686706543, -2.1659584045410156, -1.9969298839569092, -1.8279013633728027, -1.6588728427886963, -1.4898444414138794, -1.3208160400390625, -1.151787519454956, -0.9827590584754944, -0.8137305974960327, -0.6447021961212158, -0.4756736755371094, -0.3066452145576477, -0.13761675357818604, 0.031411707401275635, 0.2004401683807373, 0.369468629360199, 0.5384970903396606, 0.7075254917144775, 0.876554012298584, 1.0455825328826904, 1.2146109342575073, 1.3836393356323242, 1.5526678562164307, 1.721696376800537, 1.890724778175354, 2.059753179550171, 2.2287817001342773, 2.397810220718384, 2.5668387413024902, 2.7358670234680176, 2.904895544052124, 3.0739240646362305, 3.242952346801758, 3.4119808673858643, 3.5810093879699707, 3.750037908554077, 3.9190664291381836, 4.088094711303711, 4.257122993469238, 4.426151752471924, 4.595180034637451, 4.764208793640137, 4.933237075805664, 5.102265357971191, 5.271294116973877, 5.440322399139404, 5.60935115814209, 5.778379440307617, 5.9474077224731445, 6.116436004638672, 6.285464763641357]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 2.0, 9.0, 8.0, 8.0, 9.0, 11.0, 11.0, 24.0, 29.0, 19.0, 29.0, 24.0, 31.0, 29.0, 35.0, 47.0, 43.0, 43.0, 51.0, 50.0, 43.0, 52.0, 53.0, 25.0, 36.0, 34.0, 37.0, 30.0, 30.0, 27.0, 17.0, 19.0, 20.0, 15.0, 12.0, 8.0, 9.0, 8.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.749150276184082, -4.604325771331787, -4.45950174331665, -4.3146772384643555, -4.1698527336120605, -4.025028228759766, -3.880204200744629, -3.735379695892334, -3.590555191040039, -3.4457309246063232, -3.3009064197540283, -3.1560821533203125, -3.0112576484680176, -2.8664333820343018, -2.721609115600586, -2.576784610748291, -2.431960344314575, -2.2871360778808594, -2.1423115730285645, -1.9974873065948486, -1.8526628017425537, -1.707838535308838, -1.5630141496658325, -1.4181897640228271, -1.2733653783798218, -1.1285409927368164, -0.983716607093811, -0.8388922810554504, -0.6940678954124451, -0.5492435097694397, -0.4044191837310791, -0.25959479808807373, -0.11477041244506836, 0.030053958296775818, 0.17487832903862, 0.319702684879303, 0.46452707052230835, 0.6093514561653137, 0.7541757822036743, 0.8990001678466797, 1.043824553489685, 1.1886489391326904, 1.3334733247756958, 1.4782977104187012, 1.623121976852417, 1.767946481704712, 1.9127707481384277, 2.0575952529907227, 2.2024195194244385, 2.3472437858581543, 2.492068290710449, 2.636892557144165, 2.78171706199646, 2.926541328430176, 3.0713658332824707, 3.2161900997161865, 3.3610143661499023, 3.505838632583618, 3.650663137435913, 3.795487403869629, 3.940311908721924, 4.085136413574219, 4.2299604415893555, 4.37478494644165, 4.519609451293945]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 8.0, 12.0, 21.0, 21.0, 29.0, 43.0, 66.0, 116.0, 182.0, 297.0, 484.0, 723.0, 1093.0, 1768.0, 2635.0, 4074.0, 6260.0, 9554.0, 13961.0, 20283.0, 29512.0, 39904.0, 53182.0, 67415.0, 80965.0, 91641.0, 98424.0, 98705.0, 91958.0, 81351.0, 67750.0, 53782.0, 40007.0, 29646.0, 21065.0, 14155.0, 9604.0, 6272.0, 4184.0, 2651.0, 1660.0, 1107.0, 700.0, 461.0, 291.0, 193.0, 130.0, 74.0, 47.0, 35.0, 25.0, 10.0, 11.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.396484375, -2.321624755859375, -2.24676513671875, -2.171905517578125, -2.0970458984375, -2.022186279296875, -1.94732666015625, -1.872467041015625, -1.797607421875, -1.722747802734375, -1.64788818359375, -1.573028564453125, -1.4981689453125, -1.423309326171875, -1.34844970703125, -1.273590087890625, -1.19873046875, -1.123870849609375, -1.04901123046875, -0.974151611328125, -0.8992919921875, -0.824432373046875, -0.74957275390625, -0.674713134765625, -0.599853515625, -0.524993896484375, -0.45013427734375, -0.375274658203125, -0.3004150390625, -0.225555419921875, -0.15069580078125, -0.075836181640625, -0.0009765625, 0.073883056640625, 0.14874267578125, 0.223602294921875, 0.2984619140625, 0.373321533203125, 0.44818115234375, 0.523040771484375, 0.597900390625, 0.672760009765625, 0.74761962890625, 0.822479248046875, 0.8973388671875, 0.972198486328125, 1.04705810546875, 1.121917724609375, 1.19677734375, 1.271636962890625, 1.34649658203125, 1.421356201171875, 1.4962158203125, 1.571075439453125, 1.64593505859375, 1.720794677734375, 1.795654296875, 1.870513916015625, 1.94537353515625, 2.020233154296875, 2.0950927734375, 2.169952392578125, 2.24481201171875, 2.319671630859375, 2.39453125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 12.0, 8.0, 13.0, 22.0, 18.0, 20.0, 21.0, 25.0, 32.0, 45.0, 39.0, 37.0, 42.0, 40.0, 39.0, 53.0, 44.0, 42.0, 43.0, 44.0, 42.0, 40.0, 34.0, 43.0, 28.0, 25.0, 18.0, 17.0, 20.0, 19.0, 14.0, 9.0, 10.0, 5.0, 6.0, 6.0, 8.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.734375, -4.58831787109375, -4.4422607421875, -4.29620361328125, -4.150146484375, -4.00408935546875, -3.8580322265625, -3.71197509765625, -3.56591796875, -3.41986083984375, -3.2738037109375, -3.12774658203125, -2.981689453125, -2.83563232421875, -2.6895751953125, -2.54351806640625, -2.3974609375, -2.25140380859375, -2.1053466796875, -1.95928955078125, -1.813232421875, -1.66717529296875, -1.5211181640625, -1.37506103515625, -1.22900390625, -1.08294677734375, -0.9368896484375, -0.79083251953125, -0.644775390625, -0.49871826171875, -0.3526611328125, -0.20660400390625, -0.060546875, 0.08551025390625, 0.2315673828125, 0.37762451171875, 0.523681640625, 0.66973876953125, 0.8157958984375, 0.96185302734375, 1.10791015625, 1.25396728515625, 1.4000244140625, 1.54608154296875, 1.692138671875, 1.83819580078125, 1.9842529296875, 2.13031005859375, 2.2763671875, 2.42242431640625, 2.5684814453125, 2.71453857421875, 2.860595703125, 3.00665283203125, 3.1527099609375, 3.29876708984375, 3.44482421875, 3.59088134765625, 3.7369384765625, 3.88299560546875, 4.029052734375, 4.17510986328125, 4.3211669921875, 4.46722412109375, 4.61328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 21.0, 20.0, 37.0, 51.0, 65.0, 107.0, 212.0, 291.0, 480.0, 767.0, 1231.0, 1921.0, 3055.0, 4720.0, 7226.0, 10758.0, 15684.0, 23389.0, 33112.0, 44407.0, 59191.0, 74213.0, 88357.0, 97564.0, 101505.0, 98196.0, 89916.0, 76297.0, 60921.0, 46574.0, 34452.0, 24317.0, 16930.0, 11334.0, 7473.0, 4897.0, 3132.0, 2149.0, 1321.0, 825.0, 555.0, 311.0, 213.0, 129.0, 82.0, 61.0, 36.0, 22.0, 10.0, 7.0, 6.0, 4.0, 2.0, 0.0, 2.0], "bins": [-2.615234375, -2.537322998046875, -2.45941162109375, -2.381500244140625, -2.3035888671875, -2.225677490234375, -2.14776611328125, -2.069854736328125, -1.991943359375, -1.914031982421875, -1.83612060546875, -1.758209228515625, -1.6802978515625, -1.602386474609375, -1.52447509765625, -1.446563720703125, -1.36865234375, -1.290740966796875, -1.21282958984375, -1.134918212890625, -1.0570068359375, -0.979095458984375, -0.90118408203125, -0.823272705078125, -0.745361328125, -0.667449951171875, -0.58953857421875, -0.511627197265625, -0.4337158203125, -0.355804443359375, -0.27789306640625, -0.199981689453125, -0.1220703125, -0.044158935546875, 0.03375244140625, 0.111663818359375, 0.1895751953125, 0.267486572265625, 0.34539794921875, 0.423309326171875, 0.501220703125, 0.579132080078125, 0.65704345703125, 0.734954833984375, 0.8128662109375, 0.890777587890625, 0.96868896484375, 1.046600341796875, 1.12451171875, 1.202423095703125, 1.28033447265625, 1.358245849609375, 1.4361572265625, 1.514068603515625, 1.59197998046875, 1.669891357421875, 1.747802734375, 1.825714111328125, 1.90362548828125, 1.981536865234375, 2.0594482421875, 2.137359619140625, 2.21527099609375, 2.293182373046875, 2.37109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 11.0, 10.0, 16.0, 18.0, 17.0, 15.0, 19.0, 26.0, 26.0, 30.0, 42.0, 38.0, 46.0, 41.0, 37.0, 61.0, 53.0, 46.0, 54.0, 43.0, 45.0, 29.0, 36.0, 41.0, 30.0, 25.0, 24.0, 13.0, 21.0, 18.0, 12.0, 15.0, 11.0, 6.0, 2.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.021484375, -2.92694091796875, -2.8323974609375, -2.73785400390625, -2.643310546875, -2.54876708984375, -2.4542236328125, -2.35968017578125, -2.26513671875, -2.17059326171875, -2.0760498046875, -1.98150634765625, -1.886962890625, -1.79241943359375, -1.6978759765625, -1.60333251953125, -1.5087890625, -1.41424560546875, -1.3197021484375, -1.22515869140625, -1.130615234375, -1.03607177734375, -0.9415283203125, -0.84698486328125, -0.75244140625, -0.65789794921875, -0.5633544921875, -0.46881103515625, -0.374267578125, -0.27972412109375, -0.1851806640625, -0.09063720703125, 0.00390625, 0.09844970703125, 0.1929931640625, 0.28753662109375, 0.382080078125, 0.47662353515625, 0.5711669921875, 0.66571044921875, 0.76025390625, 0.85479736328125, 0.9493408203125, 1.04388427734375, 1.138427734375, 1.23297119140625, 1.3275146484375, 1.42205810546875, 1.5166015625, 1.61114501953125, 1.7056884765625, 1.80023193359375, 1.894775390625, 1.98931884765625, 2.0838623046875, 2.17840576171875, 2.27294921875, 2.36749267578125, 2.4620361328125, 2.55657958984375, 2.651123046875, 2.74566650390625, 2.8402099609375, 2.93475341796875, 3.029296875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 23.0, 22.0, 37.0, 72.0, 106.0, 189.0, 307.0, 520.0, 775.0, 1337.0, 2263.0, 3781.0, 6148.0, 10291.0, 16767.0, 26497.0, 40987.0, 60562.0, 83395.0, 105106.0, 121851.0, 126480.0, 117690.0, 98909.0, 75703.0, 53468.0, 36017.0, 23119.0, 14193.0, 8723.0, 5245.0, 3218.0, 1863.0, 1106.0, 715.0, 423.0, 267.0, 132.0, 86.0, 61.0, 45.0, 23.0, 9.0, 10.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0595703125, -1.02081298828125, -0.9820556640625, -0.94329833984375, -0.904541015625, -0.86578369140625, -0.8270263671875, -0.78826904296875, -0.74951171875, -0.71075439453125, -0.6719970703125, -0.63323974609375, -0.594482421875, -0.55572509765625, -0.5169677734375, -0.47821044921875, -0.439453125, -0.40069580078125, -0.3619384765625, -0.32318115234375, -0.284423828125, -0.24566650390625, -0.2069091796875, -0.16815185546875, -0.12939453125, -0.09063720703125, -0.0518798828125, -0.01312255859375, 0.025634765625, 0.06439208984375, 0.1031494140625, 0.14190673828125, 0.1806640625, 0.21942138671875, 0.2581787109375, 0.29693603515625, 0.335693359375, 0.37445068359375, 0.4132080078125, 0.45196533203125, 0.49072265625, 0.52947998046875, 0.5682373046875, 0.60699462890625, 0.645751953125, 0.68450927734375, 0.7232666015625, 0.76202392578125, 0.80078125, 0.83953857421875, 0.8782958984375, 0.91705322265625, 0.955810546875, 0.99456787109375, 1.0333251953125, 1.07208251953125, 1.11083984375, 1.14959716796875, 1.1883544921875, 1.22711181640625, 1.265869140625, 1.30462646484375, 1.3433837890625, 1.38214111328125, 1.4208984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 0.0, 4.0, 8.0, 11.0, 10.0, 16.0, 16.0, 21.0, 19.0, 36.0, 37.0, 41.0, 38.0, 48.0, 54.0, 60.0, 55.0, 57.0, 55.0, 47.0, 46.0, 40.0, 46.0, 38.0, 35.0, 27.0, 29.0, 24.0, 20.0, 9.0, 11.0, 13.0, 6.0, 6.0, 3.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 5.0], "bins": [-0.00017654895782470703, -0.00017191097140312195, -0.00016727298498153687, -0.00016263499855995178, -0.0001579970121383667, -0.00015335902571678162, -0.00014872103929519653, -0.00014408305287361145, -0.00013944506645202637, -0.00013480708003044128, -0.0001301690936088562, -0.00012553110718727112, -0.00012089312076568604, -0.00011625513434410095, -0.00011161714792251587, -0.00010697916150093079, -0.0001023411750793457, -9.770318865776062e-05, -9.306520223617554e-05, -8.842721581459045e-05, -8.378922939300537e-05, -7.915124297142029e-05, -7.45132565498352e-05, -6.987527012825012e-05, -6.523728370666504e-05, -6.0599297285079956e-05, -5.596131086349487e-05, -5.132332444190979e-05, -4.668533802032471e-05, -4.2047351598739624e-05, -3.740936517715454e-05, -3.277137875556946e-05, -2.8133392333984375e-05, -2.3495405912399292e-05, -1.885741949081421e-05, -1.4219433069229126e-05, -9.581446647644043e-06, -4.94346022605896e-06, -3.0547380447387695e-07, 4.332512617111206e-06, 8.970499038696289e-06, 1.3608485460281372e-05, 1.8246471881866455e-05, 2.2884458303451538e-05, 2.752244472503662e-05, 3.2160431146621704e-05, 3.679841756820679e-05, 4.143640398979187e-05, 4.607439041137695e-05, 5.0712376832962036e-05, 5.535036325454712e-05, 5.99883496761322e-05, 6.462633609771729e-05, 6.926432251930237e-05, 7.390230894088745e-05, 7.854029536247253e-05, 8.317828178405762e-05, 8.78162682056427e-05, 9.245425462722778e-05, 9.709224104881287e-05, 0.00010173022747039795, 0.00010636821389198303, 0.00011100620031356812, 0.0001156441867351532, 0.00012028217315673828]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 8.0, 5.0, 9.0, 14.0, 24.0, 29.0, 46.0, 73.0, 108.0, 165.0, 292.0, 409.0, 616.0, 1095.0, 1653.0, 2557.0, 4050.0, 6223.0, 9494.0, 14465.0, 21392.0, 30966.0, 43035.0, 58014.0, 74545.0, 90576.0, 101903.0, 106715.0, 103045.0, 93295.0, 77833.0, 60799.0, 45799.0, 32654.0, 22587.0, 15214.0, 10364.0, 6506.0, 4278.0, 2804.0, 1731.0, 1109.0, 738.0, 463.0, 326.0, 191.0, 114.0, 77.0, 53.0, 30.0, 28.0, 16.0, 10.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.0361328125, -1.003326416015625, -0.97052001953125, -0.937713623046875, -0.9049072265625, -0.872100830078125, -0.83929443359375, -0.806488037109375, -0.773681640625, -0.740875244140625, -0.70806884765625, -0.675262451171875, -0.6424560546875, -0.609649658203125, -0.57684326171875, -0.544036865234375, -0.51123046875, -0.478424072265625, -0.44561767578125, -0.412811279296875, -0.3800048828125, -0.347198486328125, -0.31439208984375, -0.281585693359375, -0.248779296875, -0.215972900390625, -0.18316650390625, -0.150360107421875, -0.1175537109375, -0.084747314453125, -0.05194091796875, -0.019134521484375, 0.013671875, 0.046478271484375, 0.07928466796875, 0.112091064453125, 0.1448974609375, 0.177703857421875, 0.21051025390625, 0.243316650390625, 0.276123046875, 0.308929443359375, 0.34173583984375, 0.374542236328125, 0.4073486328125, 0.440155029296875, 0.47296142578125, 0.505767822265625, 0.53857421875, 0.571380615234375, 0.60418701171875, 0.636993408203125, 0.6697998046875, 0.702606201171875, 0.73541259765625, 0.768218994140625, 0.801025390625, 0.833831787109375, 0.86663818359375, 0.899444580078125, 0.9322509765625, 0.965057373046875, 0.99786376953125, 1.030670166015625, 1.0634765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 8.0, 8.0, 6.0, 13.0, 9.0, 11.0, 8.0, 16.0, 31.0, 19.0, 32.0, 24.0, 23.0, 30.0, 43.0, 40.0, 39.0, 39.0, 37.0, 31.0, 44.0, 42.0, 46.0, 43.0, 42.0, 22.0, 36.0, 35.0, 31.0, 9.0, 29.0, 23.0, 15.0, 22.0, 16.0, 15.0, 15.0, 8.0, 5.0, 4.0, 3.0, 2.0, 6.0, 2.0, 8.0, 4.0, 0.0, 3.0], "bins": [-0.50732421875, -0.49359130859375, -0.4798583984375, -0.46612548828125, -0.452392578125, -0.43865966796875, -0.4249267578125, -0.41119384765625, -0.3974609375, -0.38372802734375, -0.3699951171875, -0.35626220703125, -0.342529296875, -0.32879638671875, -0.3150634765625, -0.30133056640625, -0.28759765625, -0.27386474609375, -0.2601318359375, -0.24639892578125, -0.232666015625, -0.21893310546875, -0.2052001953125, -0.19146728515625, -0.177734375, -0.16400146484375, -0.1502685546875, -0.13653564453125, -0.122802734375, -0.10906982421875, -0.0953369140625, -0.08160400390625, -0.06787109375, -0.05413818359375, -0.0404052734375, -0.02667236328125, -0.012939453125, 0.00079345703125, 0.0145263671875, 0.02825927734375, 0.0419921875, 0.05572509765625, 0.0694580078125, 0.08319091796875, 0.096923828125, 0.11065673828125, 0.1243896484375, 0.13812255859375, 0.15185546875, 0.16558837890625, 0.1793212890625, 0.19305419921875, 0.206787109375, 0.22052001953125, 0.2342529296875, 0.24798583984375, 0.26171875, 0.27545166015625, 0.2891845703125, 0.30291748046875, 0.316650390625, 0.33038330078125, 0.3441162109375, 0.35784912109375, 0.37158203125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 3.0, 2.0, 1.0, 9.0, 2.0, 8.0, 12.0, 11.0, 15.0, 14.0, 29.0, 26.0, 36.0, 33.0, 39.0, 49.0, 33.0, 41.0, 43.0, 61.0, 45.0, 41.0, 51.0, 46.0, 37.0, 40.0, 36.0, 37.0, 31.0, 24.0, 25.0, 16.0, 15.0, 17.0, 19.0, 9.0, 8.0, 8.0, 10.0, 8.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.026535987854004, -3.8773913383483887, -3.7282466888427734, -3.579102039337158, -3.429957389831543, -3.2808127403259277, -3.1316680908203125, -2.9825234413146973, -2.833378791809082, -2.684234142303467, -2.5350894927978516, -2.3859448432922363, -2.236800193786621, -2.087655544281006, -1.9385110139846802, -1.789366364479065, -1.6402218341827393, -1.491077184677124, -1.3419325351715088, -1.1927878856658936, -1.0436432361602783, -0.8944986462593079, -0.7453540563583374, -0.5962094068527222, -0.44706475734710693, -0.2979201078414917, -0.14877548813819885, 0.00036913156509399414, 0.14951378107070923, 0.29865843057632446, 0.4478030204772949, 0.5969476699829102, 0.7460923194885254, 0.8952369689941406, 1.0443816184997559, 1.193526268005371, 1.3426709175109863, 1.4918155670166016, 1.6409600973129272, 1.7901047468185425, 1.9392493963241577, 2.0883939266204834, 2.2375385761260986, 2.386683225631714, 2.535827875137329, 2.6849725246429443, 2.8341171741485596, 2.983261823654175, 3.13240647315979, 3.2815511226654053, 3.4306957721710205, 3.5798404216766357, 3.728985071182251, 3.878129720687866, 4.027274131774902, 4.176418781280518, 4.325563430786133, 4.474708080291748, 4.623852729797363, 4.7729973793029785, 4.922142028808594, 5.071286678314209, 5.220431327819824, 5.3695759773254395, 5.518720626831055]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 1.0, 6.0, 8.0, 6.0, 12.0, 8.0, 14.0, 16.0, 11.0, 16.0, 29.0, 27.0, 23.0, 38.0, 33.0, 39.0, 38.0, 44.0, 41.0, 53.0, 51.0, 50.0, 54.0, 40.0, 48.0, 39.0, 29.0, 36.0, 23.0, 31.0, 21.0, 22.0, 18.0, 11.0, 14.0, 17.0, 8.0, 7.0, 5.0, 6.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.585770606994629, -4.435801982879639, -4.285833358764648, -4.1358642578125, -3.9858956336975098, -3.8359270095825195, -3.68595814704895, -3.535989284515381, -3.3860206604003906, -3.2360520362854004, -3.086083173751831, -2.9361143112182617, -2.7861456871032715, -2.6361770629882812, -2.486208200454712, -2.3362393379211426, -2.1862707138061523, -2.036302089691162, -1.8863332271575928, -1.736364483833313, -1.5863957405090332, -1.4364269971847534, -1.2864582538604736, -1.1364895105361938, -0.9865207672119141, -0.8365520238876343, -0.6865832805633545, -0.5366145372390747, -0.3866457939147949, -0.23667705059051514, -0.08670830726623535, 0.06326043605804443, 0.21322870254516602, 0.3631974458694458, 0.5131661891937256, 0.6631349325180054, 0.8131036758422852, 0.9630724191665649, 1.1130411624908447, 1.2630099058151245, 1.4129786491394043, 1.562947392463684, 1.7129161357879639, 1.8628848791122437, 2.0128536224365234, 2.1628222465515137, 2.312791109085083, 2.4627599716186523, 2.6127285957336426, 2.762697219848633, 2.912666082382202, 3.0626349449157715, 3.2126035690307617, 3.362572193145752, 3.5125410556793213, 3.6625099182128906, 3.812478542327881, 3.962447166442871, 4.1124162673950195, 4.26238489151001, 4.412353515625, 4.56232213973999, 4.7122907638549805, 4.862259864807129, 5.012228488922119]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 9.0, 14.0, 26.0, 48.0, 77.0, 157.0, 246.0, 412.0, 711.0, 1300.0, 2135.0, 3780.0, 6814.0, 12206.0, 21437.0, 39020.0, 70928.0, 127646.0, 224434.0, 373318.0, 550671.0, 679458.0, 676282.0, 539025.0, 361149.0, 219076.0, 125585.0, 70250.0, 38659.0, 21543.0, 12150.0, 6975.0, 3800.0, 2138.0, 1184.0, 697.0, 382.0, 219.0, 118.0, 90.0, 40.0, 30.0, 23.0, 13.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.02734375, -3.8973388671875, -3.767333984375, -3.6373291015625, -3.50732421875, -3.3773193359375, -3.247314453125, -3.1173095703125, -2.9873046875, -2.8572998046875, -2.727294921875, -2.5972900390625, -2.46728515625, -2.3372802734375, -2.207275390625, -2.0772705078125, -1.947265625, -1.8172607421875, -1.687255859375, -1.5572509765625, -1.42724609375, -1.2972412109375, -1.167236328125, -1.0372314453125, -0.9072265625, -0.7772216796875, -0.647216796875, -0.5172119140625, -0.38720703125, -0.2572021484375, -0.127197265625, 0.0028076171875, 0.1328125, 0.2628173828125, 0.392822265625, 0.5228271484375, 0.65283203125, 0.7828369140625, 0.912841796875, 1.0428466796875, 1.1728515625, 1.3028564453125, 1.432861328125, 1.5628662109375, 1.69287109375, 1.8228759765625, 1.952880859375, 2.0828857421875, 2.212890625, 2.3428955078125, 2.472900390625, 2.6029052734375, 2.73291015625, 2.8629150390625, 2.992919921875, 3.1229248046875, 3.2529296875, 3.3829345703125, 3.512939453125, 3.6429443359375, 3.77294921875, 3.9029541015625, 4.032958984375, 4.1629638671875, 4.29296875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 8.0, 6.0, 13.0, 8.0, 11.0, 11.0, 15.0, 22.0, 19.0, 24.0, 22.0, 32.0, 33.0, 33.0, 43.0, 37.0, 44.0, 43.0, 32.0, 46.0, 55.0, 42.0, 55.0, 38.0, 38.0, 35.0, 31.0, 33.0, 30.0, 17.0, 16.0, 19.0, 14.0, 12.0, 17.0, 13.0, 5.0, 6.0, 14.0, 4.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.802734375, -3.6824951171875, -3.562255859375, -3.4420166015625, -3.32177734375, -3.2015380859375, -3.081298828125, -2.9610595703125, -2.8408203125, -2.7205810546875, -2.600341796875, -2.4801025390625, -2.35986328125, -2.2396240234375, -2.119384765625, -1.9991455078125, -1.87890625, -1.7586669921875, -1.638427734375, -1.5181884765625, -1.39794921875, -1.2777099609375, -1.157470703125, -1.0372314453125, -0.9169921875, -0.7967529296875, -0.676513671875, -0.5562744140625, -0.43603515625, -0.3157958984375, -0.195556640625, -0.0753173828125, 0.044921875, 0.1651611328125, 0.285400390625, 0.4056396484375, 0.52587890625, 0.6461181640625, 0.766357421875, 0.8865966796875, 1.0068359375, 1.1270751953125, 1.247314453125, 1.3675537109375, 1.48779296875, 1.6080322265625, 1.728271484375, 1.8485107421875, 1.96875, 2.0889892578125, 2.209228515625, 2.3294677734375, 2.44970703125, 2.5699462890625, 2.690185546875, 2.8104248046875, 2.9306640625, 3.0509033203125, 3.171142578125, 3.2913818359375, 3.41162109375, 3.5318603515625, 3.652099609375, 3.7723388671875, 3.892578125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 9.0, 9.0, 20.0, 22.0, 56.0, 86.0, 140.0, 230.0, 407.0, 681.0, 1228.0, 2179.0, 3690.0, 6703.0, 11421.0, 20027.0, 35275.0, 61202.0, 103694.0, 170880.0, 267967.0, 392143.0, 516424.0, 591970.0, 575320.0, 482815.0, 354712.0, 236317.0, 147970.0, 89352.0, 51996.0, 29812.0, 17021.0, 9667.0, 5525.0, 3185.0, 1753.0, 1001.0, 594.0, 309.0, 177.0, 116.0, 76.0, 49.0, 29.0, 13.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.1953125, -4.0635986328125, -3.931884765625, -3.8001708984375, -3.66845703125, -3.5367431640625, -3.405029296875, -3.2733154296875, -3.1416015625, -3.0098876953125, -2.878173828125, -2.7464599609375, -2.61474609375, -2.4830322265625, -2.351318359375, -2.2196044921875, -2.087890625, -1.9561767578125, -1.824462890625, -1.6927490234375, -1.56103515625, -1.4293212890625, -1.297607421875, -1.1658935546875, -1.0341796875, -0.9024658203125, -0.770751953125, -0.6390380859375, -0.50732421875, -0.3756103515625, -0.243896484375, -0.1121826171875, 0.01953125, 0.1512451171875, 0.282958984375, 0.4146728515625, 0.54638671875, 0.6781005859375, 0.809814453125, 0.9415283203125, 1.0732421875, 1.2049560546875, 1.336669921875, 1.4683837890625, 1.60009765625, 1.7318115234375, 1.863525390625, 1.9952392578125, 2.126953125, 2.2586669921875, 2.390380859375, 2.5220947265625, 2.65380859375, 2.7855224609375, 2.917236328125, 3.0489501953125, 3.1806640625, 3.3123779296875, 3.444091796875, 3.5758056640625, 3.70751953125, 3.8392333984375, 3.970947265625, 4.1026611328125, 4.234375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 6.0, 7.0, 9.0, 14.0, 27.0, 31.0, 32.0, 57.0, 56.0, 56.0, 83.0, 84.0, 100.0, 121.0, 139.0, 160.0, 184.0, 195.0, 203.0, 269.0, 227.0, 229.0, 233.0, 196.0, 208.0, 179.0, 159.0, 130.0, 119.0, 117.0, 80.0, 87.0, 60.0, 56.0, 38.0, 34.0, 23.0, 23.0, 8.0, 8.0, 8.0, 6.0, 5.0, 2.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.767578125, -1.7121429443359375, -1.656707763671875, -1.6012725830078125, -1.54583740234375, -1.4904022216796875, -1.434967041015625, -1.3795318603515625, -1.3240966796875, -1.2686614990234375, -1.213226318359375, -1.1577911376953125, -1.10235595703125, -1.0469207763671875, -0.991485595703125, -0.9360504150390625, -0.880615234375, -0.8251800537109375, -0.769744873046875, -0.7143096923828125, -0.65887451171875, -0.6034393310546875, -0.548004150390625, -0.4925689697265625, -0.4371337890625, -0.3816986083984375, -0.326263427734375, -0.2708282470703125, -0.21539306640625, -0.1599578857421875, -0.104522705078125, -0.0490875244140625, 0.00634765625, 0.0617828369140625, 0.117218017578125, 0.1726531982421875, 0.22808837890625, 0.2835235595703125, 0.338958740234375, 0.3943939208984375, 0.4498291015625, 0.5052642822265625, 0.560699462890625, 0.6161346435546875, 0.67156982421875, 0.7270050048828125, 0.782440185546875, 0.8378753662109375, 0.893310546875, 0.9487457275390625, 1.004180908203125, 1.0596160888671875, 1.11505126953125, 1.1704864501953125, 1.225921630859375, 1.2813568115234375, 1.3367919921875, 1.3922271728515625, 1.447662353515625, 1.5030975341796875, 1.55853271484375, 1.6139678955078125, 1.669403076171875, 1.7248382568359375, 1.7802734375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 2.0, 7.0, 7.0, 10.0, 6.0, 7.0, 14.0, 23.0, 22.0, 34.0, 32.0, 41.0, 45.0, 38.0, 56.0, 45.0, 59.0, 52.0, 43.0, 52.0, 50.0, 47.0, 39.0, 31.0, 34.0, 32.0, 29.0, 22.0, 27.0, 20.0, 15.0, 10.0, 12.0, 10.0, 9.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.377223014831543, -4.217852592468262, -4.0584821701049805, -3.899111747741699, -3.739741325378418, -3.5803709030151367, -3.4210004806518555, -3.261630058288574, -3.102259635925293, -2.9428892135620117, -2.7835187911987305, -2.624148368835449, -2.464777946472168, -2.3054075241088867, -2.1460371017456055, -1.9866666793823242, -1.827296257019043, -1.6679258346557617, -1.5085554122924805, -1.3491849899291992, -1.189814567565918, -1.0304441452026367, -0.8710737228393555, -0.7117033004760742, -0.552332878112793, -0.3929624557495117, -0.23359203338623047, -0.07422161102294922, 0.08514881134033203, 0.24451923370361328, 0.40388965606689453, 0.5632600784301758, 0.7226309776306152, 0.8820013999938965, 1.0413718223571777, 1.200742244720459, 1.3601126670837402, 1.5194830894470215, 1.6788535118103027, 1.838223934173584, 1.9975943565368652, 2.1569647789001465, 2.3163352012634277, 2.475705623626709, 2.6350760459899902, 2.7944464683532715, 2.9538168907165527, 3.113187313079834, 3.2725577354431152, 3.4319281578063965, 3.5912985801696777, 3.750669002532959, 3.9100394248962402, 4.0694098472595215, 4.228780269622803, 4.388150691986084, 4.547521114349365, 4.7068915367126465, 4.866261959075928, 5.025632381439209, 5.18500280380249, 5.3443732261657715, 5.503743648529053, 5.663114070892334, 5.822484493255615]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 8.0, 5.0, 10.0, 15.0, 12.0, 15.0, 12.0, 9.0, 16.0, 29.0, 30.0, 24.0, 38.0, 34.0, 50.0, 43.0, 40.0, 36.0, 49.0, 37.0, 54.0, 49.0, 44.0, 31.0, 37.0, 41.0, 39.0, 37.0, 35.0, 26.0, 19.0, 15.0, 13.0, 9.0, 14.0, 5.0, 8.0, 7.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.764530181884766, -4.623108863830566, -4.481687545776367, -4.340266227722168, -4.198844909667969, -4.057423114776611, -3.916001796722412, -3.774580478668213, -3.6331591606140137, -3.4917378425598145, -3.3503165245056152, -3.208894968032837, -3.0674736499786377, -2.9260523319244385, -2.78463077545166, -2.643209457397461, -2.5017881393432617, -2.3603668212890625, -2.2189455032348633, -2.077523946762085, -1.9361026287078857, -1.7946813106536865, -1.6532598733901978, -1.511838436126709, -1.3704171180725098, -1.2289958000183105, -1.0875743627548218, -0.9461529850959778, -0.8047316074371338, -0.6633102297782898, -0.5218888521194458, -0.3804674744606018, -0.2390460968017578, -0.09762471914291382, 0.043796658515930176, 0.18521803617477417, 0.32663941383361816, 0.46806079149246216, 0.6094821691513062, 0.7509035468101501, 0.8923249244689941, 1.0337462425231934, 1.1751676797866821, 1.316589117050171, 1.4580104351043701, 1.5994317531585693, 1.740853190422058, 1.8822746276855469, 2.023695945739746, 2.1651172637939453, 2.3065385818481445, 2.447960138320923, 2.589381456375122, 2.7308027744293213, 2.8722243309020996, 3.013645648956299, 3.155066967010498, 3.2964882850646973, 3.4379096031188965, 3.579331159591675, 3.720752477645874, 3.8621737957000732, 4.003595352172852, 4.145016670227051, 4.28643798828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 17.0, 17.0, 23.0, 41.0, 45.0, 61.0, 98.0, 140.0, 227.0, 339.0, 470.0, 800.0, 1252.0, 2183.0, 3831.0, 7286.0, 14264.0, 28287.0, 53951.0, 97517.0, 153018.0, 192088.0, 183341.0, 134426.0, 82145.0, 44123.0, 22737.0, 11460.0, 5982.0, 3342.0, 1934.0, 1137.0, 684.0, 449.0, 262.0, 188.0, 131.0, 80.0, 58.0, 33.0, 33.0, 11.0, 10.0, 10.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.65625, -2.5777587890625, -2.499267578125, -2.4207763671875, -2.34228515625, -2.2637939453125, -2.185302734375, -2.1068115234375, -2.0283203125, -1.9498291015625, -1.871337890625, -1.7928466796875, -1.71435546875, -1.6358642578125, -1.557373046875, -1.4788818359375, -1.400390625, -1.3218994140625, -1.243408203125, -1.1649169921875, -1.08642578125, -1.0079345703125, -0.929443359375, -0.8509521484375, -0.7724609375, -0.6939697265625, -0.615478515625, -0.5369873046875, -0.45849609375, -0.3800048828125, -0.301513671875, -0.2230224609375, -0.14453125, -0.0660400390625, 0.012451171875, 0.0909423828125, 0.16943359375, 0.2479248046875, 0.326416015625, 0.4049072265625, 0.4833984375, 0.5618896484375, 0.640380859375, 0.7188720703125, 0.79736328125, 0.8758544921875, 0.954345703125, 1.0328369140625, 1.111328125, 1.1898193359375, 1.268310546875, 1.3468017578125, 1.42529296875, 1.5037841796875, 1.582275390625, 1.6607666015625, 1.7392578125, 1.8177490234375, 1.896240234375, 1.9747314453125, 2.05322265625, 2.1317138671875, 2.210205078125, 2.2886962890625, 2.3671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 4.0, 5.0, 9.0, 11.0, 16.0, 13.0, 13.0, 15.0, 15.0, 23.0, 35.0, 34.0, 30.0, 36.0, 33.0, 26.0, 44.0, 32.0, 34.0, 50.0, 44.0, 33.0, 41.0, 38.0, 42.0, 49.0, 28.0, 34.0, 35.0, 21.0, 18.0, 29.0, 22.0, 16.0, 10.0, 13.0, 9.0, 12.0, 8.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.49609375, -4.3603515625, -4.224609375, -4.0888671875, -3.953125, -3.8173828125, -3.681640625, -3.5458984375, -3.41015625, -3.2744140625, -3.138671875, -3.0029296875, -2.8671875, -2.7314453125, -2.595703125, -2.4599609375, -2.32421875, -2.1884765625, -2.052734375, -1.9169921875, -1.78125, -1.6455078125, -1.509765625, -1.3740234375, -1.23828125, -1.1025390625, -0.966796875, -0.8310546875, -0.6953125, -0.5595703125, -0.423828125, -0.2880859375, -0.15234375, -0.0166015625, 0.119140625, 0.2548828125, 0.390625, 0.5263671875, 0.662109375, 0.7978515625, 0.93359375, 1.0693359375, 1.205078125, 1.3408203125, 1.4765625, 1.6123046875, 1.748046875, 1.8837890625, 2.01953125, 2.1552734375, 2.291015625, 2.4267578125, 2.5625, 2.6982421875, 2.833984375, 2.9697265625, 3.10546875, 3.2412109375, 3.376953125, 3.5126953125, 3.6484375, 3.7841796875, 3.919921875, 4.0556640625, 4.19140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 12.0, 7.0, 15.0, 32.0, 41.0, 75.0, 111.0, 153.0, 277.0, 369.0, 660.0, 1103.0, 1873.0, 3411.0, 6522.0, 12700.0, 25828.0, 53515.0, 108568.0, 190735.0, 240302.0, 189729.0, 107300.0, 53222.0, 25116.0, 12662.0, 6242.0, 3369.0, 1827.0, 1055.0, 625.0, 407.0, 244.0, 146.0, 111.0, 51.0, 40.0, 38.0, 17.0, 12.0, 8.0, 6.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.205078125, -3.096405029296875, -2.98773193359375, -2.879058837890625, -2.7703857421875, -2.661712646484375, -2.55303955078125, -2.444366455078125, -2.335693359375, -2.227020263671875, -2.11834716796875, -2.009674072265625, -1.9010009765625, -1.792327880859375, -1.68365478515625, -1.574981689453125, -1.46630859375, -1.357635498046875, -1.24896240234375, -1.140289306640625, -1.0316162109375, -0.922943115234375, -0.81427001953125, -0.705596923828125, -0.596923828125, -0.488250732421875, -0.37957763671875, -0.270904541015625, -0.1622314453125, -0.053558349609375, 0.05511474609375, 0.163787841796875, 0.2724609375, 0.381134033203125, 0.48980712890625, 0.598480224609375, 0.7071533203125, 0.815826416015625, 0.92449951171875, 1.033172607421875, 1.141845703125, 1.250518798828125, 1.35919189453125, 1.467864990234375, 1.5765380859375, 1.685211181640625, 1.79388427734375, 1.902557373046875, 2.01123046875, 2.119903564453125, 2.22857666015625, 2.337249755859375, 2.4459228515625, 2.554595947265625, 2.66326904296875, 2.771942138671875, 2.880615234375, 2.989288330078125, 3.09796142578125, 3.206634521484375, 3.3153076171875, 3.423980712890625, 3.53265380859375, 3.641326904296875, 3.75]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 6.0, 6.0, 8.0, 5.0, 7.0, 7.0, 7.0, 7.0, 13.0, 15.0, 15.0, 11.0, 20.0, 20.0, 26.0, 28.0, 16.0, 28.0, 23.0, 31.0, 41.0, 36.0, 45.0, 35.0, 42.0, 31.0, 34.0, 28.0, 37.0, 40.0, 33.0, 33.0, 37.0, 21.0, 26.0, 25.0, 21.0, 16.0, 21.0, 10.0, 15.0, 20.0, 10.0, 13.0, 2.0, 5.0, 7.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0], "bins": [-2.427734375, -2.35308837890625, -2.2784423828125, -2.20379638671875, -2.129150390625, -2.05450439453125, -1.9798583984375, -1.90521240234375, -1.83056640625, -1.75592041015625, -1.6812744140625, -1.60662841796875, -1.531982421875, -1.45733642578125, -1.3826904296875, -1.30804443359375, -1.2333984375, -1.15875244140625, -1.0841064453125, -1.00946044921875, -0.934814453125, -0.86016845703125, -0.7855224609375, -0.71087646484375, -0.63623046875, -0.56158447265625, -0.4869384765625, -0.41229248046875, -0.337646484375, -0.26300048828125, -0.1883544921875, -0.11370849609375, -0.0390625, 0.03558349609375, 0.1102294921875, 0.18487548828125, 0.259521484375, 0.33416748046875, 0.4088134765625, 0.48345947265625, 0.55810546875, 0.63275146484375, 0.7073974609375, 0.78204345703125, 0.856689453125, 0.93133544921875, 1.0059814453125, 1.08062744140625, 1.1552734375, 1.22991943359375, 1.3045654296875, 1.37921142578125, 1.453857421875, 1.52850341796875, 1.6031494140625, 1.67779541015625, 1.75244140625, 1.82708740234375, 1.9017333984375, 1.97637939453125, 2.051025390625, 2.12567138671875, 2.2003173828125, 2.27496337890625, 2.349609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 2.0, 4.0, 8.0, 8.0, 18.0, 28.0, 40.0, 70.0, 95.0, 161.0, 214.0, 344.0, 571.0, 926.0, 1494.0, 2747.0, 5382.0, 11456.0, 27350.0, 68521.0, 164436.0, 291524.0, 257670.0, 125349.0, 50556.0, 20461.0, 9123.0, 4319.0, 2230.0, 1293.0, 757.0, 492.0, 315.0, 212.0, 137.0, 84.0, 56.0, 25.0, 23.0, 15.0, 6.0, 11.0, 7.0, 2.0, 5.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.8037109375, -1.7470550537109375, -1.690399169921875, -1.6337432861328125, -1.57708740234375, -1.5204315185546875, -1.463775634765625, -1.4071197509765625, -1.3504638671875, -1.2938079833984375, -1.237152099609375, -1.1804962158203125, -1.12384033203125, -1.0671844482421875, -1.010528564453125, -0.9538726806640625, -0.897216796875, -0.8405609130859375, -0.783905029296875, -0.7272491455078125, -0.67059326171875, -0.6139373779296875, -0.557281494140625, -0.5006256103515625, -0.4439697265625, -0.3873138427734375, -0.330657958984375, -0.2740020751953125, -0.21734619140625, -0.1606903076171875, -0.104034423828125, -0.0473785400390625, 0.00927734375, 0.0659332275390625, 0.122589111328125, 0.1792449951171875, 0.23590087890625, 0.2925567626953125, 0.349212646484375, 0.4058685302734375, 0.4625244140625, 0.5191802978515625, 0.575836181640625, 0.6324920654296875, 0.68914794921875, 0.7458038330078125, 0.802459716796875, 0.8591156005859375, 0.915771484375, 0.9724273681640625, 1.029083251953125, 1.0857391357421875, 1.14239501953125, 1.1990509033203125, 1.255706787109375, 1.3123626708984375, 1.3690185546875, 1.4256744384765625, 1.482330322265625, 1.5389862060546875, 1.59564208984375, 1.6522979736328125, 1.708953857421875, 1.7656097412109375, 1.822265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 12.0, 17.0, 16.0, 27.0, 27.0, 47.0, 61.0, 85.0, 95.0, 91.0, 104.0, 99.0, 96.0, 62.0, 42.0, 32.0, 22.0, 14.0, 12.0, 10.0, 6.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011849403381347656, -0.00011481065303087234, -0.00011112727224826813, -0.00010744389146566391, -0.00010376051068305969, -0.00010007712990045547, -9.639374911785126e-05, -9.271036833524704e-05, -8.902698755264282e-05, -8.53436067700386e-05, -8.166022598743439e-05, -7.797684520483017e-05, -7.429346442222595e-05, -7.061008363962173e-05, -6.692670285701752e-05, -6.32433220744133e-05, -5.955994129180908e-05, -5.5876560509204865e-05, -5.219317972660065e-05, -4.850979894399643e-05, -4.482641816139221e-05, -4.1143037378787994e-05, -3.745965659618378e-05, -3.377627581357956e-05, -3.0092895030975342e-05, -2.6409514248371124e-05, -2.2726133465766907e-05, -1.904275268316269e-05, -1.535937190055847e-05, -1.1675991117954254e-05, -7.992610335350037e-06, -4.309229552745819e-06, -6.258487701416016e-07, 3.057532012462616e-06, 6.7409127950668335e-06, 1.0424293577671051e-05, 1.4107674360275269e-05, 1.7791055142879486e-05, 2.1474435925483704e-05, 2.515781670808792e-05, 2.884119749069214e-05, 3.2524578273296356e-05, 3.6207959055900574e-05, 3.989133983850479e-05, 4.357472062110901e-05, 4.7258101403713226e-05, 5.0941482186317444e-05, 5.462486296892166e-05, 5.830824375152588e-05, 6.19916245341301e-05, 6.567500531673431e-05, 6.935838609933853e-05, 7.304176688194275e-05, 7.672514766454697e-05, 8.040852844715118e-05, 8.40919092297554e-05, 8.777529001235962e-05, 9.145867079496384e-05, 9.514205157756805e-05, 9.882543236017227e-05, 0.00010250881314277649, 0.00010619219392538071, 0.00010987557470798492, 0.00011355895549058914, 0.00011724233627319336]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 10.0, 11.0, 19.0, 26.0, 31.0, 51.0, 63.0, 83.0, 124.0, 169.0, 259.0, 367.0, 508.0, 817.0, 1248.0, 2045.0, 3318.0, 6115.0, 11136.0, 21713.0, 42376.0, 82545.0, 141693.0, 197727.0, 201668.0, 149195.0, 87615.0, 46095.0, 23232.0, 12096.0, 6442.0, 3581.0, 2188.0, 1304.0, 830.0, 536.0, 380.0, 235.0, 181.0, 129.0, 100.0, 78.0, 46.0, 55.0, 24.0, 16.0, 20.0, 17.0, 8.0, 8.0, 5.0, 2.0, 2.0, 2.0, 4.0], "bins": [-1.4833984375, -1.4385223388671875, -1.393646240234375, -1.3487701416015625, -1.30389404296875, -1.2590179443359375, -1.214141845703125, -1.1692657470703125, -1.1243896484375, -1.0795135498046875, -1.034637451171875, -0.9897613525390625, -0.94488525390625, -0.9000091552734375, -0.855133056640625, -0.8102569580078125, -0.765380859375, -0.7205047607421875, -0.675628662109375, -0.6307525634765625, -0.58587646484375, -0.5410003662109375, -0.496124267578125, -0.4512481689453125, -0.4063720703125, -0.3614959716796875, -0.316619873046875, -0.2717437744140625, -0.22686767578125, -0.1819915771484375, -0.137115478515625, -0.0922393798828125, -0.04736328125, -0.0024871826171875, 0.042388916015625, 0.0872650146484375, 0.13214111328125, 0.1770172119140625, 0.221893310546875, 0.2667694091796875, 0.3116455078125, 0.3565216064453125, 0.401397705078125, 0.4462738037109375, 0.49114990234375, 0.5360260009765625, 0.580902099609375, 0.6257781982421875, 0.670654296875, 0.7155303955078125, 0.760406494140625, 0.8052825927734375, 0.85015869140625, 0.8950347900390625, 0.939910888671875, 0.9847869873046875, 1.0296630859375, 1.0745391845703125, 1.119415283203125, 1.1642913818359375, 1.20916748046875, 1.2540435791015625, 1.298919677734375, 1.3437957763671875, 1.388671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 6.0, 9.0, 12.0, 12.0, 18.0, 26.0, 30.0, 32.0, 50.0, 49.0, 55.0, 63.0, 64.0, 75.0, 62.0, 65.0, 52.0, 64.0, 39.0, 45.0, 38.0, 33.0, 20.0, 22.0, 16.0, 11.0, 13.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.57763671875, -0.5591812133789062, -0.5407257080078125, -0.5222702026367188, -0.503814697265625, -0.48535919189453125, -0.4669036865234375, -0.44844818115234375, -0.42999267578125, -0.41153717041015625, -0.3930816650390625, -0.37462615966796875, -0.356170654296875, -0.33771514892578125, -0.3192596435546875, -0.30080413818359375, -0.2823486328125, -0.26389312744140625, -0.2454376220703125, -0.22698211669921875, -0.208526611328125, -0.19007110595703125, -0.1716156005859375, -0.15316009521484375, -0.13470458984375, -0.11624908447265625, -0.0977935791015625, -0.07933807373046875, -0.060882568359375, -0.04242706298828125, -0.0239715576171875, -0.00551605224609375, 0.012939453125, 0.03139495849609375, 0.0498504638671875, 0.06830596923828125, 0.086761474609375, 0.10521697998046875, 0.1236724853515625, 0.14212799072265625, 0.16058349609375, 0.17903900146484375, 0.1974945068359375, 0.21595001220703125, 0.234405517578125, 0.25286102294921875, 0.2713165283203125, 0.28977203369140625, 0.3082275390625, 0.32668304443359375, 0.3451385498046875, 0.36359405517578125, 0.382049560546875, 0.40050506591796875, 0.4189605712890625, 0.43741607666015625, 0.45587158203125, 0.47432708740234375, 0.4927825927734375, 0.5112380981445312, 0.529693603515625, 0.5481491088867188, 0.5666046142578125, 0.5850601196289062, 0.603515625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 9.0, 6.0, 6.0, 7.0, 6.0, 12.0, 14.0, 19.0, 16.0, 24.0, 37.0, 45.0, 36.0, 40.0, 49.0, 56.0, 45.0, 52.0, 44.0, 53.0, 45.0, 48.0, 48.0, 34.0, 30.0, 35.0, 28.0, 23.0, 27.0, 15.0, 15.0, 18.0, 18.0, 7.0, 7.0, 12.0, 5.0, 6.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8300344944000244, -3.6761722564697266, -3.5223100185394287, -3.368447780609131, -3.214585542678833, -3.060723304748535, -2.9068610668182373, -2.7529988288879395, -2.5991365909576416, -2.4452743530273438, -2.291412115097046, -2.137549877166748, -1.9836876392364502, -1.8298254013061523, -1.6759631633758545, -1.5221009254455566, -1.3682386875152588, -1.214376449584961, -1.060514211654663, -0.9066519737243652, -0.7527897357940674, -0.5989274978637695, -0.4450652599334717, -0.29120302200317383, -0.13734078407287598, 0.016521453857421875, 0.17038369178771973, 0.3242459297180176, 0.47810816764831543, 0.6319704055786133, 0.7858326435089111, 0.939694881439209, 1.0935568809509277, 1.2474191188812256, 1.4012813568115234, 1.5551435947418213, 1.7090058326721191, 1.862868070602417, 2.016730308532715, 2.1705925464630127, 2.3244547843933105, 2.4783170223236084, 2.6321792602539062, 2.786041498184204, 2.939903736114502, 3.0937659740448, 3.2476282119750977, 3.4014904499053955, 3.5553526878356934, 3.709214925765991, 3.863077163696289, 4.016939163208008, 4.170801639556885, 4.324664115905762, 4.4785261154174805, 4.632388114929199, 4.786250591278076, 4.940113067626953, 5.093975067138672, 5.247837066650391, 5.401699542999268, 5.5555620193481445, 5.709424018859863, 5.863286018371582, 6.017148494720459]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 6.0, 17.0, 14.0, 9.0, 13.0, 13.0, 15.0, 26.0, 29.0, 24.0, 40.0, 34.0, 42.0, 44.0, 38.0, 42.0, 40.0, 49.0, 43.0, 46.0, 41.0, 42.0, 33.0, 36.0, 39.0, 42.0, 26.0, 35.0, 19.0, 21.0, 11.0, 12.0, 13.0, 14.0, 4.0, 7.0, 6.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.693100452423096, -4.554470539093018, -4.415841102600098, -4.2772111892700195, -4.138581275939941, -3.9999513626098633, -3.8613216876983643, -3.7226920127868652, -3.584062099456787, -3.445432186126709, -3.30680251121521, -3.168172836303711, -3.029542922973633, -2.8909130096435547, -2.7522833347320557, -2.6136536598205566, -2.4750237464904785, -2.3363938331604004, -2.1977641582489014, -2.0591344833374023, -1.9205045700073242, -1.7818747758865356, -1.643244981765747, -1.5046151876449585, -1.36598539352417, -1.2273555994033813, -1.0887258052825928, -0.9500960111618042, -0.8114662170410156, -0.672836422920227, -0.5342066287994385, -0.3955768346786499, -0.2569465637207031, -0.11831676959991455, 0.020313024520874023, 0.1589428186416626, 0.29757261276245117, 0.43620240688323975, 0.5748322010040283, 0.7134619951248169, 0.8520917892456055, 0.990721583366394, 1.1293513774871826, 1.2679811716079712, 1.4066109657287598, 1.5452407598495483, 1.683870553970337, 1.8225003480911255, 1.961130142211914, 2.099760055541992, 2.238389730453491, 2.3770194053649902, 2.5156493186950684, 2.6542792320251465, 2.7929089069366455, 2.9315385818481445, 3.0701684951782227, 3.208798408508301, 3.3474280834198, 3.486057758331299, 3.624687671661377, 3.763317584991455, 3.901947259902954, 4.040576934814453, 4.179206848144531]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 7.0, 9.0, 23.0, 19.0, 50.0, 81.0, 116.0, 213.0, 305.0, 526.0, 836.0, 1420.0, 2224.0, 3586.0, 5760.0, 8990.0, 13599.0, 20316.0, 28876.0, 41108.0, 54991.0, 70442.0, 85074.0, 95570.0, 102226.0, 101868.0, 94218.0, 81224.0, 66611.0, 51577.0, 37959.0, 26848.0, 18426.0, 12125.0, 7951.0, 5062.0, 3232.0, 1955.0, 1207.0, 752.0, 457.0, 286.0, 167.0, 105.0, 63.0, 36.0, 26.0, 25.0, 7.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.28125, -2.207366943359375, -2.13348388671875, -2.059600830078125, -1.9857177734375, -1.911834716796875, -1.83795166015625, -1.764068603515625, -1.690185546875, -1.616302490234375, -1.54241943359375, -1.468536376953125, -1.3946533203125, -1.320770263671875, -1.24688720703125, -1.173004150390625, -1.09912109375, -1.025238037109375, -0.95135498046875, -0.877471923828125, -0.8035888671875, -0.729705810546875, -0.65582275390625, -0.581939697265625, -0.508056640625, -0.434173583984375, -0.36029052734375, -0.286407470703125, -0.2125244140625, -0.138641357421875, -0.06475830078125, 0.009124755859375, 0.0830078125, 0.156890869140625, 0.23077392578125, 0.304656982421875, 0.3785400390625, 0.452423095703125, 0.52630615234375, 0.600189208984375, 0.674072265625, 0.747955322265625, 0.82183837890625, 0.895721435546875, 0.9696044921875, 1.043487548828125, 1.11737060546875, 1.191253662109375, 1.26513671875, 1.339019775390625, 1.41290283203125, 1.486785888671875, 1.5606689453125, 1.634552001953125, 1.70843505859375, 1.782318115234375, 1.856201171875, 1.930084228515625, 2.00396728515625, 2.077850341796875, 2.1517333984375, 2.225616455078125, 2.29949951171875, 2.373382568359375, 2.447265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 8.0, 7.0, 8.0, 18.0, 15.0, 14.0, 15.0, 16.0, 31.0, 32.0, 26.0, 33.0, 32.0, 26.0, 50.0, 41.0, 35.0, 33.0, 53.0, 41.0, 45.0, 45.0, 34.0, 39.0, 47.0, 34.0, 27.0, 31.0, 31.0, 18.0, 16.0, 17.0, 10.0, 8.0, 13.0, 12.0, 10.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.7265625, -4.5899658203125, -4.453369140625, -4.3167724609375, -4.18017578125, -4.0435791015625, -3.906982421875, -3.7703857421875, -3.6337890625, -3.4971923828125, -3.360595703125, -3.2239990234375, -3.08740234375, -2.9508056640625, -2.814208984375, -2.6776123046875, -2.541015625, -2.4044189453125, -2.267822265625, -2.1312255859375, -1.99462890625, -1.8580322265625, -1.721435546875, -1.5848388671875, -1.4482421875, -1.3116455078125, -1.175048828125, -1.0384521484375, -0.90185546875, -0.7652587890625, -0.628662109375, -0.4920654296875, -0.35546875, -0.2188720703125, -0.082275390625, 0.0543212890625, 0.19091796875, 0.3275146484375, 0.464111328125, 0.6007080078125, 0.7373046875, 0.8739013671875, 1.010498046875, 1.1470947265625, 1.28369140625, 1.4202880859375, 1.556884765625, 1.6934814453125, 1.830078125, 1.9666748046875, 2.103271484375, 2.2398681640625, 2.37646484375, 2.5130615234375, 2.649658203125, 2.7862548828125, 2.9228515625, 3.0594482421875, 3.196044921875, 3.3326416015625, 3.46923828125, 3.6058349609375, 3.742431640625, 3.8790283203125, 4.015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 10.0, 5.0, 7.0, 17.0, 35.0, 68.0, 84.0, 160.0, 241.0, 403.0, 621.0, 1101.0, 1771.0, 2913.0, 4641.0, 7568.0, 12345.0, 18914.0, 28836.0, 43107.0, 60437.0, 79550.0, 97691.0, 110491.0, 116112.0, 110055.0, 95956.0, 77942.0, 58437.0, 41627.0, 28602.0, 18153.0, 11749.0, 7437.0, 4514.0, 2719.0, 1650.0, 1057.0, 597.0, 349.0, 221.0, 141.0, 98.0, 46.0, 26.0, 23.0, 15.0, 9.0, 0.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.869140625, -2.78338623046875, -2.6976318359375, -2.61187744140625, -2.526123046875, -2.44036865234375, -2.3546142578125, -2.26885986328125, -2.18310546875, -2.09735107421875, -2.0115966796875, -1.92584228515625, -1.840087890625, -1.75433349609375, -1.6685791015625, -1.58282470703125, -1.4970703125, -1.41131591796875, -1.3255615234375, -1.23980712890625, -1.154052734375, -1.06829833984375, -0.9825439453125, -0.89678955078125, -0.81103515625, -0.72528076171875, -0.6395263671875, -0.55377197265625, -0.468017578125, -0.38226318359375, -0.2965087890625, -0.21075439453125, -0.125, -0.03924560546875, 0.0465087890625, 0.13226318359375, 0.218017578125, 0.30377197265625, 0.3895263671875, 0.47528076171875, 0.56103515625, 0.64678955078125, 0.7325439453125, 0.81829833984375, 0.904052734375, 0.98980712890625, 1.0755615234375, 1.16131591796875, 1.2470703125, 1.33282470703125, 1.4185791015625, 1.50433349609375, 1.590087890625, 1.67584228515625, 1.7615966796875, 1.84735107421875, 1.93310546875, 2.01885986328125, 2.1046142578125, 2.19036865234375, 2.276123046875, 2.36187744140625, 2.4476318359375, 2.53338623046875, 2.619140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 4.0, 9.0, 5.0, 6.0, 13.0, 7.0, 9.0, 24.0, 16.0, 21.0, 22.0, 20.0, 28.0, 25.0, 35.0, 40.0, 36.0, 35.0, 35.0, 56.0, 32.0, 36.0, 33.0, 41.0, 44.0, 49.0, 33.0, 33.0, 25.0, 34.0, 18.0, 24.0, 19.0, 20.0, 12.0, 14.0, 20.0, 8.0, 12.0, 10.0, 5.0, 3.0, 7.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.396484375, -2.315887451171875, -2.23529052734375, -2.154693603515625, -2.0740966796875, -1.993499755859375, -1.91290283203125, -1.832305908203125, -1.751708984375, -1.671112060546875, -1.59051513671875, -1.509918212890625, -1.4293212890625, -1.348724365234375, -1.26812744140625, -1.187530517578125, -1.10693359375, -1.026336669921875, -0.94573974609375, -0.865142822265625, -0.7845458984375, -0.703948974609375, -0.62335205078125, -0.542755126953125, -0.462158203125, -0.381561279296875, -0.30096435546875, -0.220367431640625, -0.1397705078125, -0.059173583984375, 0.02142333984375, 0.102020263671875, 0.1826171875, 0.263214111328125, 0.34381103515625, 0.424407958984375, 0.5050048828125, 0.585601806640625, 0.66619873046875, 0.746795654296875, 0.827392578125, 0.907989501953125, 0.98858642578125, 1.069183349609375, 1.1497802734375, 1.230377197265625, 1.31097412109375, 1.391571044921875, 1.47216796875, 1.552764892578125, 1.63336181640625, 1.713958740234375, 1.7945556640625, 1.875152587890625, 1.95574951171875, 2.036346435546875, 2.116943359375, 2.197540283203125, 2.27813720703125, 2.358734130859375, 2.4393310546875, 2.519927978515625, 2.60052490234375, 2.681121826171875, 2.76171875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 8.0, 13.0, 15.0, 24.0, 24.0, 55.0, 74.0, 121.0, 196.0, 296.0, 456.0, 732.0, 1081.0, 1673.0, 2706.0, 4385.0, 6864.0, 10739.0, 16861.0, 25643.0, 38210.0, 55121.0, 73469.0, 92344.0, 108591.0, 114844.0, 112847.0, 100837.0, 82277.0, 63267.0, 45762.0, 31474.0, 20891.0, 13346.0, 8579.0, 5379.0, 3289.0, 2156.0, 1363.0, 918.0, 562.0, 394.0, 241.0, 142.0, 97.0, 65.0, 44.0, 30.0, 18.0, 12.0, 6.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-1.01171875, -0.9798431396484375, -0.947967529296875, -0.9160919189453125, -0.88421630859375, -0.8523406982421875, -0.820465087890625, -0.7885894775390625, -0.7567138671875, -0.7248382568359375, -0.692962646484375, -0.6610870361328125, -0.62921142578125, -0.5973358154296875, -0.565460205078125, -0.5335845947265625, -0.501708984375, -0.4698333740234375, -0.437957763671875, -0.4060821533203125, -0.37420654296875, -0.3423309326171875, -0.310455322265625, -0.2785797119140625, -0.2467041015625, -0.2148284912109375, -0.182952880859375, -0.1510772705078125, -0.11920166015625, -0.0873260498046875, -0.055450439453125, -0.0235748291015625, 0.00830078125, 0.0401763916015625, 0.072052001953125, 0.1039276123046875, 0.13580322265625, 0.1676788330078125, 0.199554443359375, 0.2314300537109375, 0.2633056640625, 0.2951812744140625, 0.327056884765625, 0.3589324951171875, 0.39080810546875, 0.4226837158203125, 0.454559326171875, 0.4864349365234375, 0.518310546875, 0.5501861572265625, 0.582061767578125, 0.6139373779296875, 0.64581298828125, 0.6776885986328125, 0.709564208984375, 0.7414398193359375, 0.7733154296875, 0.8051910400390625, 0.837066650390625, 0.8689422607421875, 0.90081787109375, 0.9326934814453125, 0.964569091796875, 0.9964447021484375, 1.0283203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 4.0, 7.0, 13.0, 18.0, 18.0, 23.0, 21.0, 30.0, 38.0, 40.0, 40.0, 55.0, 58.0, 58.0, 46.0, 58.0, 57.0, 57.0, 67.0, 38.0, 46.0, 34.0, 33.0, 31.0, 24.0, 20.0, 12.0, 9.0, 16.0, 7.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0001533031463623047, -0.0001485198736190796, -0.0001437366008758545, -0.0001389533281326294, -0.0001341700553894043, -0.0001293867826461792, -0.0001246035099029541, -0.000119820237159729, -0.0001150369644165039, -0.00011025369167327881, -0.00010547041893005371, -0.00010068714618682861, -9.590387344360352e-05, -9.112060070037842e-05, -8.633732795715332e-05, -8.155405521392822e-05, -7.677078247070312e-05, -7.198750972747803e-05, -6.720423698425293e-05, -6.242096424102783e-05, -5.7637691497802734e-05, -5.285441875457764e-05, -4.807114601135254e-05, -4.328787326812744e-05, -3.8504600524902344e-05, -3.3721327781677246e-05, -2.893805503845215e-05, -2.415478229522705e-05, -1.9371509552001953e-05, -1.4588236808776855e-05, -9.804964065551758e-06, -5.02169132232666e-06, -2.384185791015625e-07, 4.544854164123535e-06, 9.328126907348633e-06, 1.411139965057373e-05, 1.8894672393798828e-05, 2.3677945137023926e-05, 2.8461217880249023e-05, 3.324449062347412e-05, 3.802776336669922e-05, 4.2811036109924316e-05, 4.7594308853149414e-05, 5.237758159637451e-05, 5.716085433959961e-05, 6.194412708282471e-05, 6.67273998260498e-05, 7.15106725692749e-05, 7.62939453125e-05, 8.10772180557251e-05, 8.58604907989502e-05, 9.064376354217529e-05, 9.542703628540039e-05, 0.00010021030902862549, 0.00010499358177185059, 0.00010977685451507568, 0.00011456012725830078, 0.00011934340000152588, 0.00012412667274475098, 0.00012890994548797607, 0.00013369321823120117, 0.00013847649097442627, 0.00014325976371765137, 0.00014804303646087646, 0.00015282630920410156]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 9.0, 10.0, 25.0, 28.0, 50.0, 99.0, 142.0, 282.0, 401.0, 802.0, 1334.0, 2427.0, 4156.0, 7209.0, 12516.0, 21330.0, 35025.0, 54895.0, 80102.0, 106861.0, 128442.0, 136169.0, 127560.0, 107072.0, 79891.0, 55004.0, 35192.0, 21829.0, 12659.0, 7526.0, 4039.0, 2401.0, 1349.0, 748.0, 403.0, 249.0, 112.0, 89.0, 57.0, 33.0, 11.0, 6.0, 7.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2919921875, -1.2522430419921875, -1.212493896484375, -1.1727447509765625, -1.13299560546875, -1.0932464599609375, -1.053497314453125, -1.0137481689453125, -0.9739990234375, -0.9342498779296875, -0.894500732421875, -0.8547515869140625, -0.81500244140625, -0.7752532958984375, -0.735504150390625, -0.6957550048828125, -0.656005859375, -0.6162567138671875, -0.576507568359375, -0.5367584228515625, -0.49700927734375, -0.4572601318359375, -0.417510986328125, -0.3777618408203125, -0.3380126953125, -0.2982635498046875, -0.258514404296875, -0.2187652587890625, -0.17901611328125, -0.1392669677734375, -0.099517822265625, -0.0597686767578125, -0.02001953125, 0.0197296142578125, 0.059478759765625, 0.0992279052734375, 0.13897705078125, 0.1787261962890625, 0.218475341796875, 0.2582244873046875, 0.2979736328125, 0.3377227783203125, 0.377471923828125, 0.4172210693359375, 0.45697021484375, 0.4967193603515625, 0.536468505859375, 0.5762176513671875, 0.615966796875, 0.6557159423828125, 0.695465087890625, 0.7352142333984375, 0.77496337890625, 0.8147125244140625, 0.854461669921875, 0.8942108154296875, 0.9339599609375, 0.9737091064453125, 1.013458251953125, 1.0532073974609375, 1.09295654296875, 1.1327056884765625, 1.172454833984375, 1.2122039794921875, 1.251953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 4.0, 5.0, 5.0, 8.0, 8.0, 12.0, 14.0, 12.0, 30.0, 19.0, 15.0, 27.0, 31.0, 27.0, 31.0, 27.0, 42.0, 43.0, 47.0, 40.0, 60.0, 43.0, 38.0, 38.0, 46.0, 41.0, 42.0, 41.0, 28.0, 27.0, 21.0, 19.0, 16.0, 26.0, 14.0, 10.0, 15.0, 5.0, 2.0, 2.0, 5.0, 6.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.43505859375, -0.42176055908203125, -0.4084625244140625, -0.39516448974609375, -0.381866455078125, -0.36856842041015625, -0.3552703857421875, -0.34197235107421875, -0.32867431640625, -0.31537628173828125, -0.3020782470703125, -0.28878021240234375, -0.275482177734375, -0.26218414306640625, -0.2488861083984375, -0.23558807373046875, -0.2222900390625, -0.20899200439453125, -0.1956939697265625, -0.18239593505859375, -0.169097900390625, -0.15579986572265625, -0.1425018310546875, -0.12920379638671875, -0.11590576171875, -0.10260772705078125, -0.0893096923828125, -0.07601165771484375, -0.062713623046875, -0.04941558837890625, -0.0361175537109375, -0.02281951904296875, -0.009521484375, 0.00377655029296875, 0.0170745849609375, 0.03037261962890625, 0.043670654296875, 0.05696868896484375, 0.0702667236328125, 0.08356475830078125, 0.09686279296875, 0.11016082763671875, 0.1234588623046875, 0.13675689697265625, 0.150054931640625, 0.16335296630859375, 0.1766510009765625, 0.18994903564453125, 0.2032470703125, 0.21654510498046875, 0.2298431396484375, 0.24314117431640625, 0.256439208984375, 0.26973724365234375, 0.2830352783203125, 0.29633331298828125, 0.30963134765625, 0.32292938232421875, 0.3362274169921875, 0.34952545166015625, 0.362823486328125, 0.37612152099609375, 0.3894195556640625, 0.40271759033203125, 0.416015625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 10.0, 13.0, 14.0, 19.0, 19.0, 20.0, 26.0, 34.0, 38.0, 40.0, 40.0, 50.0, 52.0, 44.0, 53.0, 64.0, 43.0, 49.0, 42.0, 38.0, 43.0, 29.0, 34.0, 40.0, 22.0, 18.0, 15.0, 14.0, 17.0, 11.0, 14.0, 4.0, 7.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.030482769012451, -3.872673511505127, -3.7148642539978027, -3.5570549964904785, -3.3992457389831543, -3.24143648147583, -3.0836269855499268, -2.9258177280426025, -2.7680084705352783, -2.610199213027954, -2.45238995552063, -2.2945806980133057, -2.1367712020874023, -1.9789620637893677, -1.821152687072754, -1.6633434295654297, -1.5055341720581055, -1.3477249145507812, -1.189915657043457, -1.0321062803268433, -0.874297022819519, -0.7164877653121948, -0.5586784482002258, -0.40086913108825684, -0.24305987358093262, -0.08525058627128601, 0.0725587010383606, 0.2303679883480072, 0.3881772756576538, 0.545986533164978, 0.703795850276947, 0.861605167388916, 1.0194144248962402, 1.1772236824035645, 1.3350329399108887, 1.4928423166275024, 1.6506515741348267, 1.8084608316421509, 1.9662702083587646, 2.124079465866089, 2.281888723373413, 2.4396979808807373, 2.5975072383880615, 2.7553164958953857, 2.913125991821289, 3.0709352493286133, 3.2287445068359375, 3.3865537643432617, 3.544363021850586, 3.70217227935791, 3.8599815368652344, 4.017790794372559, 4.175600051879883, 4.333409309387207, 4.491218566894531, 4.6490278244018555, 4.80683708190918, 4.964646339416504, 5.122455596923828, 5.280264854431152, 5.438074111938477, 5.595883369445801, 5.753692626953125, 5.911501884460449, 6.069311618804932]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 9.0, 2.0, 0.0, 5.0, 10.0, 14.0, 20.0, 13.0, 15.0, 20.0, 16.0, 16.0, 21.0, 24.0, 18.0, 25.0, 31.0, 41.0, 36.0, 42.0, 33.0, 34.0, 41.0, 33.0, 32.0, 29.0, 42.0, 33.0, 51.0, 35.0, 28.0, 42.0, 23.0, 31.0, 26.0, 17.0, 15.0, 7.0, 13.0, 11.0, 9.0, 13.0, 8.0, 5.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-4.3107404708862305, -4.184695243835449, -4.058650016784668, -3.932605028152466, -3.8065598011016846, -3.6805145740509033, -3.554469585418701, -3.42842435836792, -3.3023791313171387, -3.1763339042663574, -3.050288677215576, -2.924243688583374, -2.7981984615325928, -2.6721532344818115, -2.5461082458496094, -2.420063018798828, -2.294017791748047, -2.1679725646972656, -2.0419273376464844, -1.9158823490142822, -1.789837121963501, -1.6637918949127197, -1.537746787071228, -1.4117016792297363, -1.285656452178955, -1.1596112251281738, -1.0335661172866821, -0.9075209498405457, -0.7814757823944092, -0.6554306149482727, -0.5293854475021362, -0.40334028005599976, -0.2772953510284424, -0.1512501835823059, -0.025205016136169434, 0.10084015130996704, 0.22688531875610352, 0.35293048620224, 0.47897565364837646, 0.6050208210945129, 0.7310659885406494, 0.8571111559867859, 0.9831563234329224, 1.109201431274414, 1.2352466583251953, 1.3612918853759766, 1.4873369932174683, 1.61338210105896, 1.7394273281097412, 1.8654725551605225, 1.9915176630020142, 2.117562770843506, 2.243607997894287, 2.3696532249450684, 2.4956984519958496, 2.6217434406280518, 2.747788667678833, 2.8738338947296143, 2.9998788833618164, 3.1259241104125977, 3.251969337463379, 3.37801456451416, 3.5040597915649414, 3.6301047801971436, 3.756150007247925]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 9.0, 4.0, 11.0, 18.0, 28.0, 38.0, 50.0, 96.0, 142.0, 231.0, 395.0, 669.0, 1074.0, 1636.0, 2728.0, 4677.0, 7543.0, 12693.0, 21233.0, 35222.0, 58841.0, 98277.0, 159509.0, 251115.0, 370300.0, 493809.0, 578226.0, 577949.0, 493617.0, 369503.0, 249829.0, 159992.0, 97994.0, 58546.0, 35379.0, 21226.0, 12585.0, 7584.0, 4546.0, 2707.0, 1609.0, 1037.0, 630.0, 394.0, 237.0, 129.0, 81.0, 63.0, 33.0, 13.0, 8.0, 10.0, 7.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4296875, -3.31536865234375, -3.2010498046875, -3.08673095703125, -2.972412109375, -2.85809326171875, -2.7437744140625, -2.62945556640625, -2.51513671875, -2.40081787109375, -2.2864990234375, -2.17218017578125, -2.057861328125, -1.94354248046875, -1.8292236328125, -1.71490478515625, -1.6005859375, -1.48626708984375, -1.3719482421875, -1.25762939453125, -1.143310546875, -1.02899169921875, -0.9146728515625, -0.80035400390625, -0.68603515625, -0.57171630859375, -0.4573974609375, -0.34307861328125, -0.228759765625, -0.11444091796875, -0.0001220703125, 0.11419677734375, 0.228515625, 0.34283447265625, 0.4571533203125, 0.57147216796875, 0.685791015625, 0.80010986328125, 0.9144287109375, 1.02874755859375, 1.14306640625, 1.25738525390625, 1.3717041015625, 1.48602294921875, 1.600341796875, 1.71466064453125, 1.8289794921875, 1.94329833984375, 2.0576171875, 2.17193603515625, 2.2862548828125, 2.40057373046875, 2.514892578125, 2.62921142578125, 2.7435302734375, 2.85784912109375, 2.97216796875, 3.08648681640625, 3.2008056640625, 3.31512451171875, 3.429443359375, 3.54376220703125, 3.6580810546875, 3.77239990234375, 3.88671875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 9.0, 14.0, 12.0, 16.0, 19.0, 13.0, 17.0, 22.0, 22.0, 24.0, 22.0, 27.0, 34.0, 38.0, 42.0, 38.0, 41.0, 31.0, 47.0, 42.0, 46.0, 35.0, 33.0, 30.0, 40.0, 47.0, 22.0, 29.0, 31.0, 17.0, 16.0, 17.0, 19.0, 9.0, 14.0, 8.0, 8.0, 7.0, 7.0, 2.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.666015625, -3.55645751953125, -3.4468994140625, -3.33734130859375, -3.227783203125, -3.11822509765625, -3.0086669921875, -2.89910888671875, -2.78955078125, -2.67999267578125, -2.5704345703125, -2.46087646484375, -2.351318359375, -2.24176025390625, -2.1322021484375, -2.02264404296875, -1.9130859375, -1.80352783203125, -1.6939697265625, -1.58441162109375, -1.474853515625, -1.36529541015625, -1.2557373046875, -1.14617919921875, -1.03662109375, -0.92706298828125, -0.8175048828125, -0.70794677734375, -0.598388671875, -0.48883056640625, -0.3792724609375, -0.26971435546875, -0.16015625, -0.05059814453125, 0.0589599609375, 0.16851806640625, 0.278076171875, 0.38763427734375, 0.4971923828125, 0.60675048828125, 0.71630859375, 0.82586669921875, 0.9354248046875, 1.04498291015625, 1.154541015625, 1.26409912109375, 1.3736572265625, 1.48321533203125, 1.5927734375, 1.70233154296875, 1.8118896484375, 1.92144775390625, 2.031005859375, 2.14056396484375, 2.2501220703125, 2.35968017578125, 2.46923828125, 2.57879638671875, 2.6883544921875, 2.79791259765625, 2.907470703125, 3.01702880859375, 3.1265869140625, 3.23614501953125, 3.345703125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 10.0, 19.0, 37.0, 33.0, 98.0, 152.0, 243.0, 379.0, 636.0, 984.0, 1607.0, 2529.0, 4162.0, 6767.0, 11057.0, 17756.0, 28185.0, 44793.0, 70195.0, 107391.0, 160441.0, 230117.0, 314861.0, 401507.0, 467885.0, 492491.0, 463438.0, 394824.0, 307507.0, 223645.0, 154833.0, 103696.0, 67507.0, 42989.0, 27035.0, 16749.0, 10454.0, 6592.0, 4096.0, 2504.0, 1521.0, 975.0, 595.0, 425.0, 212.0, 151.0, 80.0, 45.0, 39.0, 10.0, 6.0, 8.0, 5.0, 3.0, 5.0, 1.0, 0.0, 2.0], "bins": [-3.5625, -3.449249267578125, -3.33599853515625, -3.222747802734375, -3.1094970703125, -2.996246337890625, -2.88299560546875, -2.769744873046875, -2.656494140625, -2.543243408203125, -2.42999267578125, -2.316741943359375, -2.2034912109375, -2.090240478515625, -1.97698974609375, -1.863739013671875, -1.75048828125, -1.637237548828125, -1.52398681640625, -1.410736083984375, -1.2974853515625, -1.184234619140625, -1.07098388671875, -0.957733154296875, -0.844482421875, -0.731231689453125, -0.61798095703125, -0.504730224609375, -0.3914794921875, -0.278228759765625, -0.16497802734375, -0.051727294921875, 0.0615234375, 0.174774169921875, 0.28802490234375, 0.401275634765625, 0.5145263671875, 0.627777099609375, 0.74102783203125, 0.854278564453125, 0.967529296875, 1.080780029296875, 1.19403076171875, 1.307281494140625, 1.4205322265625, 1.533782958984375, 1.64703369140625, 1.760284423828125, 1.87353515625, 1.986785888671875, 2.10003662109375, 2.213287353515625, 2.3265380859375, 2.439788818359375, 2.55303955078125, 2.666290283203125, 2.779541015625, 2.892791748046875, 3.00604248046875, 3.119293212890625, 3.2325439453125, 3.345794677734375, 3.45904541015625, 3.572296142578125, 3.685546875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 9.0, 7.0, 7.0, 16.0, 22.0, 34.0, 25.0, 38.0, 47.0, 59.0, 94.0, 103.0, 131.0, 122.0, 141.0, 164.0, 181.0, 210.0, 209.0, 243.0, 258.0, 224.0, 208.0, 222.0, 198.0, 186.0, 147.0, 132.0, 119.0, 109.0, 95.0, 75.0, 57.0, 43.0, 33.0, 28.0, 21.0, 13.0, 12.0, 10.0, 9.0, 1.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-2.095703125, -2.0382537841796875, -1.980804443359375, -1.9233551025390625, -1.86590576171875, -1.8084564208984375, -1.751007080078125, -1.6935577392578125, -1.6361083984375, -1.5786590576171875, -1.521209716796875, -1.4637603759765625, -1.40631103515625, -1.3488616943359375, -1.291412353515625, -1.2339630126953125, -1.176513671875, -1.1190643310546875, -1.061614990234375, -1.0041656494140625, -0.94671630859375, -0.8892669677734375, -0.831817626953125, -0.7743682861328125, -0.7169189453125, -0.6594696044921875, -0.602020263671875, -0.5445709228515625, -0.48712158203125, -0.4296722412109375, -0.372222900390625, -0.3147735595703125, -0.25732421875, -0.1998748779296875, -0.142425537109375, -0.0849761962890625, -0.02752685546875, 0.0299224853515625, 0.087371826171875, 0.1448211669921875, 0.2022705078125, 0.2597198486328125, 0.317169189453125, 0.3746185302734375, 0.43206787109375, 0.4895172119140625, 0.546966552734375, 0.6044158935546875, 0.661865234375, 0.7193145751953125, 0.776763916015625, 0.8342132568359375, 0.89166259765625, 0.9491119384765625, 1.006561279296875, 1.0640106201171875, 1.1214599609375, 1.1789093017578125, 1.236358642578125, 1.2938079833984375, 1.35125732421875, 1.4087066650390625, 1.466156005859375, 1.5236053466796875, 1.5810546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 3.0, 5.0, 15.0, 12.0, 10.0, 15.0, 8.0, 15.0, 21.0, 15.0, 24.0, 19.0, 31.0, 27.0, 38.0, 34.0, 49.0, 46.0, 43.0, 37.0, 42.0, 34.0, 54.0, 42.0, 44.0, 43.0, 46.0, 34.0, 30.0, 15.0, 19.0, 25.0, 15.0, 16.0, 10.0, 13.0, 11.0, 9.0, 4.0, 5.0, 6.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.802727460861206, -3.6600940227508545, -3.517460823059082, -3.3748273849487305, -3.232193946838379, -3.0895605087280273, -2.946927070617676, -2.8042938709259033, -2.6616604328155518, -2.5190269947052, -2.3763937950134277, -2.233760356903076, -2.0911269187927246, -1.948493480682373, -1.805860161781311, -1.663226842880249, -1.5205934047698975, -1.377959966659546, -1.2353266477584839, -1.0926933288574219, -0.9500598907470703, -0.8074265122413635, -0.6647931337356567, -0.52215975522995, -0.37952637672424316, -0.23689299821853638, -0.09425961971282959, 0.0483737587928772, 0.19100713729858398, 0.33364051580429077, 0.47627389430999756, 0.6189072728157043, 0.7615408897399902, 0.904174268245697, 1.0468076467514038, 1.1894409656524658, 1.3320744037628174, 1.474707841873169, 1.617341160774231, 1.759974479675293, 1.9026079177856445, 2.045241355895996, 2.1878747940063477, 2.33050799369812, 2.4731414318084717, 2.6157748699188232, 2.7584080696105957, 2.9010415077209473, 3.043674945831299, 3.1863083839416504, 3.328941822052002, 3.4715750217437744, 3.614208459854126, 3.7568418979644775, 3.89947509765625, 4.042108535766602, 4.184741973876953, 4.327375411987305, 4.470008850097656, 4.612642288208008, 4.755275726318359, 4.897908687591553, 5.040542125701904, 5.183175563812256, 5.325809001922607]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 4.0, 4.0, 2.0, 7.0, 1.0, 8.0, 11.0, 10.0, 14.0, 15.0, 18.0, 24.0, 29.0, 23.0, 38.0, 38.0, 38.0, 40.0, 33.0, 41.0, 43.0, 38.0, 47.0, 35.0, 38.0, 43.0, 51.0, 35.0, 40.0, 40.0, 27.0, 36.0, 17.0, 18.0, 19.0, 21.0, 13.0, 11.0, 9.0, 8.0, 8.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.571445465087891, -4.4310431480407715, -4.2906413078308105, -4.150238990783691, -4.0098371505737305, -3.8694348335266113, -3.7290327548980713, -3.5886306762695312, -3.448228359222412, -3.307826280593872, -3.167424201965332, -3.027021884918213, -2.886619806289673, -2.746217727661133, -2.6058156490325928, -2.4654135704040527, -2.3250114917755127, -2.1846094131469727, -2.0442073345184326, -1.903805136680603, -1.7634029388427734, -1.6230008602142334, -1.4825987815856934, -1.3421967029571533, -1.2017945051193237, -1.0613924264907837, -0.9209902286529541, -0.7805881500244141, -0.6401860117912292, -0.49978387355804443, -0.3593817949295044, -0.21897965669631958, -0.07857751846313477, 0.061824604868888855, 0.20222672820091248, 0.3426288366317749, 0.4830309748649597, 0.6234331130981445, 0.7638351917266846, 0.9042373299598694, 1.0446394681930542, 1.1850415468215942, 1.3254437446594238, 1.4658458232879639, 1.606247901916504, 1.7466500997543335, 1.8870521783828735, 2.027454376220703, 2.167856454849243, 2.308258533477783, 2.4486606121063232, 2.5890626907348633, 2.7294650077819824, 2.8698670864105225, 3.0102691650390625, 3.1506712436676025, 3.2910733222961426, 3.4314754009246826, 3.5718774795532227, 3.712279796600342, 3.852681875228882, 3.993083953857422, 4.133485794067383, 4.273888111114502, 4.414290428161621]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 3.0, 4.0, 7.0, 26.0, 33.0, 51.0, 77.0, 129.0, 210.0, 287.0, 498.0, 756.0, 1427.0, 2009.0, 3323.0, 5341.0, 8738.0, 13784.0, 21557.0, 33057.0, 49105.0, 69616.0, 92183.0, 113323.0, 123927.0, 121873.0, 107884.0, 87233.0, 64194.0, 45188.0, 30390.0, 19551.0, 12268.0, 7650.0, 4912.0, 3023.0, 1876.0, 1141.0, 698.0, 425.0, 290.0, 165.0, 105.0, 73.0, 44.0, 38.0, 24.0, 13.0, 13.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.572265625, -1.5258636474609375, -1.479461669921875, -1.4330596923828125, -1.38665771484375, -1.3402557373046875, -1.293853759765625, -1.2474517822265625, -1.2010498046875, -1.1546478271484375, -1.108245849609375, -1.0618438720703125, -1.01544189453125, -0.9690399169921875, -0.922637939453125, -0.8762359619140625, -0.829833984375, -0.7834320068359375, -0.737030029296875, -0.6906280517578125, -0.64422607421875, -0.5978240966796875, -0.551422119140625, -0.5050201416015625, -0.4586181640625, -0.4122161865234375, -0.365814208984375, -0.3194122314453125, -0.27301025390625, -0.2266082763671875, -0.180206298828125, -0.1338043212890625, -0.08740234375, -0.0410003662109375, 0.005401611328125, 0.0518035888671875, 0.09820556640625, 0.1446075439453125, 0.191009521484375, 0.2374114990234375, 0.2838134765625, 0.3302154541015625, 0.376617431640625, 0.4230194091796875, 0.46942138671875, 0.5158233642578125, 0.562225341796875, 0.6086273193359375, 0.655029296875, 0.7014312744140625, 0.747833251953125, 0.7942352294921875, 0.84063720703125, 0.8870391845703125, 0.933441162109375, 0.9798431396484375, 1.0262451171875, 1.0726470947265625, 1.119049072265625, 1.1654510498046875, 1.21185302734375, 1.2582550048828125, 1.304656982421875, 1.3510589599609375, 1.3974609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 10.0, 8.0, 4.0, 11.0, 9.0, 15.0, 17.0, 12.0, 19.0, 33.0, 30.0, 36.0, 30.0, 37.0, 30.0, 38.0, 38.0, 33.0, 32.0, 47.0, 29.0, 39.0, 33.0, 33.0, 43.0, 46.0, 36.0, 30.0, 32.0, 28.0, 23.0, 25.0, 11.0, 19.0, 15.0, 10.0, 10.0, 11.0, 9.0, 10.0, 8.0, 2.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.06787109375, -3.9326171875, -3.79736328125, -3.662109375, -3.52685546875, -3.3916015625, -3.25634765625, -3.12109375, -2.98583984375, -2.8505859375, -2.71533203125, -2.580078125, -2.44482421875, -2.3095703125, -2.17431640625, -2.0390625, -1.90380859375, -1.7685546875, -1.63330078125, -1.498046875, -1.36279296875, -1.2275390625, -1.09228515625, -0.95703125, -0.82177734375, -0.6865234375, -0.55126953125, -0.416015625, -0.28076171875, -0.1455078125, -0.01025390625, 0.125, 0.26025390625, 0.3955078125, 0.53076171875, 0.666015625, 0.80126953125, 0.9365234375, 1.07177734375, 1.20703125, 1.34228515625, 1.4775390625, 1.61279296875, 1.748046875, 1.88330078125, 2.0185546875, 2.15380859375, 2.2890625, 2.42431640625, 2.5595703125, 2.69482421875, 2.830078125, 2.96533203125, 3.1005859375, 3.23583984375, 3.37109375, 3.50634765625, 3.6416015625, 3.77685546875, 3.912109375, 4.04736328125, 4.1826171875, 4.31787109375, 4.453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 18.0, 17.0, 31.0, 54.0, 74.0, 131.0, 226.0, 384.0, 761.0, 1414.0, 2766.0, 5516.0, 11281.0, 23956.0, 48290.0, 96228.0, 168068.0, 225960.0, 201525.0, 127411.0, 68555.0, 33513.0, 16273.0, 7940.0, 3919.0, 1950.0, 1019.0, 511.0, 343.0, 162.0, 94.0, 64.0, 34.0, 18.0, 14.0, 13.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.03515625, -2.93310546875, -2.8310546875, -2.72900390625, -2.626953125, -2.52490234375, -2.4228515625, -2.32080078125, -2.21875, -2.11669921875, -2.0146484375, -1.91259765625, -1.810546875, -1.70849609375, -1.6064453125, -1.50439453125, -1.40234375, -1.30029296875, -1.1982421875, -1.09619140625, -0.994140625, -0.89208984375, -0.7900390625, -0.68798828125, -0.5859375, -0.48388671875, -0.3818359375, -0.27978515625, -0.177734375, -0.07568359375, 0.0263671875, 0.12841796875, 0.23046875, 0.33251953125, 0.4345703125, 0.53662109375, 0.638671875, 0.74072265625, 0.8427734375, 0.94482421875, 1.046875, 1.14892578125, 1.2509765625, 1.35302734375, 1.455078125, 1.55712890625, 1.6591796875, 1.76123046875, 1.86328125, 1.96533203125, 2.0673828125, 2.16943359375, 2.271484375, 2.37353515625, 2.4755859375, 2.57763671875, 2.6796875, 2.78173828125, 2.8837890625, 2.98583984375, 3.087890625, 3.18994140625, 3.2919921875, 3.39404296875, 3.49609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 1.0, 7.0, 5.0, 12.0, 7.0, 13.0, 19.0, 20.0, 12.0, 21.0, 26.0, 23.0, 36.0, 38.0, 29.0, 38.0, 34.0, 33.0, 32.0, 51.0, 41.0, 40.0, 37.0, 34.0, 50.0, 36.0, 41.0, 27.0, 30.0, 26.0, 26.0, 21.0, 27.0, 25.0, 11.0, 14.0, 9.0, 6.0, 8.0, 10.0, 4.0, 6.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.771484375, -2.683685302734375, -2.59588623046875, -2.508087158203125, -2.4202880859375, -2.332489013671875, -2.24468994140625, -2.156890869140625, -2.069091796875, -1.981292724609375, -1.89349365234375, -1.805694580078125, -1.7178955078125, -1.630096435546875, -1.54229736328125, -1.454498291015625, -1.36669921875, -1.278900146484375, -1.19110107421875, -1.103302001953125, -1.0155029296875, -0.927703857421875, -0.83990478515625, -0.752105712890625, -0.664306640625, -0.576507568359375, -0.48870849609375, -0.400909423828125, -0.3131103515625, -0.225311279296875, -0.13751220703125, -0.049713134765625, 0.0380859375, 0.125885009765625, 0.21368408203125, 0.301483154296875, 0.3892822265625, 0.477081298828125, 0.56488037109375, 0.652679443359375, 0.740478515625, 0.828277587890625, 0.91607666015625, 1.003875732421875, 1.0916748046875, 1.179473876953125, 1.26727294921875, 1.355072021484375, 1.44287109375, 1.530670166015625, 1.61846923828125, 1.706268310546875, 1.7940673828125, 1.881866455078125, 1.96966552734375, 2.057464599609375, 2.145263671875, 2.233062744140625, 2.32086181640625, 2.408660888671875, 2.4964599609375, 2.584259033203125, 2.67205810546875, 2.759857177734375, 2.84765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 4.0, 6.0, 9.0, 5.0, 14.0, 16.0, 25.0, 40.0, 54.0, 102.0, 159.0, 300.0, 442.0, 805.0, 1549.0, 2943.0, 6233.0, 12831.0, 27967.0, 58509.0, 115696.0, 193172.0, 233075.0, 184385.0, 107066.0, 53885.0, 25598.0, 12015.0, 5759.0, 2751.0, 1367.0, 688.0, 419.0, 243.0, 147.0, 85.0, 62.0, 35.0, 27.0, 23.0, 13.0, 6.0, 6.0, 9.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1552734375, -1.1173248291015625, -1.079376220703125, -1.0414276123046875, -1.00347900390625, -0.9655303955078125, -0.927581787109375, -0.8896331787109375, -0.8516845703125, -0.8137359619140625, -0.775787353515625, -0.7378387451171875, -0.69989013671875, -0.6619415283203125, -0.623992919921875, -0.5860443115234375, -0.548095703125, -0.5101470947265625, -0.472198486328125, -0.4342498779296875, -0.39630126953125, -0.3583526611328125, -0.320404052734375, -0.2824554443359375, -0.2445068359375, -0.2065582275390625, -0.168609619140625, -0.1306610107421875, -0.09271240234375, -0.0547637939453125, -0.016815185546875, 0.0211334228515625, 0.05908203125, 0.0970306396484375, 0.134979248046875, 0.1729278564453125, 0.21087646484375, 0.2488250732421875, 0.286773681640625, 0.3247222900390625, 0.3626708984375, 0.4006195068359375, 0.438568115234375, 0.4765167236328125, 0.51446533203125, 0.5524139404296875, 0.590362548828125, 0.6283111572265625, 0.666259765625, 0.7042083740234375, 0.742156982421875, 0.7801055908203125, 0.81805419921875, 0.8560028076171875, 0.893951416015625, 0.9319000244140625, 0.9698486328125, 1.0077972412109375, 1.045745849609375, 1.0836944580078125, 1.12164306640625, 1.1595916748046875, 1.197540283203125, 1.2354888916015625, 1.2734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 11.0, 9.0, 13.0, 15.0, 22.0, 20.0, 25.0, 42.0, 45.0, 48.0, 47.0, 49.0, 58.0, 60.0, 66.0, 54.0, 60.0, 56.0, 56.0, 33.0, 36.0, 36.0, 29.0, 23.0, 15.0, 17.0, 12.0, 21.0, 5.0, 5.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1021575927734375e-05, -4.901085048913956e-05, -4.700012505054474e-05, -4.498939961194992e-05, -4.29786741733551e-05, -4.0967948734760284e-05, -3.8957223296165466e-05, -3.694649785757065e-05, -3.493577241897583e-05, -3.292504698038101e-05, -3.0914321541786194e-05, -2.8903596103191376e-05, -2.6892870664596558e-05, -2.488214522600174e-05, -2.287141978740692e-05, -2.0860694348812103e-05, -1.8849968910217285e-05, -1.6839243471622467e-05, -1.4828518033027649e-05, -1.281779259443283e-05, -1.0807067155838013e-05, -8.796341717243195e-06, -6.7856162786483765e-06, -4.774890840053558e-06, -2.7641654014587402e-06, -7.534399628639221e-07, 1.257285475730896e-06, 3.268010914325714e-06, 5.278736352920532e-06, 7.28946179151535e-06, 9.300187230110168e-06, 1.1310912668704987e-05, 1.3321638107299805e-05, 1.5332363545894623e-05, 1.734308898448944e-05, 1.935381442308426e-05, 2.1364539861679077e-05, 2.3375265300273895e-05, 2.5385990738868713e-05, 2.739671617746353e-05, 2.940744161605835e-05, 3.141816705465317e-05, 3.3428892493247986e-05, 3.5439617931842804e-05, 3.745034337043762e-05, 3.946106880903244e-05, 4.147179424762726e-05, 4.3482519686222076e-05, 4.5493245124816895e-05, 4.750397056341171e-05, 4.951469600200653e-05, 5.152542144060135e-05, 5.353614687919617e-05, 5.5546872317790985e-05, 5.75575977563858e-05, 5.956832319498062e-05, 6.157904863357544e-05, 6.358977407217026e-05, 6.560049951076508e-05, 6.76112249493599e-05, 6.962195038795471e-05, 7.163267582654953e-05, 7.364340126514435e-05, 7.565412670373917e-05, 7.766485214233398e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 4.0, 13.0, 10.0, 17.0, 31.0, 46.0, 54.0, 99.0, 161.0, 220.0, 375.0, 635.0, 1033.0, 1825.0, 3102.0, 5589.0, 9705.0, 17042.0, 29738.0, 49812.0, 79131.0, 115072.0, 146168.0, 158068.0, 141201.0, 107628.0, 73486.0, 45088.0, 26927.0, 15512.0, 8834.0, 5047.0, 2857.0, 1614.0, 949.0, 566.0, 335.0, 200.0, 135.0, 64.0, 59.0, 38.0, 25.0, 13.0, 11.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.89599609375, -0.8633041381835938, -0.8306121826171875, -0.7979202270507812, -0.765228271484375, -0.7325363159179688, -0.6998443603515625, -0.6671524047851562, -0.63446044921875, -0.6017684936523438, -0.5690765380859375, -0.5363845825195312, -0.503692626953125, -0.47100067138671875, -0.4383087158203125, -0.40561676025390625, -0.3729248046875, -0.34023284912109375, -0.3075408935546875, -0.27484893798828125, -0.242156982421875, -0.20946502685546875, -0.1767730712890625, -0.14408111572265625, -0.11138916015625, -0.07869720458984375, -0.0460052490234375, -0.01331329345703125, 0.019378662109375, 0.05207061767578125, 0.0847625732421875, 0.11745452880859375, 0.150146484375, 0.18283843994140625, 0.2155303955078125, 0.24822235107421875, 0.280914306640625, 0.31360626220703125, 0.3462982177734375, 0.37899017333984375, 0.41168212890625, 0.44437408447265625, 0.4770660400390625, 0.5097579956054688, 0.542449951171875, 0.5751419067382812, 0.6078338623046875, 0.6405258178710938, 0.6732177734375, 0.7059097290039062, 0.7386016845703125, 0.7712936401367188, 0.803985595703125, 0.8366775512695312, 0.8693695068359375, 0.9020614624023438, 0.93475341796875, 0.9674453735351562, 1.0001373291015625, 1.0328292846679688, 1.065521240234375, 1.0982131958007812, 1.1309051513671875, 1.1635971069335938, 1.1962890625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 9.0, 11.0, 7.0, 10.0, 10.0, 16.0, 18.0, 29.0, 27.0, 28.0, 27.0, 34.0, 32.0, 37.0, 43.0, 55.0, 65.0, 38.0, 58.0, 53.0, 50.0, 38.0, 51.0, 41.0, 30.0, 29.0, 28.0, 22.0, 15.0, 12.0, 17.0, 8.0, 22.0, 7.0, 8.0, 7.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.393798828125, -0.3818855285644531, -0.36997222900390625, -0.3580589294433594, -0.3461456298828125, -0.3342323303222656, -0.32231903076171875, -0.3104057312011719, -0.298492431640625, -0.2865791320800781, -0.27466583251953125, -0.2627525329589844, -0.2508392333984375, -0.23892593383789062, -0.22701263427734375, -0.21509933471679688, -0.20318603515625, -0.19127273559570312, -0.17935943603515625, -0.16744613647460938, -0.1555328369140625, -0.14361953735351562, -0.13170623779296875, -0.11979293823242188, -0.107879638671875, -0.09596633911132812, -0.08405303955078125, -0.07213973999023438, -0.0602264404296875, -0.048313140869140625, -0.03639984130859375, -0.024486541748046875, -0.0125732421875, -0.000659942626953125, 0.01125335693359375, 0.023166656494140625, 0.0350799560546875, 0.046993255615234375, 0.05890655517578125, 0.07081985473632812, 0.082733154296875, 0.09464645385742188, 0.10655975341796875, 0.11847305297851562, 0.1303863525390625, 0.14229965209960938, 0.15421295166015625, 0.16612625122070312, 0.17803955078125, 0.18995285034179688, 0.20186614990234375, 0.21377944946289062, 0.2256927490234375, 0.23760604858398438, 0.24951934814453125, 0.2614326477050781, 0.273345947265625, 0.2852592468261719, 0.29717254638671875, 0.3090858459472656, 0.3209991455078125, 0.3329124450683594, 0.34482574462890625, 0.3567390441894531, 0.36865234375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 10.0, 5.0, 12.0, 11.0, 17.0, 8.0, 10.0, 25.0, 14.0, 21.0, 19.0, 29.0, 25.0, 41.0, 38.0, 42.0, 40.0, 41.0, 49.0, 44.0, 38.0, 48.0, 42.0, 44.0, 47.0, 40.0, 41.0, 29.0, 18.0, 25.0, 20.0, 16.0, 17.0, 9.0, 10.0, 15.0, 11.0, 4.0, 9.0, 4.0, 2.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.895940065383911, -3.751131772994995, -3.6063232421875, -3.461514949798584, -3.316706418991089, -3.171898126602173, -3.0270895957946777, -2.8822813034057617, -2.7374730110168457, -2.5926647186279297, -2.4478561878204346, -2.3030478954315186, -2.1582393646240234, -2.0134310722351074, -1.8686226606369019, -1.7238142490386963, -1.5790057182312012, -1.4341973066329956, -1.28938889503479, -1.144580602645874, -0.9997721314430237, -0.8549637198448181, -0.7101553678512573, -0.5653469562530518, -0.4205385446548462, -0.2757301330566406, -0.13092175126075745, 0.013886630535125732, 0.1586950421333313, 0.30350345373153687, 0.44831180572509766, 0.5931202173233032, 0.7379288673400879, 0.8827372789382935, 1.027545690536499, 1.172353982925415, 1.3171625137329102, 1.4619708061218262, 1.6067792177200317, 1.7515876293182373, 1.8963960409164429, 2.0412044525146484, 2.1860127449035645, 2.3308212757110596, 2.4756295680999756, 2.6204380989074707, 2.7652463912963867, 2.9100546836853027, 3.054863214492798, 3.199671506881714, 3.344480037689209, 3.489288330078125, 3.63409686088562, 3.778905153274536, 3.9237136840820312, 4.068521976470947, 4.213330268859863, 4.358138561248779, 4.502946853637695, 4.6477556228637695, 4.7925639152526855, 4.937372207641602, 5.082180500030518, 5.226988792419434, 5.371797561645508]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 2.0, 5.0, 1.0, 7.0, 5.0, 9.0, 8.0, 14.0, 11.0, 15.0, 25.0, 17.0, 21.0, 33.0, 36.0, 31.0, 42.0, 40.0, 31.0, 53.0, 34.0, 36.0, 46.0, 40.0, 36.0, 41.0, 47.0, 35.0, 42.0, 35.0, 36.0, 31.0, 23.0, 19.0, 22.0, 12.0, 18.0, 11.0, 9.0, 5.0, 10.0, 6.0, 4.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.533507823944092, -4.3940558433532715, -4.254604339599609, -4.115152359008789, -3.975700855255127, -3.8362491130828857, -3.6967973709106445, -3.557345390319824, -3.417893886566162, -3.278442144393921, -3.1389904022216797, -2.9995386600494385, -2.8600869178771973, -2.720635175704956, -2.581183433532715, -2.4417314529418945, -2.3022797107696533, -2.162827968597412, -2.023376226425171, -1.8839244842529297, -1.7444727420806885, -1.6050209999084473, -1.4655691385269165, -1.3261173963546753, -1.186665654182434, -1.0472139120101929, -0.9077621698379517, -0.7683103680610657, -0.6288586258888245, -0.48940688371658325, -0.34995508193969727, -0.21050333976745605, -0.07105159759521484, 0.06840015947818756, 0.20785191655158997, 0.34730368852615356, 0.4867554306983948, 0.626207172870636, 0.765658974647522, 0.9051107168197632, 1.0445624589920044, 1.1840142011642456, 1.3234659433364868, 1.4629178047180176, 1.6023695468902588, 1.7418212890625, 1.8812730312347412, 2.0207247734069824, 2.1601765155792236, 2.299628257751465, 2.439079999923706, 2.5785317420959473, 2.7179834842681885, 2.8574352264404297, 2.99688720703125, 3.136338710784912, 3.2757906913757324, 3.4152424335479736, 3.554694175720215, 3.694145917892456, 3.8335976600646973, 3.9730494022369385, 4.11250114440918, 4.251953125, 4.391404628753662]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 18.0, 18.0, 30.0, 70.0, 86.0, 153.0, 253.0, 411.0, 560.0, 937.0, 1455.0, 2367.0, 3422.0, 5367.0, 7982.0, 11313.0, 16455.0, 22983.0, 31330.0, 41837.0, 52585.0, 64681.0, 76167.0, 84630.0, 90040.0, 90033.0, 85753.0, 77770.0, 67549.0, 55255.0, 43913.0, 33126.0, 24868.0, 17525.0, 12421.0, 8542.0, 5765.0, 3780.0, 2541.0, 1642.0, 1069.0, 699.0, 421.0, 266.0, 199.0, 100.0, 72.0, 37.0, 21.0, 22.0, 6.0, 1.0, 5.0, 2.0, 0.0, 4.0], "bins": [-2.16796875, -2.10247802734375, -2.0369873046875, -1.97149658203125, -1.906005859375, -1.84051513671875, -1.7750244140625, -1.70953369140625, -1.64404296875, -1.57855224609375, -1.5130615234375, -1.44757080078125, -1.382080078125, -1.31658935546875, -1.2510986328125, -1.18560791015625, -1.1201171875, -1.05462646484375, -0.9891357421875, -0.92364501953125, -0.858154296875, -0.79266357421875, -0.7271728515625, -0.66168212890625, -0.59619140625, -0.53070068359375, -0.4652099609375, -0.39971923828125, -0.334228515625, -0.26873779296875, -0.2032470703125, -0.13775634765625, -0.072265625, -0.00677490234375, 0.0587158203125, 0.12420654296875, 0.189697265625, 0.25518798828125, 0.3206787109375, 0.38616943359375, 0.45166015625, 0.51715087890625, 0.5826416015625, 0.64813232421875, 0.713623046875, 0.77911376953125, 0.8446044921875, 0.91009521484375, 0.9755859375, 1.04107666015625, 1.1065673828125, 1.17205810546875, 1.237548828125, 1.30303955078125, 1.3685302734375, 1.43402099609375, 1.49951171875, 1.56500244140625, 1.6304931640625, 1.69598388671875, 1.761474609375, 1.82696533203125, 1.8924560546875, 1.95794677734375, 2.0234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 6.0, 12.0, 11.0, 8.0, 19.0, 14.0, 30.0, 20.0, 25.0, 30.0, 36.0, 36.0, 33.0, 39.0, 36.0, 41.0, 41.0, 50.0, 35.0, 37.0, 32.0, 45.0, 38.0, 27.0, 44.0, 41.0, 36.0, 34.0, 27.0, 19.0, 27.0, 10.0, 13.0, 11.0, 7.0, 9.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.73828125, -4.592041015625, -4.44580078125, -4.299560546875, -4.1533203125, -4.007080078125, -3.86083984375, -3.714599609375, -3.568359375, -3.422119140625, -3.27587890625, -3.129638671875, -2.9833984375, -2.837158203125, -2.69091796875, -2.544677734375, -2.3984375, -2.252197265625, -2.10595703125, -1.959716796875, -1.8134765625, -1.667236328125, -1.52099609375, -1.374755859375, -1.228515625, -1.082275390625, -0.93603515625, -0.789794921875, -0.6435546875, -0.497314453125, -0.35107421875, -0.204833984375, -0.05859375, 0.087646484375, 0.23388671875, 0.380126953125, 0.5263671875, 0.672607421875, 0.81884765625, 0.965087890625, 1.111328125, 1.257568359375, 1.40380859375, 1.550048828125, 1.6962890625, 1.842529296875, 1.98876953125, 2.135009765625, 2.28125, 2.427490234375, 2.57373046875, 2.719970703125, 2.8662109375, 3.012451171875, 3.15869140625, 3.304931640625, 3.451171875, 3.597412109375, 3.74365234375, 3.889892578125, 4.0361328125, 4.182373046875, 4.32861328125, 4.474853515625, 4.62109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 11.0, 5.0, 16.0, 19.0, 31.0, 56.0, 100.0, 158.0, 241.0, 333.0, 536.0, 865.0, 1323.0, 2054.0, 3122.0, 4683.0, 7362.0, 10856.0, 16085.0, 23912.0, 33128.0, 45514.0, 59989.0, 74766.0, 88292.0, 97716.0, 102049.0, 97911.0, 88794.0, 75661.0, 60570.0, 46152.0, 33682.0, 23913.0, 16239.0, 11068.0, 7459.0, 4924.0, 3160.0, 2101.0, 1305.0, 852.0, 554.0, 364.0, 225.0, 145.0, 85.0, 67.0, 47.0, 14.0, 12.0, 15.0, 2.0, 7.0, 4.0, 3.0, 3.0], "bins": [-2.564453125, -2.487945556640625, -2.41143798828125, -2.334930419921875, -2.2584228515625, -2.181915283203125, -2.10540771484375, -2.028900146484375, -1.952392578125, -1.875885009765625, -1.79937744140625, -1.722869873046875, -1.6463623046875, -1.569854736328125, -1.49334716796875, -1.416839599609375, -1.34033203125, -1.263824462890625, -1.18731689453125, -1.110809326171875, -1.0343017578125, -0.957794189453125, -0.88128662109375, -0.804779052734375, -0.728271484375, -0.651763916015625, -0.57525634765625, -0.498748779296875, -0.4222412109375, -0.345733642578125, -0.26922607421875, -0.192718505859375, -0.1162109375, -0.039703369140625, 0.03680419921875, 0.113311767578125, 0.1898193359375, 0.266326904296875, 0.34283447265625, 0.419342041015625, 0.495849609375, 0.572357177734375, 0.64886474609375, 0.725372314453125, 0.8018798828125, 0.878387451171875, 0.95489501953125, 1.031402587890625, 1.10791015625, 1.184417724609375, 1.26092529296875, 1.337432861328125, 1.4139404296875, 1.490447998046875, 1.56695556640625, 1.643463134765625, 1.719970703125, 1.796478271484375, 1.87298583984375, 1.949493408203125, 2.0260009765625, 2.102508544921875, 2.17901611328125, 2.255523681640625, 2.33203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 8.0, 8.0, 5.0, 13.0, 13.0, 17.0, 16.0, 27.0, 28.0, 33.0, 35.0, 36.0, 39.0, 43.0, 34.0, 40.0, 57.0, 35.0, 55.0, 39.0, 33.0, 40.0, 40.0, 40.0, 31.0, 42.0, 29.0, 36.0, 23.0, 17.0, 15.0, 21.0, 9.0, 13.0, 9.0, 5.0, 8.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.345703125, -3.24761962890625, -3.1495361328125, -3.05145263671875, -2.953369140625, -2.85528564453125, -2.7572021484375, -2.65911865234375, -2.56103515625, -2.46295166015625, -2.3648681640625, -2.26678466796875, -2.168701171875, -2.07061767578125, -1.9725341796875, -1.87445068359375, -1.7763671875, -1.67828369140625, -1.5802001953125, -1.48211669921875, -1.384033203125, -1.28594970703125, -1.1878662109375, -1.08978271484375, -0.99169921875, -0.89361572265625, -0.7955322265625, -0.69744873046875, -0.599365234375, -0.50128173828125, -0.4031982421875, -0.30511474609375, -0.20703125, -0.10894775390625, -0.0108642578125, 0.08721923828125, 0.185302734375, 0.28338623046875, 0.3814697265625, 0.47955322265625, 0.57763671875, 0.67572021484375, 0.7738037109375, 0.87188720703125, 0.969970703125, 1.06805419921875, 1.1661376953125, 1.26422119140625, 1.3623046875, 1.46038818359375, 1.5584716796875, 1.65655517578125, 1.754638671875, 1.85272216796875, 1.9508056640625, 2.04888916015625, 2.14697265625, 2.24505615234375, 2.3431396484375, 2.44122314453125, 2.539306640625, 2.63739013671875, 2.7354736328125, 2.83355712890625, 2.931640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 13.0, 15.0, 27.0, 42.0, 55.0, 96.0, 163.0, 282.0, 497.0, 924.0, 1678.0, 3189.0, 5757.0, 10472.0, 19223.0, 33004.0, 54080.0, 81284.0, 112192.0, 135533.0, 144497.0, 134368.0, 109161.0, 79016.0, 51301.0, 31358.0, 18123.0, 10144.0, 5469.0, 3010.0, 1607.0, 857.0, 479.0, 259.0, 153.0, 93.0, 49.0, 26.0, 21.0, 13.0, 8.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0888671875, -1.05059814453125, -1.0123291015625, -0.97406005859375, -0.935791015625, -0.89752197265625, -0.8592529296875, -0.82098388671875, -0.78271484375, -0.74444580078125, -0.7061767578125, -0.66790771484375, -0.629638671875, -0.59136962890625, -0.5531005859375, -0.51483154296875, -0.4765625, -0.43829345703125, -0.4000244140625, -0.36175537109375, -0.323486328125, -0.28521728515625, -0.2469482421875, -0.20867919921875, -0.17041015625, -0.13214111328125, -0.0938720703125, -0.05560302734375, -0.017333984375, 0.02093505859375, 0.0592041015625, 0.09747314453125, 0.1357421875, 0.17401123046875, 0.2122802734375, 0.25054931640625, 0.288818359375, 0.32708740234375, 0.3653564453125, 0.40362548828125, 0.44189453125, 0.48016357421875, 0.5184326171875, 0.55670166015625, 0.594970703125, 0.63323974609375, 0.6715087890625, 0.70977783203125, 0.748046875, 0.78631591796875, 0.8245849609375, 0.86285400390625, 0.901123046875, 0.93939208984375, 0.9776611328125, 1.01593017578125, 1.05419921875, 1.09246826171875, 1.1307373046875, 1.16900634765625, 1.207275390625, 1.24554443359375, 1.2838134765625, 1.32208251953125, 1.3603515625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 6.0, 9.0, 13.0, 12.0, 11.0, 12.0, 15.0, 18.0, 18.0, 33.0, 32.0, 39.0, 42.0, 25.0, 51.0, 24.0, 53.0, 43.0, 41.0, 50.0, 49.0, 44.0, 45.0, 41.0, 40.0, 28.0, 34.0, 27.0, 17.0, 21.0, 12.0, 12.0, 10.0, 17.0, 12.0, 7.0, 4.0, 1.0, 10.0, 4.0, 5.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.000110626220703125, -0.00010711420327425003, -0.00010360218584537506, -0.00010009016841650009, -9.657815098762512e-05, -9.306613355875015e-05, -8.955411612987518e-05, -8.604209870100021e-05, -8.253008127212524e-05, -7.901806384325027e-05, -7.55060464143753e-05, -7.199402898550034e-05, -6.848201155662537e-05, -6.49699941277504e-05, -6.145797669887543e-05, -5.794595927000046e-05, -5.443394184112549e-05, -5.092192441225052e-05, -4.740990698337555e-05, -4.389788955450058e-05, -4.038587212562561e-05, -3.687385469675064e-05, -3.336183726787567e-05, -2.9849819839000702e-05, -2.6337802410125732e-05, -2.2825784981250763e-05, -1.9313767552375793e-05, -1.5801750123500824e-05, -1.2289732694625854e-05, -8.777715265750885e-06, -5.2656978368759155e-06, -1.753680408000946e-06, 1.7583370208740234e-06, 5.270354449748993e-06, 8.782371878623962e-06, 1.2294389307498932e-05, 1.58064067363739e-05, 1.931842416524887e-05, 2.283044159412384e-05, 2.634245902299881e-05, 2.985447645187378e-05, 3.336649388074875e-05, 3.687851130962372e-05, 4.039052873849869e-05, 4.390254616737366e-05, 4.741456359624863e-05, 5.0926581025123596e-05, 5.4438598453998566e-05, 5.7950615882873535e-05, 6.14626333117485e-05, 6.497465074062347e-05, 6.848666816949844e-05, 7.199868559837341e-05, 7.551070302724838e-05, 7.902272045612335e-05, 8.253473788499832e-05, 8.604675531387329e-05, 8.955877274274826e-05, 9.307079017162323e-05, 9.65828076004982e-05, 0.00010009482502937317, 0.00010360684245824814, 0.00010711885988712311, 0.00011063087731599808, 0.00011414289474487305]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 14.0, 9.0, 13.0, 19.0, 26.0, 38.0, 57.0, 95.0, 152.0, 246.0, 427.0, 707.0, 1118.0, 1916.0, 3126.0, 5445.0, 9194.0, 15053.0, 24351.0, 38115.0, 56306.0, 78948.0, 102378.0, 119739.0, 127169.0, 120812.0, 103618.0, 80454.0, 57382.0, 38627.0, 24792.0, 15384.0, 9189.0, 5443.0, 3283.0, 1955.0, 1140.0, 711.0, 411.0, 274.0, 133.0, 94.0, 66.0, 40.0, 31.0, 25.0, 13.0, 5.0, 3.0, 6.0, 3.0, 3.0, 0.0, 5.0, 2.0], "bins": [-1.18359375, -1.148284912109375, -1.11297607421875, -1.077667236328125, -1.0423583984375, -1.007049560546875, -0.97174072265625, -0.936431884765625, -0.901123046875, -0.865814208984375, -0.83050537109375, -0.795196533203125, -0.7598876953125, -0.724578857421875, -0.68927001953125, -0.653961181640625, -0.61865234375, -0.583343505859375, -0.54803466796875, -0.512725830078125, -0.4774169921875, -0.442108154296875, -0.40679931640625, -0.371490478515625, -0.336181640625, -0.300872802734375, -0.26556396484375, -0.230255126953125, -0.1949462890625, -0.159637451171875, -0.12432861328125, -0.089019775390625, -0.0537109375, -0.018402099609375, 0.01690673828125, 0.052215576171875, 0.0875244140625, 0.122833251953125, 0.15814208984375, 0.193450927734375, 0.228759765625, 0.264068603515625, 0.29937744140625, 0.334686279296875, 0.3699951171875, 0.405303955078125, 0.44061279296875, 0.475921630859375, 0.51123046875, 0.546539306640625, 0.58184814453125, 0.617156982421875, 0.6524658203125, 0.687774658203125, 0.72308349609375, 0.758392333984375, 0.793701171875, 0.829010009765625, 0.86431884765625, 0.899627685546875, 0.9349365234375, 0.970245361328125, 1.00555419921875, 1.040863037109375, 1.076171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 3.0, 7.0, 4.0, 8.0, 10.0, 8.0, 8.0, 16.0, 12.0, 16.0, 21.0, 20.0, 22.0, 21.0, 34.0, 42.0, 31.0, 44.0, 47.0, 48.0, 42.0, 39.0, 39.0, 44.0, 46.0, 45.0, 44.0, 28.0, 31.0, 37.0, 30.0, 24.0, 20.0, 20.0, 14.0, 19.0, 15.0, 4.0, 9.0, 6.0, 10.0, 4.0, 3.0, 8.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.403564453125, -0.3913726806640625, -0.379180908203125, -0.3669891357421875, -0.35479736328125, -0.3426055908203125, -0.330413818359375, -0.3182220458984375, -0.3060302734375, -0.2938385009765625, -0.281646728515625, -0.2694549560546875, -0.25726318359375, -0.2450714111328125, -0.232879638671875, -0.2206878662109375, -0.20849609375, -0.1963043212890625, -0.184112548828125, -0.1719207763671875, -0.15972900390625, -0.1475372314453125, -0.135345458984375, -0.1231536865234375, -0.1109619140625, -0.0987701416015625, -0.086578369140625, -0.0743865966796875, -0.06219482421875, -0.0500030517578125, -0.037811279296875, -0.0256195068359375, -0.013427734375, -0.0012359619140625, 0.010955810546875, 0.0231475830078125, 0.03533935546875, 0.0475311279296875, 0.059722900390625, 0.0719146728515625, 0.0841064453125, 0.0962982177734375, 0.108489990234375, 0.1206817626953125, 0.13287353515625, 0.1450653076171875, 0.157257080078125, 0.1694488525390625, 0.181640625, 0.1938323974609375, 0.206024169921875, 0.2182159423828125, 0.23040771484375, 0.2425994873046875, 0.254791259765625, 0.2669830322265625, 0.2791748046875, 0.2913665771484375, 0.303558349609375, 0.3157501220703125, 0.32794189453125, 0.3401336669921875, 0.352325439453125, 0.3645172119140625, 0.376708984375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 11.0, 8.0, 9.0, 10.0, 11.0, 9.0, 16.0, 17.0, 17.0, 27.0, 27.0, 25.0, 29.0, 34.0, 41.0, 38.0, 36.0, 43.0, 51.0, 48.0, 47.0, 53.0, 44.0, 36.0, 39.0, 28.0, 37.0, 36.0, 31.0, 21.0, 15.0, 17.0, 14.0, 11.0, 13.0, 9.0, 5.0, 10.0, 8.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.901782989501953, -3.756187677383423, -3.6105923652648926, -3.4649970531463623, -3.319401741027832, -3.173806667327881, -3.0282113552093506, -2.8826160430908203, -2.73702073097229, -2.5914254188537598, -2.4458301067352295, -2.300234794616699, -2.154639720916748, -2.0090441703796387, -1.8634490966796875, -1.7178537845611572, -1.572258472442627, -1.4266631603240967, -1.2810678482055664, -1.1354726552963257, -0.9898773431777954, -0.8442820310592651, -0.6986867785453796, -0.5530915260314941, -0.40749621391296387, -0.261900931596756, -0.1163056492805481, 0.02928963303565979, 0.17488491535186768, 0.32048022747039795, 0.46607547998428345, 0.611670732498169, 0.7572660446166992, 0.9028613567352295, 1.0484566688537598, 1.1940518617630005, 1.3396471738815308, 1.485242486000061, 1.6308376789093018, 1.776432991027832, 1.9220283031463623, 2.0676236152648926, 2.213218927383423, 2.358814239501953, 2.5044093132019043, 2.6500048637390137, 2.795599937438965, 2.941195249557495, 3.0867905616760254, 3.2323858737945557, 3.377981185913086, 3.523576498031616, 3.6691718101501465, 3.8147668838500977, 3.960362195968628, 4.105957508087158, 4.251552581787109, 4.3971476554870605, 4.54274320602417, 4.688338279724121, 4.8339338302612305, 4.979528903961182, 5.125124454498291, 5.270719528198242, 5.416315078735352]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 1.0, 2.0, 11.0, 8.0, 10.0, 7.0, 20.0, 25.0, 22.0, 24.0, 39.0, 31.0, 28.0, 33.0, 33.0, 47.0, 41.0, 56.0, 43.0, 42.0, 48.0, 46.0, 44.0, 44.0, 45.0, 39.0, 37.0, 30.0, 26.0, 29.0, 15.0, 28.0, 9.0, 9.0, 8.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.41481876373291, -5.257462978363037, -5.100107192993164, -4.942751884460449, -4.785396099090576, -4.628040313720703, -4.47068452835083, -4.313328742980957, -4.155973434448242, -3.998617649078369, -3.841262102127075, -3.683906316757202, -3.526550769805908, -3.369194984436035, -3.211839199066162, -3.054483413696289, -2.897127628326416, -2.739771842956543, -2.582416296005249, -2.425060510635376, -2.267704963684082, -2.110349178314209, -1.952993392944336, -1.7956377267837524, -1.638282060623169, -1.4809263944625854, -1.323570728302002, -1.166214942932129, -1.0088592767715454, -0.8515036106109619, -0.6941478848457336, -0.5367921590805054, -0.3794364929199219, -0.222080796957016, -0.06472510099411011, 0.09263059496879578, 0.24998629093170166, 0.40734195709228516, 0.5646976828575134, 0.7220534086227417, 0.8794090747833252, 1.0367647409439087, 1.1941204071044922, 1.3514761924743652, 1.5088318586349487, 1.6661875247955322, 1.8235433101654053, 1.9808989763259888, 2.1382546424865723, 2.2956104278564453, 2.4529659748077393, 2.6103217601776123, 2.7676773071289062, 2.9250330924987793, 3.0823888778686523, 3.2397446632385254, 3.3971002101898193, 3.5544559955596924, 3.7118115425109863, 3.8691673278808594, 4.026523113250732, 4.1838788986206055, 4.34123420715332, 4.498589992523193, 4.655945777893066]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 8.0, 9.0, 14.0, 26.0, 30.0, 49.0, 84.0, 116.0, 195.0, 332.0, 509.0, 811.0, 1410.0, 2446.0, 3998.0, 6575.0, 11370.0, 19256.0, 32531.0, 55009.0, 92223.0, 149523.0, 236581.0, 352488.0, 476872.0, 566909.0, 580327.0, 510325.0, 389995.0, 268077.0, 173337.0, 106433.0, 63836.0, 37828.0, 22213.0, 13370.0, 7902.0, 4524.0, 2652.0, 1646.0, 929.0, 544.0, 360.0, 224.0, 162.0, 84.0, 55.0, 30.0, 30.0, 13.0, 8.0, 5.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.73046875, -3.60675048828125, -3.4830322265625, -3.35931396484375, -3.235595703125, -3.11187744140625, -2.9881591796875, -2.86444091796875, -2.74072265625, -2.61700439453125, -2.4932861328125, -2.36956787109375, -2.245849609375, -2.12213134765625, -1.9984130859375, -1.87469482421875, -1.7509765625, -1.62725830078125, -1.5035400390625, -1.37982177734375, -1.256103515625, -1.13238525390625, -1.0086669921875, -0.88494873046875, -0.76123046875, -0.63751220703125, -0.5137939453125, -0.39007568359375, -0.266357421875, -0.14263916015625, -0.0189208984375, 0.10479736328125, 0.228515625, 0.35223388671875, 0.4759521484375, 0.59967041015625, 0.723388671875, 0.84710693359375, 0.9708251953125, 1.09454345703125, 1.21826171875, 1.34197998046875, 1.4656982421875, 1.58941650390625, 1.713134765625, 1.83685302734375, 1.9605712890625, 2.08428955078125, 2.2080078125, 2.33172607421875, 2.4554443359375, 2.57916259765625, 2.702880859375, 2.82659912109375, 2.9503173828125, 3.07403564453125, 3.19775390625, 3.32147216796875, 3.4451904296875, 3.56890869140625, 3.692626953125, 3.81634521484375, 3.9400634765625, 4.06378173828125, 4.1875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 2.0, 3.0, 10.0, 8.0, 11.0, 12.0, 16.0, 23.0, 23.0, 24.0, 27.0, 32.0, 33.0, 36.0, 36.0, 55.0, 47.0, 49.0, 38.0, 33.0, 43.0, 56.0, 46.0, 41.0, 43.0, 34.0, 33.0, 38.0, 23.0, 20.0, 22.0, 25.0, 19.0, 11.0, 5.0, 2.0, 10.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.609375, -4.4752197265625, -4.341064453125, -4.2069091796875, -4.07275390625, -3.9385986328125, -3.804443359375, -3.6702880859375, -3.5361328125, -3.4019775390625, -3.267822265625, -3.1336669921875, -2.99951171875, -2.8653564453125, -2.731201171875, -2.5970458984375, -2.462890625, -2.3287353515625, -2.194580078125, -2.0604248046875, -1.92626953125, -1.7921142578125, -1.657958984375, -1.5238037109375, -1.3896484375, -1.2554931640625, -1.121337890625, -0.9871826171875, -0.85302734375, -0.7188720703125, -0.584716796875, -0.4505615234375, -0.31640625, -0.1822509765625, -0.048095703125, 0.0860595703125, 0.22021484375, 0.3543701171875, 0.488525390625, 0.6226806640625, 0.7568359375, 0.8909912109375, 1.025146484375, 1.1593017578125, 1.29345703125, 1.4276123046875, 1.561767578125, 1.6959228515625, 1.830078125, 1.9642333984375, 2.098388671875, 2.2325439453125, 2.36669921875, 2.5008544921875, 2.635009765625, 2.7691650390625, 2.9033203125, 3.0374755859375, 3.171630859375, 3.3057861328125, 3.43994140625, 3.5740966796875, 3.708251953125, 3.8424072265625, 3.9765625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 10.0, 13.0, 33.0, 65.0, 69.0, 119.0, 185.0, 295.0, 450.0, 712.0, 1141.0, 1876.0, 3163.0, 5051.0, 8072.0, 12717.0, 20973.0, 32983.0, 51868.0, 79746.0, 120088.0, 176367.0, 247933.0, 328022.0, 404936.0, 460627.0, 475071.0, 441095.0, 376119.0, 293914.0, 217120.0, 150094.0, 102004.0, 66609.0, 42865.0, 26967.0, 16977.0, 10500.0, 6684.0, 3943.0, 2570.0, 1647.0, 972.0, 636.0, 372.0, 227.0, 139.0, 89.0, 65.0, 37.0, 22.0, 14.0, 7.0, 5.0, 0.0, 4.0, 2.0, 3.0], "bins": [-3.796875, -3.679290771484375, -3.56170654296875, -3.444122314453125, -3.3265380859375, -3.208953857421875, -3.09136962890625, -2.973785400390625, -2.856201171875, -2.738616943359375, -2.62103271484375, -2.503448486328125, -2.3858642578125, -2.268280029296875, -2.15069580078125, -2.033111572265625, -1.91552734375, -1.797943115234375, -1.68035888671875, -1.562774658203125, -1.4451904296875, -1.327606201171875, -1.21002197265625, -1.092437744140625, -0.974853515625, -0.857269287109375, -0.73968505859375, -0.622100830078125, -0.5045166015625, -0.386932373046875, -0.26934814453125, -0.151763916015625, -0.0341796875, 0.083404541015625, 0.20098876953125, 0.318572998046875, 0.4361572265625, 0.553741455078125, 0.67132568359375, 0.788909912109375, 0.906494140625, 1.024078369140625, 1.14166259765625, 1.259246826171875, 1.3768310546875, 1.494415283203125, 1.61199951171875, 1.729583740234375, 1.84716796875, 1.964752197265625, 2.08233642578125, 2.199920654296875, 2.3175048828125, 2.435089111328125, 2.55267333984375, 2.670257568359375, 2.787841796875, 2.905426025390625, 3.02301025390625, 3.140594482421875, 3.2581787109375, 3.375762939453125, 3.49334716796875, 3.610931396484375, 3.728515625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 5.0, 4.0, 10.0, 6.0, 19.0, 23.0, 29.0, 25.0, 26.0, 49.0, 61.0, 58.0, 70.0, 86.0, 109.0, 120.0, 137.0, 158.0, 181.0, 187.0, 186.0, 207.0, 218.0, 206.0, 212.0, 199.0, 176.0, 160.0, 188.0, 154.0, 135.0, 111.0, 104.0, 78.0, 68.0, 60.0, 41.0, 44.0, 35.0, 31.0, 22.0, 17.0, 14.0, 8.0, 12.0, 7.0, 2.0, 6.0, 4.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.9248046875, -1.868804931640625, -1.81280517578125, -1.756805419921875, -1.7008056640625, -1.644805908203125, -1.58880615234375, -1.532806396484375, -1.476806640625, -1.420806884765625, -1.36480712890625, -1.308807373046875, -1.2528076171875, -1.196807861328125, -1.14080810546875, -1.084808349609375, -1.02880859375, -0.972808837890625, -0.91680908203125, -0.860809326171875, -0.8048095703125, -0.748809814453125, -0.69281005859375, -0.636810302734375, -0.580810546875, -0.524810791015625, -0.46881103515625, -0.412811279296875, -0.3568115234375, -0.300811767578125, -0.24481201171875, -0.188812255859375, -0.1328125, -0.076812744140625, -0.02081298828125, 0.035186767578125, 0.0911865234375, 0.147186279296875, 0.20318603515625, 0.259185791015625, 0.315185546875, 0.371185302734375, 0.42718505859375, 0.483184814453125, 0.5391845703125, 0.595184326171875, 0.65118408203125, 0.707183837890625, 0.76318359375, 0.819183349609375, 0.87518310546875, 0.931182861328125, 0.9871826171875, 1.043182373046875, 1.09918212890625, 1.155181884765625, 1.211181640625, 1.267181396484375, 1.32318115234375, 1.379180908203125, 1.4351806640625, 1.491180419921875, 1.54718017578125, 1.603179931640625, 1.6591796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 8.0, 8.0, 5.0, 6.0, 10.0, 10.0, 15.0, 22.0, 13.0, 28.0, 23.0, 21.0, 29.0, 18.0, 39.0, 36.0, 41.0, 37.0, 41.0, 45.0, 30.0, 46.0, 37.0, 43.0, 34.0, 45.0, 25.0, 44.0, 32.0, 22.0, 23.0, 33.0, 23.0, 16.0, 22.0, 15.0, 13.0, 7.0, 8.0, 5.0, 5.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.517232418060303, -4.373436450958252, -4.229640483856201, -4.08584451675415, -3.9420485496520996, -3.798252582550049, -3.654456615447998, -3.5106606483459473, -3.3668646812438965, -3.2230687141418457, -3.079272747039795, -2.935476779937744, -2.7916808128356934, -2.6478848457336426, -2.504088878631592, -2.360292911529541, -2.2164969444274902, -2.0727009773254395, -1.9289050102233887, -1.785109043121338, -1.641313076019287, -1.4975171089172363, -1.3537211418151855, -1.2099251747131348, -1.066129207611084, -0.9223332405090332, -0.7785372734069824, -0.6347413063049316, -0.49094533920288086, -0.3471493721008301, -0.2033534049987793, -0.059557437896728516, 0.08423805236816406, 0.22803401947021484, 0.3718299865722656, 0.5156259536743164, 0.6594219207763672, 0.803217887878418, 0.9470138549804688, 1.0908098220825195, 1.2346057891845703, 1.378401756286621, 1.5221977233886719, 1.6659936904907227, 1.8097896575927734, 1.9535856246948242, 2.097381591796875, 2.241177558898926, 2.3849735260009766, 2.5287694931030273, 2.672565460205078, 2.816361427307129, 2.9601573944091797, 3.1039533615112305, 3.2477493286132812, 3.391545295715332, 3.535341262817383, 3.6791372299194336, 3.8229331970214844, 3.966729164123535, 4.110525131225586, 4.254321098327637, 4.3981170654296875, 4.541913032531738, 4.685708999633789]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 3.0, 9.0, 11.0, 16.0, 15.0, 21.0, 19.0, 22.0, 26.0, 38.0, 38.0, 26.0, 39.0, 45.0, 30.0, 41.0, 33.0, 37.0, 45.0, 41.0, 53.0, 40.0, 37.0, 43.0, 42.0, 31.0, 26.0, 22.0, 27.0, 14.0, 12.0, 20.0, 14.0, 19.0, 11.0, 2.0, 6.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.090559959411621, -3.9513328075408936, -3.812105655670166, -3.6728785037994385, -3.533651351928711, -3.3944244384765625, -3.255197286605835, -3.1159701347351074, -2.97674298286438, -2.8375158309936523, -2.698288679122925, -2.5590615272521973, -2.419834613800049, -2.280607223510742, -2.1413803100585938, -2.002153158187866, -1.8629260063171387, -1.7236988544464111, -1.5844717025756836, -1.4452446699142456, -1.306017518043518, -1.1667903661727905, -1.0275633335113525, -0.888336181640625, -0.7491090297698975, -0.6098818778991699, -0.47065478563308716, -0.331427663564682, -0.19220054149627686, -0.052973389625549316, 0.08625370264053345, 0.2254807949066162, 0.36470842361450195, 0.5039355754852295, 0.6431626677513123, 0.782389760017395, 0.9216169118881226, 1.06084406375885, 1.200071096420288, 1.3392982482910156, 1.4785254001617432, 1.6177525520324707, 1.7569797039031982, 1.8962067365646362, 2.035433769226074, 2.174661159515381, 2.3138880729675293, 2.453115224838257, 2.5923423767089844, 2.731569528579712, 2.8707966804504395, 3.010023832321167, 3.1492509841918945, 3.288477897644043, 3.4277050495147705, 3.566932201385498, 3.7061593532562256, 3.845386505126953, 3.9846136569976807, 4.123840808868408, 4.263067722320557, 4.402295112609863, 4.541522026062012, 4.68074893951416, 4.819976329803467]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 7.0, 10.0, 11.0, 20.0, 28.0, 53.0, 50.0, 110.0, 162.0, 254.0, 395.0, 595.0, 925.0, 1441.0, 2206.0, 3629.0, 5537.0, 8472.0, 13021.0, 19837.0, 29254.0, 42684.0, 58854.0, 77628.0, 95532.0, 108910.0, 113591.0, 108386.0, 95293.0, 77259.0, 58353.0, 41674.0, 28676.0, 19758.0, 12755.0, 8175.0, 5442.0, 3540.0, 2171.0, 1402.0, 838.0, 558.0, 364.0, 249.0, 156.0, 93.0, 59.0, 52.0, 32.0, 24.0, 19.0, 7.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1650390625, -1.1241302490234375, -1.083221435546875, -1.0423126220703125, -1.00140380859375, -0.9604949951171875, -0.919586181640625, -0.8786773681640625, -0.8377685546875, -0.7968597412109375, -0.755950927734375, -0.7150421142578125, -0.67413330078125, -0.6332244873046875, -0.592315673828125, -0.5514068603515625, -0.510498046875, -0.4695892333984375, -0.428680419921875, -0.3877716064453125, -0.34686279296875, -0.3059539794921875, -0.265045166015625, -0.2241363525390625, -0.1832275390625, -0.1423187255859375, -0.101409912109375, -0.0605010986328125, -0.01959228515625, 0.0213165283203125, 0.062225341796875, 0.1031341552734375, 0.14404296875, 0.1849517822265625, 0.225860595703125, 0.2667694091796875, 0.30767822265625, 0.3485870361328125, 0.389495849609375, 0.4304046630859375, 0.4713134765625, 0.5122222900390625, 0.553131103515625, 0.5940399169921875, 0.63494873046875, 0.6758575439453125, 0.716766357421875, 0.7576751708984375, 0.798583984375, 0.8394927978515625, 0.880401611328125, 0.9213104248046875, 0.96221923828125, 1.0031280517578125, 1.044036865234375, 1.0849456787109375, 1.1258544921875, 1.1667633056640625, 1.207672119140625, 1.2485809326171875, 1.28948974609375, 1.3303985595703125, 1.371307373046875, 1.4122161865234375, 1.453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 1.0, 11.0, 12.0, 10.0, 13.0, 19.0, 16.0, 27.0, 30.0, 19.0, 26.0, 46.0, 38.0, 31.0, 38.0, 51.0, 37.0, 47.0, 44.0, 49.0, 37.0, 38.0, 33.0, 43.0, 39.0, 32.0, 32.0, 29.0, 18.0, 26.0, 25.0, 21.0, 10.0, 12.0, 7.0, 10.0, 6.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.26519775390625, -4.1163330078125, -3.96746826171875, -3.818603515625, -3.66973876953125, -3.5208740234375, -3.37200927734375, -3.22314453125, -3.07427978515625, -2.9254150390625, -2.77655029296875, -2.627685546875, -2.47882080078125, -2.3299560546875, -2.18109130859375, -2.0322265625, -1.88336181640625, -1.7344970703125, -1.58563232421875, -1.436767578125, -1.28790283203125, -1.1390380859375, -0.99017333984375, -0.84130859375, -0.69244384765625, -0.5435791015625, -0.39471435546875, -0.245849609375, -0.09698486328125, 0.0518798828125, 0.20074462890625, 0.349609375, 0.49847412109375, 0.6473388671875, 0.79620361328125, 0.945068359375, 1.09393310546875, 1.2427978515625, 1.39166259765625, 1.54052734375, 1.68939208984375, 1.8382568359375, 1.98712158203125, 2.135986328125, 2.28485107421875, 2.4337158203125, 2.58258056640625, 2.7314453125, 2.88031005859375, 3.0291748046875, 3.17803955078125, 3.326904296875, 3.47576904296875, 3.6246337890625, 3.77349853515625, 3.92236328125, 4.07122802734375, 4.2200927734375, 4.36895751953125, 4.517822265625, 4.66668701171875, 4.8155517578125, 4.96441650390625, 5.11328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 11.0, 7.0, 8.0, 19.0, 31.0, 35.0, 58.0, 90.0, 140.0, 217.0, 368.0, 637.0, 1033.0, 1635.0, 2798.0, 4767.0, 8001.0, 13786.0, 23202.0, 39196.0, 62344.0, 95008.0, 131943.0, 156560.0, 153076.0, 124345.0, 87784.0, 56333.0, 34536.0, 20615.0, 12211.0, 7188.0, 4143.0, 2588.0, 1482.0, 924.0, 557.0, 310.0, 206.0, 148.0, 75.0, 51.0, 37.0, 19.0, 11.0, 9.0, 9.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-2.291015625, -2.223419189453125, -2.15582275390625, -2.088226318359375, -2.0206298828125, -1.953033447265625, -1.88543701171875, -1.817840576171875, -1.750244140625, -1.682647705078125, -1.61505126953125, -1.547454833984375, -1.4798583984375, -1.412261962890625, -1.34466552734375, -1.277069091796875, -1.20947265625, -1.141876220703125, -1.07427978515625, -1.006683349609375, -0.9390869140625, -0.871490478515625, -0.80389404296875, -0.736297607421875, -0.668701171875, -0.601104736328125, -0.53350830078125, -0.465911865234375, -0.3983154296875, -0.330718994140625, -0.26312255859375, -0.195526123046875, -0.1279296875, -0.060333251953125, 0.00726318359375, 0.074859619140625, 0.1424560546875, 0.210052490234375, 0.27764892578125, 0.345245361328125, 0.412841796875, 0.480438232421875, 0.54803466796875, 0.615631103515625, 0.6832275390625, 0.750823974609375, 0.81842041015625, 0.886016845703125, 0.95361328125, 1.021209716796875, 1.08880615234375, 1.156402587890625, 1.2239990234375, 1.291595458984375, 1.35919189453125, 1.426788330078125, 1.494384765625, 1.561981201171875, 1.62957763671875, 1.697174072265625, 1.7647705078125, 1.832366943359375, 1.89996337890625, 1.967559814453125, 2.03515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 4.0, 8.0, 6.0, 12.0, 12.0, 12.0, 18.0, 11.0, 17.0, 24.0, 23.0, 28.0, 33.0, 30.0, 38.0, 32.0, 41.0, 38.0, 41.0, 32.0, 48.0, 40.0, 39.0, 36.0, 39.0, 39.0, 35.0, 32.0, 35.0, 24.0, 29.0, 18.0, 15.0, 25.0, 17.0, 16.0, 14.0, 6.0, 6.0, 8.0, 7.0, 6.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.51171875, -2.42315673828125, -2.3345947265625, -2.24603271484375, -2.157470703125, -2.06890869140625, -1.9803466796875, -1.89178466796875, -1.80322265625, -1.71466064453125, -1.6260986328125, -1.53753662109375, -1.448974609375, -1.36041259765625, -1.2718505859375, -1.18328857421875, -1.0947265625, -1.00616455078125, -0.9176025390625, -0.82904052734375, -0.740478515625, -0.65191650390625, -0.5633544921875, -0.47479248046875, -0.38623046875, -0.29766845703125, -0.2091064453125, -0.12054443359375, -0.031982421875, 0.05657958984375, 0.1451416015625, 0.23370361328125, 0.322265625, 0.41082763671875, 0.4993896484375, 0.58795166015625, 0.676513671875, 0.76507568359375, 0.8536376953125, 0.94219970703125, 1.03076171875, 1.11932373046875, 1.2078857421875, 1.29644775390625, 1.385009765625, 1.47357177734375, 1.5621337890625, 1.65069580078125, 1.7392578125, 1.82781982421875, 1.9163818359375, 2.00494384765625, 2.093505859375, 2.18206787109375, 2.2706298828125, 2.35919189453125, 2.44775390625, 2.53631591796875, 2.6248779296875, 2.71343994140625, 2.802001953125, 2.89056396484375, 2.9791259765625, 3.06768798828125, 3.15625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 5.0, 13.0, 14.0, 26.0, 36.0, 52.0, 85.0, 102.0, 177.0, 296.0, 434.0, 637.0, 989.0, 1444.0, 2237.0, 3346.0, 4969.0, 7785.0, 11736.0, 17718.0, 25914.0, 38488.0, 55079.0, 75259.0, 98560.0, 117896.0, 124522.0, 116924.0, 98361.0, 75394.0, 54371.0, 37997.0, 26292.0, 17350.0, 11610.0, 7704.0, 5057.0, 3230.0, 2168.0, 1523.0, 886.0, 645.0, 410.0, 275.0, 176.0, 132.0, 81.0, 48.0, 32.0, 23.0, 19.0, 11.0, 7.0, 3.0, 6.0, 1.0, 1.0, 2.0], "bins": [-0.62158203125, -0.602447509765625, -0.58331298828125, -0.564178466796875, -0.5450439453125, -0.525909423828125, -0.50677490234375, -0.487640380859375, -0.468505859375, -0.449371337890625, -0.43023681640625, -0.411102294921875, -0.3919677734375, -0.372833251953125, -0.35369873046875, -0.334564208984375, -0.3154296875, -0.296295166015625, -0.27716064453125, -0.258026123046875, -0.2388916015625, -0.219757080078125, -0.20062255859375, -0.181488037109375, -0.162353515625, -0.143218994140625, -0.12408447265625, -0.104949951171875, -0.0858154296875, -0.066680908203125, -0.04754638671875, -0.028411865234375, -0.00927734375, 0.009857177734375, 0.02899169921875, 0.048126220703125, 0.0672607421875, 0.086395263671875, 0.10552978515625, 0.124664306640625, 0.143798828125, 0.162933349609375, 0.18206787109375, 0.201202392578125, 0.2203369140625, 0.239471435546875, 0.25860595703125, 0.277740478515625, 0.296875, 0.316009521484375, 0.33514404296875, 0.354278564453125, 0.3734130859375, 0.392547607421875, 0.41168212890625, 0.430816650390625, 0.449951171875, 0.469085693359375, 0.48822021484375, 0.507354736328125, 0.5264892578125, 0.545623779296875, 0.56475830078125, 0.583892822265625, 0.60302734375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 3.0, 1.0, 9.0, 4.0, 11.0, 7.0, 12.0, 19.0, 20.0, 21.0, 27.0, 23.0, 29.0, 36.0, 39.0, 44.0, 45.0, 56.0, 47.0, 47.0, 44.0, 53.0, 52.0, 35.0, 43.0, 42.0, 46.0, 22.0, 32.0, 26.0, 14.0, 19.0, 18.0, 10.0, 10.0, 8.0, 3.0, 7.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-05, -4.622526466846466e-05, -4.476681351661682e-05, -4.330836236476898e-05, -4.184991121292114e-05, -4.03914600610733e-05, -3.8933008909225464e-05, -3.7474557757377625e-05, -3.6016106605529785e-05, -3.4557655453681946e-05, -3.3099204301834106e-05, -3.164075314998627e-05, -3.0182301998138428e-05, -2.872385084629059e-05, -2.726539969444275e-05, -2.580694854259491e-05, -2.434849739074707e-05, -2.289004623889923e-05, -2.143159508705139e-05, -1.9973143935203552e-05, -1.8514692783355713e-05, -1.7056241631507874e-05, -1.5597790479660034e-05, -1.4139339327812195e-05, -1.2680888175964355e-05, -1.1222437024116516e-05, -9.763985872268677e-06, -8.305534720420837e-06, -6.847083568572998e-06, -5.388632416725159e-06, -3.930181264877319e-06, -2.47173011302948e-06, -1.0132789611816406e-06, 4.4517219066619873e-07, 1.903623342514038e-06, 3.3620744943618774e-06, 4.820525646209717e-06, 6.278976798057556e-06, 7.737427949905396e-06, 9.195879101753235e-06, 1.0654330253601074e-05, 1.2112781405448914e-05, 1.3571232557296753e-05, 1.5029683709144592e-05, 1.648813486099243e-05, 1.794658601284027e-05, 1.940503716468811e-05, 2.086348831653595e-05, 2.232193946838379e-05, 2.378039062023163e-05, 2.5238841772079468e-05, 2.6697292923927307e-05, 2.8155744075775146e-05, 2.9614195227622986e-05, 3.1072646379470825e-05, 3.2531097531318665e-05, 3.3989548683166504e-05, 3.544799983501434e-05, 3.690645098686218e-05, 3.836490213871002e-05, 3.982335329055786e-05, 4.12818044424057e-05, 4.274025559425354e-05, 4.419870674610138e-05, 4.565715789794922e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 10.0, 14.0, 29.0, 28.0, 50.0, 75.0, 108.0, 166.0, 243.0, 358.0, 538.0, 806.0, 1288.0, 1883.0, 2780.0, 4306.0, 6387.0, 9452.0, 14497.0, 20675.0, 29831.0, 41972.0, 56830.0, 73791.0, 91570.0, 104722.0, 109984.0, 105716.0, 93462.0, 76274.0, 58771.0, 43968.0, 31167.0, 21662.0, 14979.0, 9912.0, 6814.0, 4495.0, 2999.0, 1988.0, 1355.0, 927.0, 592.0, 342.0, 233.0, 164.0, 122.0, 74.0, 63.0, 24.0, 23.0, 15.0, 10.0, 6.0, 2.0, 3.0], "bins": [-0.744140625, -0.7226104736328125, -0.701080322265625, -0.6795501708984375, -0.65802001953125, -0.6364898681640625, -0.614959716796875, -0.5934295654296875, -0.5718994140625, -0.5503692626953125, -0.528839111328125, -0.5073089599609375, -0.48577880859375, -0.4642486572265625, -0.442718505859375, -0.4211883544921875, -0.399658203125, -0.3781280517578125, -0.356597900390625, -0.3350677490234375, -0.31353759765625, -0.2920074462890625, -0.270477294921875, -0.2489471435546875, -0.2274169921875, -0.2058868408203125, -0.184356689453125, -0.1628265380859375, -0.14129638671875, -0.1197662353515625, -0.098236083984375, -0.0767059326171875, -0.05517578125, -0.0336456298828125, -0.012115478515625, 0.0094146728515625, 0.03094482421875, 0.0524749755859375, 0.074005126953125, 0.0955352783203125, 0.1170654296875, 0.1385955810546875, 0.160125732421875, 0.1816558837890625, 0.20318603515625, 0.2247161865234375, 0.246246337890625, 0.2677764892578125, 0.289306640625, 0.3108367919921875, 0.332366943359375, 0.3538970947265625, 0.37542724609375, 0.3969573974609375, 0.418487548828125, 0.4400177001953125, 0.4615478515625, 0.4830780029296875, 0.504608154296875, 0.5261383056640625, 0.54766845703125, 0.5691986083984375, 0.590728759765625, 0.6122589111328125, 0.6337890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 3.0, 9.0, 5.0, 7.0, 10.0, 9.0, 14.0, 12.0, 25.0, 20.0, 26.0, 30.0, 38.0, 26.0, 36.0, 30.0, 45.0, 46.0, 43.0, 40.0, 44.0, 47.0, 47.0, 45.0, 36.0, 34.0, 44.0, 28.0, 42.0, 21.0, 16.0, 15.0, 17.0, 11.0, 14.0, 9.0, 9.0, 5.0, 6.0, 7.0, 8.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2607421875, -0.25238800048828125, -0.2440338134765625, -0.23567962646484375, -0.227325439453125, -0.21897125244140625, -0.2106170654296875, -0.20226287841796875, -0.19390869140625, -0.18555450439453125, -0.1772003173828125, -0.16884613037109375, -0.160491943359375, -0.15213775634765625, -0.1437835693359375, -0.13542938232421875, -0.1270751953125, -0.11872100830078125, -0.1103668212890625, -0.10201263427734375, -0.093658447265625, -0.08530426025390625, -0.0769500732421875, -0.06859588623046875, -0.06024169921875, -0.05188751220703125, -0.0435333251953125, -0.03517913818359375, -0.026824951171875, -0.01847076416015625, -0.0101165771484375, -0.00176239013671875, 0.006591796875, 0.01494598388671875, 0.0233001708984375, 0.03165435791015625, 0.040008544921875, 0.04836273193359375, 0.0567169189453125, 0.06507110595703125, 0.07342529296875, 0.08177947998046875, 0.0901336669921875, 0.09848785400390625, 0.106842041015625, 0.11519622802734375, 0.1235504150390625, 0.13190460205078125, 0.1402587890625, 0.14861297607421875, 0.1569671630859375, 0.16532135009765625, 0.173675537109375, 0.18202972412109375, 0.1903839111328125, 0.19873809814453125, 0.20709228515625, 0.21544647216796875, 0.2238006591796875, 0.23215484619140625, 0.240509033203125, 0.24886322021484375, 0.2572174072265625, 0.26557159423828125, 0.27392578125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 6.0, 10.0, 2.0, 5.0, 9.0, 12.0, 12.0, 23.0, 15.0, 28.0, 22.0, 20.0, 28.0, 33.0, 35.0, 36.0, 29.0, 42.0, 46.0, 40.0, 34.0, 36.0, 41.0, 46.0, 42.0, 38.0, 26.0, 37.0, 32.0, 30.0, 31.0, 21.0, 26.0, 16.0, 21.0, 14.0, 11.0, 12.0, 5.0, 4.0, 7.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-4.51206636428833, -4.367865562438965, -4.223665237426758, -4.079464435577393, -3.9352638721466064, -3.7910633087158203, -3.646862745285034, -3.502662181854248, -3.358461380004883, -3.2142608165740967, -3.0700602531433105, -2.9258594512939453, -2.781658887863159, -2.637458324432373, -2.493257761001587, -2.349057197570801, -2.2048566341400146, -2.0606560707092285, -1.9164553880691528, -1.7722548246383667, -1.628054141998291, -1.4838535785675049, -1.3396530151367188, -1.195452332496643, -1.051251769065857, -0.907051146030426, -0.7628505229949951, -0.618649959564209, -0.4744493365287781, -0.33024871349334717, -0.18604815006256104, -0.04184746742248535, 0.10235309600830078, 0.2465537041425705, 0.3907543122768402, 0.5349549055099487, 0.6791555285453796, 0.8233561515808105, 0.9675567150115967, 1.1117573976516724, 1.2559579610824585, 1.4001585245132446, 1.5443592071533203, 1.6885597705841064, 1.8327603340148926, 1.9769610166549683, 2.121161460876465, 2.26536226272583, 2.409562826156616, 2.5537633895874023, 2.6979639530181885, 2.8421645164489746, 2.98636531829834, 3.130565881729126, 3.274766445159912, 3.4189672470092773, 3.5631675720214844, 3.7073681354522705, 3.8515686988830566, 3.995769500732422, 4.139969825744629, 4.284170627593994, 4.428371429443359, 4.572571754455566, 4.716772556304932]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 8.0, 5.0, 10.0, 14.0, 12.0, 18.0, 24.0, 17.0, 21.0, 31.0, 41.0, 28.0, 29.0, 46.0, 42.0, 38.0, 39.0, 26.0, 47.0, 39.0, 46.0, 48.0, 46.0, 30.0, 43.0, 36.0, 35.0, 21.0, 29.0, 20.0, 15.0, 14.0, 19.0, 13.0, 18.0, 7.0, 6.0, 3.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.038114547729492, -3.8989460468292236, -3.759777545928955, -3.6206090450286865, -3.481440544128418, -3.3422718048095703, -3.2031033039093018, -3.063934803009033, -2.9247663021087646, -2.785597801208496, -2.6464293003082275, -2.507260799407959, -2.3680920600891113, -2.228923797607422, -2.089755058288574, -1.9505865573883057, -1.811418056488037, -1.6722495555877686, -1.5330810546875, -1.393912434577942, -1.2547439336776733, -1.1155754327774048, -0.9764068722724915, -0.8372383117675781, -0.6980698108673096, -0.558901309967041, -0.4197327494621277, -0.28056421875953674, -0.1413956880569458, -0.002227187156677246, 0.13694137334823608, 0.2761099338531494, 0.41527795791625977, 0.5544464588165283, 0.6936150193214417, 0.832783579826355, 0.9719520807266235, 1.111120581626892, 1.2502892017364502, 1.3894577026367188, 1.5286262035369873, 1.6677947044372559, 1.8069632053375244, 1.9461318254470825, 2.0853004455566406, 2.22446870803833, 2.3636374473571777, 2.5028059482574463, 2.641974449157715, 2.7811429500579834, 2.920311450958252, 3.0594799518585205, 3.198648452758789, 3.3378171920776367, 3.4769856929779053, 3.616154193878174, 3.7553226947784424, 3.894491195678711, 4.033659934997559, 4.172828197479248, 4.311996936798096, 4.451165199279785, 4.590333938598633, 4.7295026779174805, 4.86867094039917]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 12.0, 9.0, 15.0, 26.0, 49.0, 72.0, 105.0, 198.0, 286.0, 454.0, 716.0, 1000.0, 1524.0, 2373.0, 3617.0, 5282.0, 7689.0, 11058.0, 15758.0, 22105.0, 29868.0, 39687.0, 50307.0, 61510.0, 72344.0, 81790.0, 87386.0, 89079.0, 85466.0, 78930.0, 68618.0, 57847.0, 46280.0, 35894.0, 26870.0, 19800.0, 14193.0, 9926.0, 6811.0, 4644.0, 3035.0, 2097.0, 1334.0, 883.0, 568.0, 378.0, 247.0, 148.0, 101.0, 62.0, 42.0, 28.0, 17.0, 13.0, 6.0, 2.0, 3.0, 1.0], "bins": [-2.1484375, -2.0839691162109375, -2.019500732421875, -1.9550323486328125, -1.89056396484375, -1.8260955810546875, -1.761627197265625, -1.6971588134765625, -1.6326904296875, -1.5682220458984375, -1.503753662109375, -1.4392852783203125, -1.37481689453125, -1.3103485107421875, -1.245880126953125, -1.1814117431640625, -1.116943359375, -1.0524749755859375, -0.988006591796875, -0.9235382080078125, -0.85906982421875, -0.7946014404296875, -0.730133056640625, -0.6656646728515625, -0.6011962890625, -0.5367279052734375, -0.472259521484375, -0.4077911376953125, -0.34332275390625, -0.2788543701171875, -0.214385986328125, -0.1499176025390625, -0.08544921875, -0.0209808349609375, 0.043487548828125, 0.1079559326171875, 0.17242431640625, 0.2368927001953125, 0.301361083984375, 0.3658294677734375, 0.4302978515625, 0.4947662353515625, 0.559234619140625, 0.6237030029296875, 0.68817138671875, 0.7526397705078125, 0.817108154296875, 0.8815765380859375, 0.946044921875, 1.0105133056640625, 1.074981689453125, 1.1394500732421875, 1.20391845703125, 1.2683868408203125, 1.332855224609375, 1.3973236083984375, 1.4617919921875, 1.5262603759765625, 1.590728759765625, 1.6551971435546875, 1.71966552734375, 1.7841339111328125, 1.848602294921875, 1.9130706787109375, 1.9775390625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 8.0, 6.0, 11.0, 9.0, 18.0, 10.0, 11.0, 30.0, 22.0, 29.0, 32.0, 24.0, 37.0, 39.0, 36.0, 45.0, 41.0, 37.0, 39.0, 38.0, 42.0, 47.0, 48.0, 34.0, 28.0, 31.0, 33.0, 28.0, 25.0, 18.0, 27.0, 24.0, 16.0, 15.0, 10.0, 12.0, 10.0, 6.0, 1.0, 7.0, 4.0, 2.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.86224365234375, -3.7205810546875, -3.57891845703125, -3.437255859375, -3.29559326171875, -3.1539306640625, -3.01226806640625, -2.87060546875, -2.72894287109375, -2.5872802734375, -2.44561767578125, -2.303955078125, -2.16229248046875, -2.0206298828125, -1.87896728515625, -1.7373046875, -1.59564208984375, -1.4539794921875, -1.31231689453125, -1.170654296875, -1.02899169921875, -0.8873291015625, -0.74566650390625, -0.60400390625, -0.46234130859375, -0.3206787109375, -0.17901611328125, -0.037353515625, 0.10430908203125, 0.2459716796875, 0.38763427734375, 0.529296875, 0.67095947265625, 0.8126220703125, 0.95428466796875, 1.095947265625, 1.23760986328125, 1.3792724609375, 1.52093505859375, 1.66259765625, 1.80426025390625, 1.9459228515625, 2.08758544921875, 2.229248046875, 2.37091064453125, 2.5125732421875, 2.65423583984375, 2.7958984375, 2.93756103515625, 3.0792236328125, 3.22088623046875, 3.362548828125, 3.50421142578125, 3.6458740234375, 3.78753662109375, 3.92919921875, 4.07086181640625, 4.2125244140625, 4.35418701171875, 4.495849609375, 4.63751220703125, 4.7791748046875, 4.92083740234375, 5.0625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 10.0, 7.0, 8.0, 20.0, 29.0, 56.0, 80.0, 142.0, 216.0, 336.0, 578.0, 867.0, 1562.0, 2442.0, 3847.0, 6247.0, 9939.0, 15083.0, 23236.0, 34472.0, 48604.0, 66092.0, 83709.0, 100740.0, 109883.0, 111016.0, 103535.0, 89821.0, 70981.0, 53482.0, 38127.0, 26109.0, 17576.0, 11098.0, 6955.0, 4374.0, 2770.0, 1739.0, 1034.0, 658.0, 411.0, 267.0, 184.0, 74.0, 43.0, 30.0, 31.0, 19.0, 11.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-2.939453125, -2.853363037109375, -2.76727294921875, -2.681182861328125, -2.5950927734375, -2.509002685546875, -2.42291259765625, -2.336822509765625, -2.250732421875, -2.164642333984375, -2.07855224609375, -1.992462158203125, -1.9063720703125, -1.820281982421875, -1.73419189453125, -1.648101806640625, -1.56201171875, -1.475921630859375, -1.38983154296875, -1.303741455078125, -1.2176513671875, -1.131561279296875, -1.04547119140625, -0.959381103515625, -0.873291015625, -0.787200927734375, -0.70111083984375, -0.615020751953125, -0.5289306640625, -0.442840576171875, -0.35675048828125, -0.270660400390625, -0.1845703125, -0.098480224609375, -0.01239013671875, 0.073699951171875, 0.1597900390625, 0.245880126953125, 0.33197021484375, 0.418060302734375, 0.504150390625, 0.590240478515625, 0.67633056640625, 0.762420654296875, 0.8485107421875, 0.934600830078125, 1.02069091796875, 1.106781005859375, 1.19287109375, 1.278961181640625, 1.36505126953125, 1.451141357421875, 1.5372314453125, 1.623321533203125, 1.70941162109375, 1.795501708984375, 1.881591796875, 1.967681884765625, 2.05377197265625, 2.139862060546875, 2.2259521484375, 2.312042236328125, 2.39813232421875, 2.484222412109375, 2.5703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 9.0, 8.0, 15.0, 12.0, 11.0, 22.0, 25.0, 21.0, 24.0, 25.0, 27.0, 25.0, 39.0, 40.0, 22.0, 31.0, 36.0, 35.0, 49.0, 34.0, 40.0, 43.0, 37.0, 39.0, 41.0, 25.0, 29.0, 25.0, 28.0, 18.0, 21.0, 21.0, 19.0, 15.0, 15.0, 8.0, 12.0, 7.0, 6.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-2.8046875, -2.718109130859375, -2.63153076171875, -2.544952392578125, -2.4583740234375, -2.371795654296875, -2.28521728515625, -2.198638916015625, -2.112060546875, -2.025482177734375, -1.93890380859375, -1.852325439453125, -1.7657470703125, -1.679168701171875, -1.59259033203125, -1.506011962890625, -1.41943359375, -1.332855224609375, -1.24627685546875, -1.159698486328125, -1.0731201171875, -0.986541748046875, -0.89996337890625, -0.813385009765625, -0.726806640625, -0.640228271484375, -0.55364990234375, -0.467071533203125, -0.3804931640625, -0.293914794921875, -0.20733642578125, -0.120758056640625, -0.0341796875, 0.052398681640625, 0.13897705078125, 0.225555419921875, 0.3121337890625, 0.398712158203125, 0.48529052734375, 0.571868896484375, 0.658447265625, 0.745025634765625, 0.83160400390625, 0.918182373046875, 1.0047607421875, 1.091339111328125, 1.17791748046875, 1.264495849609375, 1.35107421875, 1.437652587890625, 1.52423095703125, 1.610809326171875, 1.6973876953125, 1.783966064453125, 1.87054443359375, 1.957122802734375, 2.043701171875, 2.130279541015625, 2.21685791015625, 2.303436279296875, 2.3900146484375, 2.476593017578125, 2.56317138671875, 2.649749755859375, 2.736328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 13.0, 14.0, 22.0, 47.0, 58.0, 112.0, 179.0, 246.0, 429.0, 739.0, 1124.0, 1776.0, 2815.0, 4438.0, 7053.0, 10804.0, 16070.0, 23503.0, 33679.0, 46482.0, 61059.0, 76513.0, 90354.0, 99827.0, 102820.0, 99263.0, 88925.0, 74805.0, 60133.0, 45174.0, 32962.0, 23012.0, 15711.0, 10185.0, 6653.0, 4296.0, 2681.0, 1763.0, 1074.0, 624.0, 415.0, 292.0, 147.0, 106.0, 64.0, 43.0, 18.0, 17.0, 9.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.82421875, -0.7971572875976562, -0.7700958251953125, -0.7430343627929688, -0.715972900390625, -0.6889114379882812, -0.6618499755859375, -0.6347885131835938, -0.60772705078125, -0.5806655883789062, -0.5536041259765625, -0.5265426635742188, -0.499481201171875, -0.47241973876953125, -0.4453582763671875, -0.41829681396484375, -0.3912353515625, -0.36417388916015625, -0.3371124267578125, -0.31005096435546875, -0.282989501953125, -0.25592803955078125, -0.2288665771484375, -0.20180511474609375, -0.17474365234375, -0.14768218994140625, -0.1206207275390625, -0.09355926513671875, -0.066497802734375, -0.03943634033203125, -0.0123748779296875, 0.01468658447265625, 0.041748046875, 0.06880950927734375, 0.0958709716796875, 0.12293243408203125, 0.149993896484375, 0.17705535888671875, 0.2041168212890625, 0.23117828369140625, 0.25823974609375, 0.28530120849609375, 0.3123626708984375, 0.33942413330078125, 0.366485595703125, 0.39354705810546875, 0.4206085205078125, 0.44766998291015625, 0.4747314453125, 0.5017929077148438, 0.5288543701171875, 0.5559158325195312, 0.582977294921875, 0.6100387573242188, 0.6371002197265625, 0.6641616821289062, 0.69122314453125, 0.7182846069335938, 0.7453460693359375, 0.7724075317382812, 0.799468994140625, 0.8265304565429688, 0.8535919189453125, 0.8806533813476562, 0.90771484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 8.0, 6.0, 11.0, 16.0, 8.0, 18.0, 19.0, 21.0, 24.0, 30.0, 30.0, 46.0, 45.0, 60.0, 51.0, 46.0, 65.0, 51.0, 50.0, 45.0, 39.0, 47.0, 39.0, 34.0, 33.0, 29.0, 27.0, 20.0, 7.0, 16.0, 14.0, 9.0, 8.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00013053417205810547, -0.0001265648752450943, -0.00012259557843208313, -0.00011862628161907196, -0.00011465698480606079, -0.00011068768799304962, -0.00010671839118003845, -0.00010274909436702728, -9.877979755401611e-05, -9.481050074100494e-05, -9.084120392799377e-05, -8.68719071149826e-05, -8.290261030197144e-05, -7.893331348896027e-05, -7.49640166759491e-05, -7.099471986293793e-05, -6.702542304992676e-05, -6.305612623691559e-05, -5.908682942390442e-05, -5.511753261089325e-05, -5.114823579788208e-05, -4.717893898487091e-05, -4.320964217185974e-05, -3.924034535884857e-05, -3.52710485458374e-05, -3.130175173282623e-05, -2.7332454919815063e-05, -2.3363158106803894e-05, -1.9393861293792725e-05, -1.5424564480781555e-05, -1.1455267667770386e-05, -7.485970854759216e-06, -3.516674041748047e-06, 4.5262277126312256e-07, 4.421919584274292e-06, 8.391216397285461e-06, 1.2360513210296631e-05, 1.63298100233078e-05, 2.029910683631897e-05, 2.426840364933014e-05, 2.823770046234131e-05, 3.220699727535248e-05, 3.617629408836365e-05, 4.014559090137482e-05, 4.4114887714385986e-05, 4.8084184527397156e-05, 5.2053481340408325e-05, 5.6022778153419495e-05, 5.9992074966430664e-05, 6.396137177944183e-05, 6.7930668592453e-05, 7.189996540546417e-05, 7.586926221847534e-05, 7.983855903148651e-05, 8.380785584449768e-05, 8.777715265750885e-05, 9.174644947052002e-05, 9.571574628353119e-05, 9.968504309654236e-05, 0.00010365433990955353, 0.0001076236367225647, 0.00011159293353557587, 0.00011556223034858704, 0.0001195315271615982, 0.00012350082397460938]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 13.0, 13.0, 17.0, 27.0, 47.0, 68.0, 97.0, 165.0, 266.0, 362.0, 587.0, 845.0, 1392.0, 2189.0, 3377.0, 5400.0, 8510.0, 12751.0, 19222.0, 28258.0, 40183.0, 54541.0, 69777.0, 85747.0, 97775.0, 104514.0, 103669.0, 95866.0, 82020.0, 66665.0, 51166.0, 36988.0, 25915.0, 17384.0, 11527.0, 7549.0, 4835.0, 3154.0, 2117.0, 1295.0, 822.0, 531.0, 326.0, 199.0, 134.0, 78.0, 61.0, 41.0, 22.0, 23.0, 18.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.951171875, -0.9213409423828125, -0.891510009765625, -0.8616790771484375, -0.83184814453125, -0.8020172119140625, -0.772186279296875, -0.7423553466796875, -0.7125244140625, -0.6826934814453125, -0.652862548828125, -0.6230316162109375, -0.59320068359375, -0.5633697509765625, -0.533538818359375, -0.5037078857421875, -0.473876953125, -0.4440460205078125, -0.414215087890625, -0.3843841552734375, -0.35455322265625, -0.3247222900390625, -0.294891357421875, -0.2650604248046875, -0.2352294921875, -0.2053985595703125, -0.175567626953125, -0.1457366943359375, -0.11590576171875, -0.0860748291015625, -0.056243896484375, -0.0264129638671875, 0.00341796875, 0.0332489013671875, 0.063079833984375, 0.0929107666015625, 0.12274169921875, 0.1525726318359375, 0.182403564453125, 0.2122344970703125, 0.2420654296875, 0.2718963623046875, 0.301727294921875, 0.3315582275390625, 0.36138916015625, 0.3912200927734375, 0.421051025390625, 0.4508819580078125, 0.480712890625, 0.5105438232421875, 0.540374755859375, 0.5702056884765625, 0.60003662109375, 0.6298675537109375, 0.659698486328125, 0.6895294189453125, 0.7193603515625, 0.7491912841796875, 0.779022216796875, 0.8088531494140625, 0.83868408203125, 0.8685150146484375, 0.898345947265625, 0.9281768798828125, 0.9580078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 2.0, 12.0, 8.0, 6.0, 11.0, 11.0, 15.0, 29.0, 21.0, 33.0, 23.0, 29.0, 37.0, 34.0, 49.0, 35.0, 28.0, 39.0, 46.0, 48.0, 38.0, 39.0, 35.0, 44.0, 37.0, 45.0, 31.0, 37.0, 31.0, 25.0, 17.0, 30.0, 13.0, 16.0, 12.0, 5.0, 10.0, 7.0, 2.0, 5.0, 5.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.474853515625, -0.4618339538574219, -0.44881439208984375, -0.4357948303222656, -0.4227752685546875, -0.4097557067871094, -0.39673614501953125, -0.3837165832519531, -0.370697021484375, -0.3576774597167969, -0.34465789794921875, -0.3316383361816406, -0.3186187744140625, -0.3055992126464844, -0.29257965087890625, -0.2795600891113281, -0.26654052734375, -0.2535209655761719, -0.24050140380859375, -0.22748184204101562, -0.2144622802734375, -0.20144271850585938, -0.18842315673828125, -0.17540359497070312, -0.162384033203125, -0.14936447143554688, -0.13634490966796875, -0.12332534790039062, -0.1103057861328125, -0.09728622436523438, -0.08426666259765625, -0.07124710083007812, -0.0582275390625, -0.045207977294921875, -0.03218841552734375, -0.019168853759765625, -0.0061492919921875, 0.006870269775390625, 0.01988983154296875, 0.032909393310546875, 0.045928955078125, 0.058948516845703125, 0.07196807861328125, 0.08498764038085938, 0.0980072021484375, 0.11102676391601562, 0.12404632568359375, 0.13706588745117188, 0.15008544921875, 0.16310501098632812, 0.17612457275390625, 0.18914413452148438, 0.2021636962890625, 0.21518325805664062, 0.22820281982421875, 0.24122238159179688, 0.254241943359375, 0.2672615051269531, 0.28028106689453125, 0.2933006286621094, 0.3063201904296875, 0.3193397521972656, 0.33235931396484375, 0.3453788757324219, 0.3583984375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 8.0, 6.0, 8.0, 7.0, 11.0, 16.0, 15.0, 24.0, 24.0, 27.0, 28.0, 29.0, 34.0, 23.0, 37.0, 41.0, 48.0, 36.0, 43.0, 32.0, 42.0, 41.0, 35.0, 51.0, 34.0, 25.0, 27.0, 28.0, 38.0, 22.0, 26.0, 20.0, 20.0, 14.0, 19.0, 15.0, 4.0, 9.0, 5.0, 7.0, 3.0, 3.0, 2.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.2646613121032715, -4.12288761138916, -3.981113910675049, -3.8393402099609375, -3.697566509246826, -3.555792808532715, -3.4140191078186035, -3.272245407104492, -3.130471706390381, -2.9886980056762695, -2.846924304962158, -2.705150604248047, -2.5633769035339355, -2.421603202819824, -2.279829502105713, -2.1380558013916016, -1.9962821006774902, -1.854508399963379, -1.7127346992492676, -1.5709609985351562, -1.429187297821045, -1.2874135971069336, -1.1456398963928223, -1.003866195678711, -0.8620924949645996, -0.7203187942504883, -0.578545093536377, -0.4367713928222656, -0.2949976921081543, -0.15322399139404297, -0.01145029067993164, 0.1303234100341797, 0.2720966339111328, 0.41387033462524414, 0.5556440353393555, 0.6974177360534668, 0.8391914367675781, 0.9809651374816895, 1.1227388381958008, 1.264512538909912, 1.4062862396240234, 1.5480599403381348, 1.689833641052246, 1.8316073417663574, 1.9733810424804688, 2.11515474319458, 2.2569284439086914, 2.3987021446228027, 2.540475845336914, 2.6822495460510254, 2.8240232467651367, 2.965796947479248, 3.1075706481933594, 3.2493443489074707, 3.391118049621582, 3.5328917503356934, 3.6746654510498047, 3.816439151763916, 3.9582128524780273, 4.099986553192139, 4.24176025390625, 4.383533954620361, 4.525307655334473, 4.667081356048584, 4.808855056762695]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 5.0, 5.0, 6.0, 14.0, 7.0, 13.0, 13.0, 17.0, 17.0, 22.0, 16.0, 29.0, 26.0, 32.0, 31.0, 29.0, 38.0, 33.0, 47.0, 40.0, 42.0, 36.0, 47.0, 36.0, 52.0, 35.0, 36.0, 33.0, 21.0, 20.0, 15.0, 30.0, 19.0, 21.0, 23.0, 10.0, 16.0, 12.0, 12.0, 8.0, 6.0, 7.0, 9.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.049232006072998, -3.9119884967803955, -3.774744987487793, -3.6375017166137695, -3.500258207321167, -3.3630146980285645, -3.225771427154541, -3.0885279178619385, -2.951284408569336, -2.8140408992767334, -2.676797389984131, -2.5395541191101074, -2.402310609817505, -2.2650671005249023, -2.127823829650879, -1.9905803203582764, -1.8533368110656738, -1.7160933017730713, -1.5788499116897583, -1.4416065216064453, -1.3043630123138428, -1.1671195030212402, -1.0298761129379272, -0.8926326632499695, -0.7553892135620117, -0.618145763874054, -0.4809023141860962, -0.3436588644981384, -0.20641541481018066, -0.0691719651222229, 0.06807148456573486, 0.20531493425369263, 0.3425579071044922, 0.47980135679244995, 0.6170448064804077, 0.7542882561683655, 0.8915317058563232, 1.0287752151489258, 1.1660186052322388, 1.3032619953155518, 1.4405055046081543, 1.5777490139007568, 1.7149924039840698, 1.8522357940673828, 1.9894793033599854, 2.126722812652588, 2.2639660835266113, 2.401209592819214, 2.5384531021118164, 2.675696611404419, 2.8129401206970215, 2.950183391571045, 3.0874269008636475, 3.22467041015625, 3.3619136810302734, 3.499157190322876, 3.6364006996154785, 3.773644208908081, 3.9108877182006836, 4.048130989074707, 4.1853742599487305, 4.322618007659912, 4.4598612785339355, 4.597105026245117, 4.734348297119141]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 13.0, 18.0, 20.0, 52.0, 78.0, 150.0, 251.0, 430.0, 730.0, 1308.0, 2242.0, 4056.0, 6875.0, 11846.0, 21494.0, 37755.0, 65274.0, 111450.0, 185615.0, 291583.0, 425852.0, 553519.0, 616842.0, 576084.0, 457080.0, 320938.0, 205819.0, 124126.0, 73244.0, 42265.0, 24200.0, 13886.0, 8053.0, 4561.0, 2707.0, 1541.0, 901.0, 558.0, 341.0, 197.0, 134.0, 76.0, 55.0, 25.0, 12.0, 13.0, 5.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12890625, -3.984619140625, -3.84033203125, -3.696044921875, -3.5517578125, -3.407470703125, -3.26318359375, -3.118896484375, -2.974609375, -2.830322265625, -2.68603515625, -2.541748046875, -2.3974609375, -2.253173828125, -2.10888671875, -1.964599609375, -1.8203125, -1.676025390625, -1.53173828125, -1.387451171875, -1.2431640625, -1.098876953125, -0.95458984375, -0.810302734375, -0.666015625, -0.521728515625, -0.37744140625, -0.233154296875, -0.0888671875, 0.055419921875, 0.19970703125, 0.343994140625, 0.48828125, 0.632568359375, 0.77685546875, 0.921142578125, 1.0654296875, 1.209716796875, 1.35400390625, 1.498291015625, 1.642578125, 1.786865234375, 1.93115234375, 2.075439453125, 2.2197265625, 2.364013671875, 2.50830078125, 2.652587890625, 2.796875, 2.941162109375, 3.08544921875, 3.229736328125, 3.3740234375, 3.518310546875, 3.66259765625, 3.806884765625, 3.951171875, 4.095458984375, 4.23974609375, 4.384033203125, 4.5283203125, 4.672607421875, 4.81689453125, 4.961181640625, 5.10546875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 12.0, 7.0, 4.0, 11.0, 9.0, 13.0, 16.0, 14.0, 26.0, 16.0, 23.0, 20.0, 19.0, 25.0, 35.0, 37.0, 43.0, 18.0, 45.0, 37.0, 42.0, 48.0, 35.0, 38.0, 42.0, 39.0, 27.0, 36.0, 26.0, 25.0, 25.0, 18.0, 16.0, 19.0, 12.0, 22.0, 15.0, 11.0, 9.0, 6.0, 14.0, 8.0, 3.0, 2.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0], "bins": [-3.53125, -3.415679931640625, -3.30010986328125, -3.184539794921875, -3.0689697265625, -2.953399658203125, -2.83782958984375, -2.722259521484375, -2.606689453125, -2.491119384765625, -2.37554931640625, -2.259979248046875, -2.1444091796875, -2.028839111328125, -1.91326904296875, -1.797698974609375, -1.68212890625, -1.566558837890625, -1.45098876953125, -1.335418701171875, -1.2198486328125, -1.104278564453125, -0.98870849609375, -0.873138427734375, -0.757568359375, -0.641998291015625, -0.52642822265625, -0.410858154296875, -0.2952880859375, -0.179718017578125, -0.06414794921875, 0.051422119140625, 0.1669921875, 0.282562255859375, 0.39813232421875, 0.513702392578125, 0.6292724609375, 0.744842529296875, 0.86041259765625, 0.975982666015625, 1.091552734375, 1.207122802734375, 1.32269287109375, 1.438262939453125, 1.5538330078125, 1.669403076171875, 1.78497314453125, 1.900543212890625, 2.01611328125, 2.131683349609375, 2.24725341796875, 2.362823486328125, 2.4783935546875, 2.593963623046875, 2.70953369140625, 2.825103759765625, 2.940673828125, 3.056243896484375, 3.17181396484375, 3.287384033203125, 3.4029541015625, 3.518524169921875, 3.63409423828125, 3.749664306640625, 3.865234375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 3.0, 3.0, 8.0, 17.0, 23.0, 25.0, 65.0, 84.0, 119.0, 222.0, 341.0, 582.0, 886.0, 1492.0, 2335.0, 3784.0, 6200.0, 10161.0, 15923.0, 25854.0, 40538.0, 63014.0, 96395.0, 142604.0, 203818.0, 277835.0, 355985.0, 425309.0, 464206.0, 461403.0, 415177.0, 342718.0, 263612.0, 192845.0, 132971.0, 89301.0, 58055.0, 37906.0, 23851.0, 14777.0, 9071.0, 5676.0, 3510.0, 2160.0, 1284.0, 826.0, 484.0, 315.0, 196.0, 131.0, 73.0, 50.0, 26.0, 23.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0], "bins": [-4.1953125, -4.0638427734375, -3.932373046875, -3.8009033203125, -3.66943359375, -3.5379638671875, -3.406494140625, -3.2750244140625, -3.1435546875, -3.0120849609375, -2.880615234375, -2.7491455078125, -2.61767578125, -2.4862060546875, -2.354736328125, -2.2232666015625, -2.091796875, -1.9603271484375, -1.828857421875, -1.6973876953125, -1.56591796875, -1.4344482421875, -1.302978515625, -1.1715087890625, -1.0400390625, -0.9085693359375, -0.777099609375, -0.6456298828125, -0.51416015625, -0.3826904296875, -0.251220703125, -0.1197509765625, 0.01171875, 0.1431884765625, 0.274658203125, 0.4061279296875, 0.53759765625, 0.6690673828125, 0.800537109375, 0.9320068359375, 1.0634765625, 1.1949462890625, 1.326416015625, 1.4578857421875, 1.58935546875, 1.7208251953125, 1.852294921875, 1.9837646484375, 2.115234375, 2.2467041015625, 2.378173828125, 2.5096435546875, 2.64111328125, 2.7725830078125, 2.904052734375, 3.0355224609375, 3.1669921875, 3.2984619140625, 3.429931640625, 3.5614013671875, 3.69287109375, 3.8243408203125, 3.955810546875, 4.0872802734375, 4.21875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 4.0, 7.0, 16.0, 20.0, 17.0, 35.0, 39.0, 51.0, 46.0, 55.0, 66.0, 84.0, 96.0, 112.0, 121.0, 130.0, 169.0, 203.0, 179.0, 190.0, 198.0, 192.0, 185.0, 190.0, 215.0, 190.0, 163.0, 176.0, 156.0, 126.0, 113.0, 94.0, 72.0, 72.0, 63.0, 55.0, 45.0, 30.0, 21.0, 19.0, 19.0, 8.0, 11.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-2.15234375, -2.0902862548828125, -2.028228759765625, -1.9661712646484375, -1.90411376953125, -1.8420562744140625, -1.779998779296875, -1.7179412841796875, -1.6558837890625, -1.5938262939453125, -1.531768798828125, -1.4697113037109375, -1.40765380859375, -1.3455963134765625, -1.283538818359375, -1.2214813232421875, -1.159423828125, -1.0973663330078125, -1.035308837890625, -0.9732513427734375, -0.91119384765625, -0.8491363525390625, -0.787078857421875, -0.7250213623046875, -0.6629638671875, -0.6009063720703125, -0.538848876953125, -0.4767913818359375, -0.41473388671875, -0.3526763916015625, -0.290618896484375, -0.2285614013671875, -0.16650390625, -0.1044464111328125, -0.042388916015625, 0.0196685791015625, 0.08172607421875, 0.1437835693359375, 0.205841064453125, 0.2678985595703125, 0.3299560546875, 0.3920135498046875, 0.454071044921875, 0.5161285400390625, 0.57818603515625, 0.6402435302734375, 0.702301025390625, 0.7643585205078125, 0.826416015625, 0.8884735107421875, 0.950531005859375, 1.0125885009765625, 1.07464599609375, 1.1367034912109375, 1.198760986328125, 1.2608184814453125, 1.3228759765625, 1.3849334716796875, 1.446990966796875, 1.5090484619140625, 1.57110595703125, 1.6331634521484375, 1.695220947265625, 1.7572784423828125, 1.8193359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 5.0, 4.0, 7.0, 4.0, 7.0, 18.0, 16.0, 18.0, 28.0, 33.0, 23.0, 33.0, 37.0, 31.0, 44.0, 52.0, 50.0, 48.0, 41.0, 41.0, 40.0, 39.0, 32.0, 45.0, 36.0, 39.0, 43.0, 29.0, 30.0, 24.0, 13.0, 18.0, 15.0, 9.0, 13.0, 11.0, 2.0, 10.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.619921684265137, -4.439360618591309, -4.2587995529174805, -4.078238487243652, -3.8976776599884033, -3.717116594314575, -3.536555767059326, -3.355994701385498, -3.17543363571167, -2.994872570037842, -2.8143115043640137, -2.6337506771087646, -2.4531896114349365, -2.2726285457611084, -2.0920677185058594, -1.9115066528320312, -1.7309455871582031, -1.550384521484375, -1.3698235750198364, -1.1892626285552979, -1.0087015628814697, -0.8281405568122864, -0.647579550743103, -0.46701860427856445, -0.28645753860473633, -0.10589653253555298, 0.07466447353363037, 0.2552254796028137, 0.43578648567199707, 0.6163474917411804, 0.7969084978103638, 0.9774694442749023, 1.1580305099487305, 1.3385915756225586, 1.5191525220870972, 1.6997134685516357, 1.8802745342254639, 2.060835599899292, 2.241396427154541, 2.421957492828369, 2.6025185585021973, 2.7830796241760254, 2.9636406898498535, 3.1442015171051025, 3.3247625827789307, 3.505323648452759, 3.685884475708008, 3.866445541381836, 4.047006607055664, 4.227567672729492, 4.40812873840332, 4.588689804077148, 4.769250869750977, 4.9498114585876465, 5.130372524261475, 5.310933589935303, 5.491494655609131, 5.672055721282959, 5.852616786956787, 6.033177852630615, 6.213738441467285, 6.394299507141113, 6.574860572814941, 6.7554216384887695, 6.935982704162598]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 9.0, 10.0, 15.0, 15.0, 26.0, 27.0, 20.0, 32.0, 32.0, 39.0, 36.0, 34.0, 44.0, 50.0, 52.0, 55.0, 50.0, 54.0, 37.0, 43.0, 46.0, 31.0, 28.0, 29.0, 29.0, 28.0, 23.0, 18.0, 14.0, 15.0, 10.0, 11.0, 9.0, 6.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.437704563140869, -5.2626214027404785, -5.08753776550293, -4.912454605102539, -4.73737096786499, -4.5622878074646, -4.387204170227051, -4.21212100982666, -4.0370378494262695, -3.8619544506073, -3.68687105178833, -3.5117878913879395, -3.3367042541503906, -3.16162109375, -2.9865376949310303, -2.8114542961120605, -2.6363706588745117, -2.461287260055542, -2.2862038612365723, -2.1111207008361816, -1.9360371828079224, -1.7609537839889526, -1.5858705043792725, -1.4107871055603027, -1.235703706741333, -1.0606203079223633, -0.8855369687080383, -0.7104536294937134, -0.5353702306747437, -0.3602868318557739, -0.18520355224609375, -0.010120153427124023, 0.1649637222290039, 0.34004709124565125, 0.5151304602622986, 0.6902137994766235, 0.8652971982955933, 1.040380597114563, 1.2154638767242432, 1.390547275543213, 1.5656306743621826, 1.7407140731811523, 1.915797472000122, 2.090880870819092, 2.2659640312194824, 2.4410476684570312, 2.616130828857422, 2.7912142276763916, 2.9662976264953613, 3.141381025314331, 3.316464424133301, 3.4915475845336914, 3.6666312217712402, 3.841714382171631, 4.01679801940918, 4.19188117980957, 4.366964340209961, 4.542047500610352, 4.7171311378479, 4.892214298248291, 5.06729793548584, 5.2423810958862305, 5.417464256286621, 5.59254789352417, 5.767631530761719]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 9.0, 2.0, 6.0, 12.0, 14.0, 27.0, 38.0, 51.0, 91.0, 150.0, 226.0, 367.0, 571.0, 933.0, 1532.0, 2617.0, 3999.0, 6704.0, 11026.0, 17248.0, 26922.0, 41101.0, 60026.0, 82258.0, 104938.0, 122373.0, 127316.0, 117259.0, 97401.0, 74115.0, 52686.0, 35283.0, 23044.0, 14648.0, 9213.0, 5588.0, 3287.0, 2041.0, 1348.0, 769.0, 490.0, 303.0, 190.0, 108.0, 79.0, 56.0, 43.0, 16.0, 22.0, 5.0, 3.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.595703125, -1.5447540283203125, -1.493804931640625, -1.4428558349609375, -1.39190673828125, -1.3409576416015625, -1.290008544921875, -1.2390594482421875, -1.1881103515625, -1.1371612548828125, -1.086212158203125, -1.0352630615234375, -0.98431396484375, -0.9333648681640625, -0.882415771484375, -0.8314666748046875, -0.780517578125, -0.7295684814453125, -0.678619384765625, -0.6276702880859375, -0.57672119140625, -0.5257720947265625, -0.474822998046875, -0.4238739013671875, -0.3729248046875, -0.3219757080078125, -0.271026611328125, -0.2200775146484375, -0.16912841796875, -0.1181793212890625, -0.067230224609375, -0.0162811279296875, 0.03466796875, 0.0856170654296875, 0.136566162109375, 0.1875152587890625, 0.23846435546875, 0.2894134521484375, 0.340362548828125, 0.3913116455078125, 0.4422607421875, 0.4932098388671875, 0.544158935546875, 0.5951080322265625, 0.64605712890625, 0.6970062255859375, 0.747955322265625, 0.7989044189453125, 0.849853515625, 0.9008026123046875, 0.951751708984375, 1.0027008056640625, 1.05364990234375, 1.1045989990234375, 1.155548095703125, 1.2064971923828125, 1.2574462890625, 1.3083953857421875, 1.359344482421875, 1.4102935791015625, 1.46124267578125, 1.5121917724609375, 1.563140869140625, 1.6140899658203125, 1.6650390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 7.0, 19.0, 8.0, 20.0, 22.0, 22.0, 19.0, 35.0, 33.0, 37.0, 39.0, 38.0, 42.0, 55.0, 44.0, 62.0, 63.0, 38.0, 49.0, 40.0, 42.0, 32.0, 35.0, 28.0, 20.0, 29.0, 20.0, 22.0, 13.0, 15.0, 6.0, 6.0, 7.0, 2.0, 8.0, 5.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5234375, -5.3372802734375, -5.151123046875, -4.9649658203125, -4.77880859375, -4.5926513671875, -4.406494140625, -4.2203369140625, -4.0341796875, -3.8480224609375, -3.661865234375, -3.4757080078125, -3.28955078125, -3.1033935546875, -2.917236328125, -2.7310791015625, -2.544921875, -2.3587646484375, -2.172607421875, -1.9864501953125, -1.80029296875, -1.6141357421875, -1.427978515625, -1.2418212890625, -1.0556640625, -0.8695068359375, -0.683349609375, -0.4971923828125, -0.31103515625, -0.1248779296875, 0.061279296875, 0.2474365234375, 0.43359375, 0.6197509765625, 0.805908203125, 0.9920654296875, 1.17822265625, 1.3643798828125, 1.550537109375, 1.7366943359375, 1.9228515625, 2.1090087890625, 2.295166015625, 2.4813232421875, 2.66748046875, 2.8536376953125, 3.039794921875, 3.2259521484375, 3.412109375, 3.5982666015625, 3.784423828125, 3.9705810546875, 4.15673828125, 4.3428955078125, 4.529052734375, 4.7152099609375, 4.9013671875, 5.0875244140625, 5.273681640625, 5.4598388671875, 5.64599609375, 5.8321533203125, 6.018310546875, 6.2044677734375, 6.390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 13.0, 29.0, 31.0, 30.0, 54.0, 91.0, 117.0, 230.0, 376.0, 588.0, 974.0, 1603.0, 2661.0, 4709.0, 8206.0, 14706.0, 25836.0, 45045.0, 74226.0, 115580.0, 157426.0, 173257.0, 150687.0, 107806.0, 68752.0, 40876.0, 23386.0, 13280.0, 7566.0, 4333.0, 2378.0, 1431.0, 838.0, 499.0, 329.0, 217.0, 144.0, 83.0, 49.0, 37.0, 23.0, 19.0, 10.0, 8.0, 4.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.546875, -2.463134765625, -2.37939453125, -2.295654296875, -2.2119140625, -2.128173828125, -2.04443359375, -1.960693359375, -1.876953125, -1.793212890625, -1.70947265625, -1.625732421875, -1.5419921875, -1.458251953125, -1.37451171875, -1.290771484375, -1.20703125, -1.123291015625, -1.03955078125, -0.955810546875, -0.8720703125, -0.788330078125, -0.70458984375, -0.620849609375, -0.537109375, -0.453369140625, -0.36962890625, -0.285888671875, -0.2021484375, -0.118408203125, -0.03466796875, 0.049072265625, 0.1328125, 0.216552734375, 0.30029296875, 0.384033203125, 0.4677734375, 0.551513671875, 0.63525390625, 0.718994140625, 0.802734375, 0.886474609375, 0.97021484375, 1.053955078125, 1.1376953125, 1.221435546875, 1.30517578125, 1.388916015625, 1.47265625, 1.556396484375, 1.64013671875, 1.723876953125, 1.8076171875, 1.891357421875, 1.97509765625, 2.058837890625, 2.142578125, 2.226318359375, 2.31005859375, 2.393798828125, 2.4775390625, 2.561279296875, 2.64501953125, 2.728759765625, 2.8125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 8.0, 5.0, 12.0, 7.0, 21.0, 15.0, 18.0, 12.0, 22.0, 31.0, 23.0, 24.0, 24.0, 31.0, 37.0, 45.0, 50.0, 33.0, 44.0, 43.0, 59.0, 44.0, 44.0, 35.0, 41.0, 39.0, 30.0, 32.0, 28.0, 19.0, 21.0, 20.0, 13.0, 13.0, 13.0, 11.0, 8.0, 6.0, 4.0, 5.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.52734375, -3.42144775390625, -3.3155517578125, -3.20965576171875, -3.103759765625, -2.99786376953125, -2.8919677734375, -2.78607177734375, -2.68017578125, -2.57427978515625, -2.4683837890625, -2.36248779296875, -2.256591796875, -2.15069580078125, -2.0447998046875, -1.93890380859375, -1.8330078125, -1.72711181640625, -1.6212158203125, -1.51531982421875, -1.409423828125, -1.30352783203125, -1.1976318359375, -1.09173583984375, -0.98583984375, -0.87994384765625, -0.7740478515625, -0.66815185546875, -0.562255859375, -0.45635986328125, -0.3504638671875, -0.24456787109375, -0.138671875, -0.03277587890625, 0.0731201171875, 0.17901611328125, 0.284912109375, 0.39080810546875, 0.4967041015625, 0.60260009765625, 0.70849609375, 0.81439208984375, 0.9202880859375, 1.02618408203125, 1.132080078125, 1.23797607421875, 1.3438720703125, 1.44976806640625, 1.5556640625, 1.66156005859375, 1.7674560546875, 1.87335205078125, 1.979248046875, 2.08514404296875, 2.1910400390625, 2.29693603515625, 2.40283203125, 2.50872802734375, 2.6146240234375, 2.72052001953125, 2.826416015625, 2.93231201171875, 3.0382080078125, 3.14410400390625, 3.25]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 10.0, 12.0, 16.0, 18.0, 30.0, 59.0, 76.0, 106.0, 160.0, 230.0, 371.0, 561.0, 850.0, 1453.0, 2276.0, 3656.0, 6089.0, 10258.0, 17092.0, 28561.0, 46667.0, 73351.0, 108649.0, 144170.0, 160701.0, 144554.0, 108377.0, 72631.0, 46309.0, 28066.0, 17177.0, 10196.0, 6009.0, 3729.0, 2256.0, 1344.0, 816.0, 552.0, 367.0, 250.0, 145.0, 105.0, 81.0, 58.0, 32.0, 28.0, 18.0, 12.0, 7.0, 5.0, 1.0, 4.0, 5.0, 1.0], "bins": [-1.005859375, -0.9766998291015625, -0.947540283203125, -0.9183807373046875, -0.88922119140625, -0.8600616455078125, -0.830902099609375, -0.8017425537109375, -0.7725830078125, -0.7434234619140625, -0.714263916015625, -0.6851043701171875, -0.65594482421875, -0.6267852783203125, -0.597625732421875, -0.5684661865234375, -0.539306640625, -0.5101470947265625, -0.480987548828125, -0.4518280029296875, -0.42266845703125, -0.3935089111328125, -0.364349365234375, -0.3351898193359375, -0.3060302734375, -0.2768707275390625, -0.247711181640625, -0.2185516357421875, -0.18939208984375, -0.1602325439453125, -0.131072998046875, -0.1019134521484375, -0.07275390625, -0.0435943603515625, -0.014434814453125, 0.0147247314453125, 0.04388427734375, 0.0730438232421875, 0.102203369140625, 0.1313629150390625, 0.1605224609375, 0.1896820068359375, 0.218841552734375, 0.2480010986328125, 0.27716064453125, 0.3063201904296875, 0.335479736328125, 0.3646392822265625, 0.393798828125, 0.4229583740234375, 0.452117919921875, 0.4812774658203125, 0.51043701171875, 0.5395965576171875, 0.568756103515625, 0.5979156494140625, 0.6270751953125, 0.6562347412109375, 0.685394287109375, 0.7145538330078125, 0.74371337890625, 0.7728729248046875, 0.802032470703125, 0.8311920166015625, 0.8603515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 14.0, 12.0, 23.0, 19.0, 17.0, 28.0, 24.0, 40.0, 38.0, 52.0, 43.0, 47.0, 42.0, 50.0, 60.0, 63.0, 43.0, 50.0, 65.0, 40.0, 34.0, 33.0, 30.0, 24.0, 28.0, 18.0, 12.0, 11.0, 14.0, 4.0, 3.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.526708602905273e-05, -6.325077265501022e-05, -6.123445928096771e-05, -5.92181459069252e-05, -5.720183253288269e-05, -5.518551915884018e-05, -5.316920578479767e-05, -5.115289241075516e-05, -4.9136579036712646e-05, -4.7120265662670135e-05, -4.5103952288627625e-05, -4.3087638914585114e-05, -4.10713255405426e-05, -3.905501216650009e-05, -3.703869879245758e-05, -3.502238541841507e-05, -3.300607204437256e-05, -3.098975867033005e-05, -2.8973445296287537e-05, -2.6957131922245026e-05, -2.4940818548202515e-05, -2.2924505174160004e-05, -2.0908191800117493e-05, -1.889187842607498e-05, -1.687556505203247e-05, -1.485925167798996e-05, -1.2842938303947449e-05, -1.0826624929904938e-05, -8.810311555862427e-06, -6.793998181819916e-06, -4.777684807777405e-06, -2.761371433734894e-06, -7.450580596923828e-07, 1.2712553143501282e-06, 3.287568688392639e-06, 5.30388206243515e-06, 7.320195436477661e-06, 9.336508810520172e-06, 1.1352822184562683e-05, 1.3369135558605194e-05, 1.5385448932647705e-05, 1.7401762306690216e-05, 1.9418075680732727e-05, 2.1434389054775238e-05, 2.345070242881775e-05, 2.546701580286026e-05, 2.748332917690277e-05, 2.9499642550945282e-05, 3.151595592498779e-05, 3.3532269299030304e-05, 3.5548582673072815e-05, 3.7564896047115326e-05, 3.958120942115784e-05, 4.159752279520035e-05, 4.361383616924286e-05, 4.563014954328537e-05, 4.764646291732788e-05, 4.966277629137039e-05, 5.16790896654129e-05, 5.3695403039455414e-05, 5.5711716413497925e-05, 5.7728029787540436e-05, 5.974434316158295e-05, 6.176065653562546e-05, 6.377696990966797e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 10.0, 6.0, 12.0, 13.0, 24.0, 28.0, 43.0, 89.0, 128.0, 184.0, 289.0, 535.0, 989.0, 1939.0, 3711.0, 7343.0, 15410.0, 31620.0, 63501.0, 113544.0, 172727.0, 203433.0, 177624.0, 120345.0, 67605.0, 34446.0, 16447.0, 8180.0, 3978.0, 1995.0, 967.0, 549.0, 297.0, 186.0, 119.0, 85.0, 56.0, 31.0, 17.0, 19.0, 14.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.6533203125, -1.60546875, -1.5576171875, -1.509765625, -1.4619140625, -1.4140625, -1.3662109375, -1.318359375, -1.2705078125, -1.22265625, -1.1748046875, -1.126953125, -1.0791015625, -1.03125, -0.9833984375, -0.935546875, -0.8876953125, -0.83984375, -0.7919921875, -0.744140625, -0.6962890625, -0.6484375, -0.6005859375, -0.552734375, -0.5048828125, -0.45703125, -0.4091796875, -0.361328125, -0.3134765625, -0.265625, -0.2177734375, -0.169921875, -0.1220703125, -0.07421875, -0.0263671875, 0.021484375, 0.0693359375, 0.1171875, 0.1650390625, 0.212890625, 0.2607421875, 0.30859375, 0.3564453125, 0.404296875, 0.4521484375, 0.5, 0.5478515625, 0.595703125, 0.6435546875, 0.69140625, 0.7392578125, 0.787109375, 0.8349609375, 0.8828125, 0.9306640625, 0.978515625, 1.0263671875, 1.07421875, 1.1220703125, 1.169921875, 1.2177734375, 1.265625, 1.3134765625, 1.361328125, 1.4091796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 8.0, 6.0, 8.0, 11.0, 8.0, 21.0, 12.0, 34.0, 34.0, 52.0, 43.0, 71.0, 71.0, 79.0, 73.0, 59.0, 62.0, 57.0, 54.0, 48.0, 30.0, 29.0, 35.0, 22.0, 18.0, 16.0, 11.0, 5.0, 8.0, 7.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.615234375, -0.5971298217773438, -0.5790252685546875, -0.5609207153320312, -0.542816162109375, -0.5247116088867188, -0.5066070556640625, -0.48850250244140625, -0.47039794921875, -0.45229339599609375, -0.4341888427734375, -0.41608428955078125, -0.397979736328125, -0.37987518310546875, -0.3617706298828125, -0.34366607666015625, -0.3255615234375, -0.30745697021484375, -0.2893524169921875, -0.27124786376953125, -0.253143310546875, -0.23503875732421875, -0.2169342041015625, -0.19882965087890625, -0.18072509765625, -0.16262054443359375, -0.1445159912109375, -0.12641143798828125, -0.108306884765625, -0.09020233154296875, -0.0720977783203125, -0.05399322509765625, -0.035888671875, -0.01778411865234375, 0.0003204345703125, 0.01842498779296875, 0.036529541015625, 0.05463409423828125, 0.0727386474609375, 0.09084320068359375, 0.10894775390625, 0.12705230712890625, 0.1451568603515625, 0.16326141357421875, 0.181365966796875, 0.19947052001953125, 0.2175750732421875, 0.23567962646484375, 0.2537841796875, 0.27188873291015625, 0.2899932861328125, 0.30809783935546875, 0.326202392578125, 0.34430694580078125, 0.3624114990234375, 0.38051605224609375, 0.39862060546875, 0.41672515869140625, 0.4348297119140625, 0.45293426513671875, 0.471038818359375, 0.48914337158203125, 0.5072479248046875, 0.5253524780273438, 0.54345703125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 4.0, 8.0, 9.0, 12.0, 18.0, 18.0, 22.0, 27.0, 32.0, 26.0, 40.0, 33.0, 41.0, 45.0, 50.0, 45.0, 39.0, 43.0, 51.0, 29.0, 33.0, 39.0, 39.0, 39.0, 37.0, 35.0, 28.0, 33.0, 22.0, 16.0, 15.0, 8.0, 11.0, 10.0, 12.0, 3.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.606533050537109, -4.428823947906494, -4.251114845275879, -4.0734052658081055, -3.8956964015960693, -3.717987060546875, -3.5402779579162598, -3.3625688552856445, -3.1848597526550293, -3.007150650024414, -2.8294413089752197, -2.6517322063446045, -2.4740231037139893, -2.296313762664795, -2.1186046600341797, -1.9408955574035645, -1.7631862163543701, -1.5854769945144653, -1.40776789188385, -1.2300586700439453, -1.05234956741333, -0.8746403455734253, -0.6969311237335205, -0.5192220211029053, -0.3415127992630005, -0.16380362212657928, 0.013905555009841919, 0.19161474704742432, 0.3693239092826843, 0.5470330715179443, 0.7247422933578491, 0.9024513959884644, 1.0801606178283691, 1.257869839668274, 1.4355789422988892, 1.613288164138794, 1.7909972667694092, 1.968706488609314, 2.1464157104492188, 2.324124813079834, 2.501833915710449, 2.6795430183410645, 2.857252359390259, 3.034961462020874, 3.2126705646514893, 3.3903799057006836, 3.568089008331299, 3.745798110961914, 3.9235074520111084, 4.101216793060303, 4.278925895690918, 4.456634998321533, 4.634344100952148, 4.812053203582764, 4.989762306213379, 5.167471885681152, 5.345180988311768, 5.522890090942383, 5.700599193572998, 5.878308296203613, 6.056017875671387, 6.233726978302002, 6.411436080932617, 6.589145183563232, 6.766854286193848]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 9.0, 9.0, 14.0, 17.0, 24.0, 24.0, 22.0, 33.0, 31.0, 42.0, 34.0, 34.0, 41.0, 57.0, 52.0, 48.0, 54.0, 56.0, 42.0, 36.0, 40.0, 27.0, 37.0, 28.0, 31.0, 23.0, 25.0, 19.0, 18.0, 13.0, 8.0, 10.0, 10.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.419719696044922, -5.245616912841797, -5.071514129638672, -4.897411346435547, -4.72330904006958, -4.549206256866455, -4.37510347366333, -4.201000690460205, -4.026898384094238, -3.8527956008911133, -3.6786930561065674, -3.5045902729034424, -3.3304877281188965, -3.1563849449157715, -2.9822821617126465, -2.8081793785095215, -2.6340765953063965, -2.4599738121032715, -2.2858712673187256, -2.1117684841156006, -1.9376658201217651, -1.7635631561279297, -1.5894603729248047, -1.4153577089309692, -1.2412550449371338, -1.0671523809432983, -0.8930496573448181, -0.7189469337463379, -0.5448442697525024, -0.370741605758667, -0.196638822555542, -0.022536158561706543, 0.1515665054321289, 0.32566919922828674, 0.4997718930244446, 0.6738746166229248, 0.8479772806167603, 1.0220799446105957, 1.1961827278137207, 1.3702853918075562, 1.5443880558013916, 1.718490719795227, 1.8925933837890625, 2.0666961669921875, 2.2407989501953125, 2.4149014949798584, 2.5890042781829834, 2.7631068229675293, 2.9372096061706543, 3.1113123893737793, 3.285414934158325, 3.45951771736145, 3.633620262145996, 3.807723045349121, 3.981825828552246, 4.155928611755371, 4.330031394958496, 4.504134178161621, 4.678236961364746, 4.852339744567871, 5.026442050933838, 5.200544834136963, 5.374647617340088, 5.548750400543213, 5.72285270690918]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 7.0, 3.0, 8.0, 20.0, 24.0, 35.0, 45.0, 80.0, 136.0, 205.0, 320.0, 493.0, 680.0, 1113.0, 1542.0, 2339.0, 3434.0, 4928.0, 7269.0, 10565.0, 15196.0, 21199.0, 28352.0, 38253.0, 49151.0, 60675.0, 71988.0, 80866.0, 87183.0, 89407.0, 86298.0, 79505.0, 70013.0, 59148.0, 47233.0, 37177.0, 27354.0, 20096.0, 14453.0, 10237.0, 7025.0, 4762.0, 3276.0, 2254.0, 1441.0, 961.0, 613.0, 412.0, 281.0, 180.0, 102.0, 77.0, 55.0, 43.0, 21.0, 16.0, 7.0, 3.0, 7.0, 5.0, 0.0, 0.0, 1.0], "bins": [-2.1953125, -2.1231689453125, -2.051025390625, -1.9788818359375, -1.90673828125, -1.8345947265625, -1.762451171875, -1.6903076171875, -1.6181640625, -1.5460205078125, -1.473876953125, -1.4017333984375, -1.32958984375, -1.2574462890625, -1.185302734375, -1.1131591796875, -1.041015625, -0.9688720703125, -0.896728515625, -0.8245849609375, -0.75244140625, -0.6802978515625, -0.608154296875, -0.5360107421875, -0.4638671875, -0.3917236328125, -0.319580078125, -0.2474365234375, -0.17529296875, -0.1031494140625, -0.031005859375, 0.0411376953125, 0.11328125, 0.1854248046875, 0.257568359375, 0.3297119140625, 0.40185546875, 0.4739990234375, 0.546142578125, 0.6182861328125, 0.6904296875, 0.7625732421875, 0.834716796875, 0.9068603515625, 0.97900390625, 1.0511474609375, 1.123291015625, 1.1954345703125, 1.267578125, 1.3397216796875, 1.411865234375, 1.4840087890625, 1.55615234375, 1.6282958984375, 1.700439453125, 1.7725830078125, 1.8447265625, 1.9168701171875, 1.989013671875, 2.0611572265625, 2.13330078125, 2.2054443359375, 2.277587890625, 2.3497314453125, 2.421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 7.0, 8.0, 3.0, 3.0, 9.0, 11.0, 11.0, 19.0, 16.0, 25.0, 31.0, 24.0, 35.0, 33.0, 39.0, 29.0, 36.0, 44.0, 43.0, 49.0, 40.0, 43.0, 53.0, 49.0, 45.0, 34.0, 30.0, 34.0, 34.0, 34.0, 31.0, 15.0, 12.0, 17.0, 8.0, 6.0, 5.0, 8.0, 7.0, 5.0, 6.0, 7.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.5625, -5.391845703125, -5.22119140625, -5.050537109375, -4.8798828125, -4.709228515625, -4.53857421875, -4.367919921875, -4.197265625, -4.026611328125, -3.85595703125, -3.685302734375, -3.5146484375, -3.343994140625, -3.17333984375, -3.002685546875, -2.83203125, -2.661376953125, -2.49072265625, -2.320068359375, -2.1494140625, -1.978759765625, -1.80810546875, -1.637451171875, -1.466796875, -1.296142578125, -1.12548828125, -0.954833984375, -0.7841796875, -0.613525390625, -0.44287109375, -0.272216796875, -0.1015625, 0.069091796875, 0.23974609375, 0.410400390625, 0.5810546875, 0.751708984375, 0.92236328125, 1.093017578125, 1.263671875, 1.434326171875, 1.60498046875, 1.775634765625, 1.9462890625, 2.116943359375, 2.28759765625, 2.458251953125, 2.62890625, 2.799560546875, 2.97021484375, 3.140869140625, 3.3115234375, 3.482177734375, 3.65283203125, 3.823486328125, 3.994140625, 4.164794921875, 4.33544921875, 4.506103515625, 4.6767578125, 4.847412109375, 5.01806640625, 5.188720703125, 5.359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 11.0, 19.0, 24.0, 42.0, 56.0, 101.0, 128.0, 247.0, 375.0, 554.0, 800.0, 1374.0, 2057.0, 3105.0, 4783.0, 7070.0, 10708.0, 15354.0, 22102.0, 30598.0, 41435.0, 53931.0, 66941.0, 79995.0, 89466.0, 95261.0, 95177.0, 89257.0, 79571.0, 66672.0, 53610.0, 40522.0, 30335.0, 21409.0, 15011.0, 10348.0, 6924.0, 4481.0, 3079.0, 1979.0, 1283.0, 825.0, 565.0, 366.0, 231.0, 142.0, 92.0, 50.0, 33.0, 24.0, 13.0, 10.0, 4.0, 4.0, 6.0, 1.0], "bins": [-2.828125, -2.744873046875, -2.66162109375, -2.578369140625, -2.4951171875, -2.411865234375, -2.32861328125, -2.245361328125, -2.162109375, -2.078857421875, -1.99560546875, -1.912353515625, -1.8291015625, -1.745849609375, -1.66259765625, -1.579345703125, -1.49609375, -1.412841796875, -1.32958984375, -1.246337890625, -1.1630859375, -1.079833984375, -0.99658203125, -0.913330078125, -0.830078125, -0.746826171875, -0.66357421875, -0.580322265625, -0.4970703125, -0.413818359375, -0.33056640625, -0.247314453125, -0.1640625, -0.080810546875, 0.00244140625, 0.085693359375, 0.1689453125, 0.252197265625, 0.33544921875, 0.418701171875, 0.501953125, 0.585205078125, 0.66845703125, 0.751708984375, 0.8349609375, 0.918212890625, 1.00146484375, 1.084716796875, 1.16796875, 1.251220703125, 1.33447265625, 1.417724609375, 1.5009765625, 1.584228515625, 1.66748046875, 1.750732421875, 1.833984375, 1.917236328125, 2.00048828125, 2.083740234375, 2.1669921875, 2.250244140625, 2.33349609375, 2.416748046875, 2.5]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 6.0, 7.0, 10.0, 10.0, 7.0, 18.0, 8.0, 21.0, 17.0, 20.0, 12.0, 19.0, 29.0, 23.0, 28.0, 47.0, 37.0, 32.0, 34.0, 31.0, 33.0, 44.0, 36.0, 41.0, 37.0, 38.0, 31.0, 34.0, 40.0, 35.0, 19.0, 22.0, 28.0, 12.0, 17.0, 11.0, 19.0, 11.0, 11.0, 11.0, 12.0, 5.0, 4.0, 6.0, 6.0, 5.0, 2.0, 0.0, 6.0, 1.0, 1.0], "bins": [-3.21484375, -3.121429443359375, -3.02801513671875, -2.934600830078125, -2.8411865234375, -2.747772216796875, -2.65435791015625, -2.560943603515625, -2.467529296875, -2.374114990234375, -2.28070068359375, -2.187286376953125, -2.0938720703125, -2.000457763671875, -1.90704345703125, -1.813629150390625, -1.72021484375, -1.626800537109375, -1.53338623046875, -1.439971923828125, -1.3465576171875, -1.253143310546875, -1.15972900390625, -1.066314697265625, -0.972900390625, -0.879486083984375, -0.78607177734375, -0.692657470703125, -0.5992431640625, -0.505828857421875, -0.41241455078125, -0.319000244140625, -0.2255859375, -0.132171630859375, -0.03875732421875, 0.054656982421875, 0.1480712890625, 0.241485595703125, 0.33489990234375, 0.428314208984375, 0.521728515625, 0.615142822265625, 0.70855712890625, 0.801971435546875, 0.8953857421875, 0.988800048828125, 1.08221435546875, 1.175628662109375, 1.26904296875, 1.362457275390625, 1.45587158203125, 1.549285888671875, 1.6427001953125, 1.736114501953125, 1.82952880859375, 1.922943115234375, 2.016357421875, 2.109771728515625, 2.20318603515625, 2.296600341796875, 2.3900146484375, 2.483428955078125, 2.57684326171875, 2.670257568359375, 2.763671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 7.0, 4.0, 11.0, 11.0, 24.0, 29.0, 39.0, 49.0, 71.0, 108.0, 118.0, 195.0, 259.0, 395.0, 591.0, 882.0, 1483.0, 2224.0, 3649.0, 6133.0, 10201.0, 16945.0, 28466.0, 45726.0, 70258.0, 98269.0, 124988.0, 139623.0, 135865.0, 115867.0, 87994.0, 60268.0, 38266.0, 23630.0, 13884.0, 8394.0, 5094.0, 2981.0, 1906.0, 1202.0, 758.0, 499.0, 363.0, 247.0, 170.0, 120.0, 75.0, 72.0, 47.0, 39.0, 24.0, 17.0, 5.0, 8.0, 9.0, 4.0, 2.0], "bins": [-1.72265625, -1.6731719970703125, -1.623687744140625, -1.5742034912109375, -1.52471923828125, -1.4752349853515625, -1.425750732421875, -1.3762664794921875, -1.3267822265625, -1.2772979736328125, -1.227813720703125, -1.1783294677734375, -1.12884521484375, -1.0793609619140625, -1.029876708984375, -0.9803924560546875, -0.930908203125, -0.8814239501953125, -0.831939697265625, -0.7824554443359375, -0.73297119140625, -0.6834869384765625, -0.634002685546875, -0.5845184326171875, -0.5350341796875, -0.4855499267578125, -0.436065673828125, -0.3865814208984375, -0.33709716796875, -0.2876129150390625, -0.238128662109375, -0.1886444091796875, -0.13916015625, -0.0896759033203125, -0.040191650390625, 0.0092926025390625, 0.05877685546875, 0.1082611083984375, 0.157745361328125, 0.2072296142578125, 0.2567138671875, 0.3061981201171875, 0.355682373046875, 0.4051666259765625, 0.45465087890625, 0.5041351318359375, 0.553619384765625, 0.6031036376953125, 0.652587890625, 0.7020721435546875, 0.751556396484375, 0.8010406494140625, 0.85052490234375, 0.9000091552734375, 0.949493408203125, 0.9989776611328125, 1.0484619140625, 1.0979461669921875, 1.147430419921875, 1.1969146728515625, 1.24639892578125, 1.2958831787109375, 1.345367431640625, 1.3948516845703125, 1.4443359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 8.0, 10.0, 15.0, 27.0, 25.0, 37.0, 42.0, 46.0, 50.0, 62.0, 71.0, 83.0, 73.0, 66.0, 72.0, 70.0, 52.0, 59.0, 33.0, 25.0, 16.0, 17.0, 11.0, 6.0, 9.0, 5.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00025844573974609375, -0.0002501383423805237, -0.0002418309450149536, -0.00023352354764938354, -0.00022521615028381348, -0.0002169087529182434, -0.00020860135555267334, -0.00020029395818710327, -0.0001919865608215332, -0.00018367916345596313, -0.00017537176609039307, -0.000167064368724823, -0.00015875697135925293, -0.00015044957399368286, -0.0001421421766281128, -0.00013383477926254272, -0.00012552738189697266, -0.00011721998453140259, -0.00010891258716583252, -0.00010060518980026245, -9.229779243469238e-05, -8.399039506912231e-05, -7.568299770355225e-05, -6.737560033798218e-05, -5.906820297241211e-05, -5.076080560684204e-05, -4.245340824127197e-05, -3.4146010875701904e-05, -2.5838613510131836e-05, -1.7531216144561768e-05, -9.2238187789917e-06, -9.164214134216309e-07, 7.3909759521484375e-06, 1.5698373317718506e-05, 2.4005770683288574e-05, 3.231316804885864e-05, 4.062056541442871e-05, 4.892796277999878e-05, 5.723536014556885e-05, 6.554275751113892e-05, 7.385015487670898e-05, 8.215755224227905e-05, 9.046494960784912e-05, 9.877234697341919e-05, 0.00010707974433898926, 0.00011538714170455933, 0.0001236945390701294, 0.00013200193643569946, 0.00014030933380126953, 0.0001486167311668396, 0.00015692412853240967, 0.00016523152589797974, 0.0001735389232635498, 0.00018184632062911987, 0.00019015371799468994, 0.00019846111536026, 0.00020676851272583008, 0.00021507591009140015, 0.00022338330745697021, 0.00023169070482254028, 0.00023999810218811035, 0.0002483054995536804, 0.0002566128969192505, 0.00026492029428482056, 0.0002732276916503906]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 7.0, 3.0, 5.0, 15.0, 10.0, 22.0, 31.0, 32.0, 62.0, 88.0, 99.0, 157.0, 196.0, 296.0, 426.0, 605.0, 892.0, 1475.0, 2403.0, 4152.0, 7231.0, 13458.0, 24308.0, 43709.0, 75054.0, 115455.0, 152411.0, 168060.0, 151982.0, 114190.0, 73600.0, 43098.0, 23902.0, 12958.0, 7181.0, 4145.0, 2447.0, 1470.0, 934.0, 629.0, 399.0, 279.0, 201.0, 134.0, 91.0, 88.0, 48.0, 38.0, 26.0, 16.0, 14.0, 7.0, 13.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.9169921875, -1.8541107177734375, -1.791229248046875, -1.7283477783203125, -1.66546630859375, -1.6025848388671875, -1.539703369140625, -1.4768218994140625, -1.4139404296875, -1.3510589599609375, -1.288177490234375, -1.2252960205078125, -1.16241455078125, -1.0995330810546875, -1.036651611328125, -0.9737701416015625, -0.910888671875, -0.8480072021484375, -0.785125732421875, -0.7222442626953125, -0.65936279296875, -0.5964813232421875, -0.533599853515625, -0.4707183837890625, -0.4078369140625, -0.3449554443359375, -0.282073974609375, -0.2191925048828125, -0.15631103515625, -0.0934295654296875, -0.030548095703125, 0.0323333740234375, 0.09521484375, 0.1580963134765625, 0.220977783203125, 0.2838592529296875, 0.34674072265625, 0.4096221923828125, 0.472503662109375, 0.5353851318359375, 0.5982666015625, 0.6611480712890625, 0.724029541015625, 0.7869110107421875, 0.84979248046875, 0.9126739501953125, 0.975555419921875, 1.0384368896484375, 1.101318359375, 1.1641998291015625, 1.227081298828125, 1.2899627685546875, 1.35284423828125, 1.4157257080078125, 1.478607177734375, 1.5414886474609375, 1.6043701171875, 1.6672515869140625, 1.730133056640625, 1.7930145263671875, 1.85589599609375, 1.9187774658203125, 1.981658935546875, 2.0445404052734375, 2.107421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 5.0, 6.0, 4.0, 11.0, 7.0, 23.0, 18.0, 26.0, 31.0, 43.0, 46.0, 49.0, 61.0, 76.0, 77.0, 65.0, 60.0, 69.0, 54.0, 62.0, 38.0, 36.0, 25.0, 24.0, 21.0, 16.0, 11.0, 12.0, 7.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79638671875, -0.7698135375976562, -0.7432403564453125, -0.7166671752929688, -0.690093994140625, -0.6635208129882812, -0.6369476318359375, -0.6103744506835938, -0.58380126953125, -0.5572280883789062, -0.5306549072265625, -0.5040817260742188, -0.477508544921875, -0.45093536376953125, -0.4243621826171875, -0.39778900146484375, -0.3712158203125, -0.34464263916015625, -0.3180694580078125, -0.29149627685546875, -0.264923095703125, -0.23834991455078125, -0.2117767333984375, -0.18520355224609375, -0.15863037109375, -0.13205718994140625, -0.1054840087890625, -0.07891082763671875, -0.052337646484375, -0.02576446533203125, 0.0008087158203125, 0.02738189697265625, 0.053955078125, 0.08052825927734375, 0.1071014404296875, 0.13367462158203125, 0.160247802734375, 0.18682098388671875, 0.2133941650390625, 0.23996734619140625, 0.26654052734375, 0.29311370849609375, 0.3196868896484375, 0.34626007080078125, 0.372833251953125, 0.39940643310546875, 0.4259796142578125, 0.45255279541015625, 0.4791259765625, 0.5056991577148438, 0.5322723388671875, 0.5588455200195312, 0.585418701171875, 0.6119918823242188, 0.6385650634765625, 0.6651382446289062, 0.69171142578125, 0.7182846069335938, 0.7448577880859375, 0.7714309692382812, 0.798004150390625, 0.8245773315429688, 0.8511505126953125, 0.8777236938476562, 0.904296875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 7.0, 6.0, 5.0, 8.0, 4.0, 12.0, 11.0, 15.0, 30.0, 29.0, 21.0, 27.0, 35.0, 35.0, 41.0, 44.0, 50.0, 44.0, 47.0, 42.0, 37.0, 42.0, 33.0, 38.0, 39.0, 26.0, 42.0, 29.0, 42.0, 25.0, 22.0, 24.0, 11.0, 18.0, 18.0, 6.0, 14.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.629572868347168, -4.454378604888916, -4.279183864593506, -4.103989601135254, -3.928795099258423, -3.753600597381592, -3.57840633392334, -3.403211832046509, -3.2280173301696777, -3.0528228282928467, -2.8776283264160156, -2.7024340629577637, -2.5272395610809326, -2.3520450592041016, -2.1768507957458496, -2.0016562938690186, -1.8264617919921875, -1.6512672901153564, -1.476072907447815, -1.3008785247802734, -1.1256840229034424, -0.9504895806312561, -0.7752951383590698, -0.6001007556915283, -0.42490625381469727, -0.249711811542511, -0.07451736927032471, 0.10067707300186157, 0.27587151527404785, 0.45106595754623413, 0.6262603998184204, 0.8014547824859619, 0.976649284362793, 1.151843786239624, 1.3270381689071655, 1.502232551574707, 1.677427053451538, 1.8526215553283691, 2.027815818786621, 2.203010320663452, 2.378204822540283, 2.5533993244171143, 2.7285938262939453, 2.9037880897521973, 3.0789825916290283, 3.2541770935058594, 3.4293713569641113, 3.6045658588409424, 3.7797603607177734, 3.9549548625946045, 4.1301493644714355, 4.3053436279296875, 4.480538368225098, 4.65573263168335, 4.830926895141602, 5.006121635437012, 5.181315898895264, 5.356510162353516, 5.531704902648926, 5.706899166107178, 5.88209342956543, 6.05728816986084, 6.232482433319092, 6.407676696777344, 6.582871437072754]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 5.0, 3.0, 6.0, 9.0, 12.0, 19.0, 20.0, 19.0, 33.0, 22.0, 20.0, 39.0, 47.0, 34.0, 43.0, 41.0, 44.0, 49.0, 48.0, 43.0, 51.0, 34.0, 31.0, 44.0, 35.0, 43.0, 36.0, 28.0, 16.0, 14.0, 25.0, 16.0, 15.0, 15.0, 7.0, 9.0, 6.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.130115032196045, -5.945184707641602, -5.76025390625, -5.575323104858398, -5.390392780303955, -5.205462455749512, -5.02053165435791, -4.835600852966309, -4.650670528411865, -4.465740203857422, -4.28080940246582, -4.095878601074219, -3.9109482765197754, -3.726017713546753, -3.5410871505737305, -3.356156587600708, -3.1712260246276855, -2.986295461654663, -2.8013648986816406, -2.616434335708618, -2.4315037727355957, -2.2465732097625732, -2.061642646789551, -1.8767120838165283, -1.6917815208435059, -1.5068509578704834, -1.321920394897461, -1.1369898319244385, -0.952059268951416, -0.7671287059783936, -0.5821981430053711, -0.39726758003234863, -0.21233701705932617, -0.02740645408630371, 0.15752410888671875, 0.3424546718597412, 0.5273852348327637, 0.7123157978057861, 0.8972463607788086, 1.082176923751831, 1.2671074867248535, 1.452038049697876, 1.6369686126708984, 1.821899175643921, 2.0068297386169434, 2.191760301589966, 2.3766908645629883, 2.5616214275360107, 2.746551990509033, 2.9314825534820557, 3.116413116455078, 3.3013436794281006, 3.486274242401123, 3.6712048053741455, 3.856135368347168, 4.0410661697387695, 4.225996494293213, 4.410926818847656, 4.595857620239258, 4.780788421630859, 4.965718746185303, 5.150649070739746, 5.335579872131348, 5.520510673522949, 5.705440998077393]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 5.0, 6.0, 10.0, 16.0, 37.0, 53.0, 87.0, 126.0, 215.0, 341.0, 539.0, 813.0, 1322.0, 2041.0, 3431.0, 5646.0, 9188.0, 15043.0, 24286.0, 39685.0, 63116.0, 99632.0, 152582.0, 225284.0, 315492.0, 409150.0, 485593.0, 512007.0, 482289.0, 403513.0, 310456.0, 220785.0, 149417.0, 96920.0, 62406.0, 38983.0, 24192.0, 15112.0, 9232.0, 5650.0, 3637.0, 2181.0, 1418.0, 841.0, 512.0, 379.0, 227.0, 127.0, 83.0, 65.0, 47.0, 25.0, 20.0, 8.0, 10.0, 10.0, 2.0, 3.0], "bins": [-4.96875, -4.82037353515625, -4.6719970703125, -4.52362060546875, -4.375244140625, -4.22686767578125, -4.0784912109375, -3.93011474609375, -3.78173828125, -3.63336181640625, -3.4849853515625, -3.33660888671875, -3.188232421875, -3.03985595703125, -2.8914794921875, -2.74310302734375, -2.5947265625, -2.44635009765625, -2.2979736328125, -2.14959716796875, -2.001220703125, -1.85284423828125, -1.7044677734375, -1.55609130859375, -1.40771484375, -1.25933837890625, -1.1109619140625, -0.96258544921875, -0.814208984375, -0.66583251953125, -0.5174560546875, -0.36907958984375, -0.220703125, -0.07232666015625, 0.0760498046875, 0.22442626953125, 0.372802734375, 0.52117919921875, 0.6695556640625, 0.81793212890625, 0.96630859375, 1.11468505859375, 1.2630615234375, 1.41143798828125, 1.559814453125, 1.70819091796875, 1.8565673828125, 2.00494384765625, 2.1533203125, 2.30169677734375, 2.4500732421875, 2.59844970703125, 2.746826171875, 2.89520263671875, 3.0435791015625, 3.19195556640625, 3.34033203125, 3.48870849609375, 3.6370849609375, 3.78546142578125, 3.933837890625, 4.08221435546875, 4.2305908203125, 4.37896728515625, 4.52734375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 13.0, 9.0, 8.0, 7.0, 15.0, 18.0, 18.0, 18.0, 21.0, 25.0, 33.0, 31.0, 32.0, 36.0, 47.0, 30.0, 42.0, 46.0, 37.0, 61.0, 34.0, 47.0, 33.0, 35.0, 35.0, 42.0, 32.0, 30.0, 20.0, 18.0, 22.0, 17.0, 13.0, 13.0, 12.0, 14.0, 10.0, 2.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.89453125, -4.732421875, -4.5703125, -4.408203125, -4.24609375, -4.083984375, -3.921875, -3.759765625, -3.59765625, -3.435546875, -3.2734375, -3.111328125, -2.94921875, -2.787109375, -2.625, -2.462890625, -2.30078125, -2.138671875, -1.9765625, -1.814453125, -1.65234375, -1.490234375, -1.328125, -1.166015625, -1.00390625, -0.841796875, -0.6796875, -0.517578125, -0.35546875, -0.193359375, -0.03125, 0.130859375, 0.29296875, 0.455078125, 0.6171875, 0.779296875, 0.94140625, 1.103515625, 1.265625, 1.427734375, 1.58984375, 1.751953125, 1.9140625, 2.076171875, 2.23828125, 2.400390625, 2.5625, 2.724609375, 2.88671875, 3.048828125, 3.2109375, 3.373046875, 3.53515625, 3.697265625, 3.859375, 4.021484375, 4.18359375, 4.345703125, 4.5078125, 4.669921875, 4.83203125, 4.994140625, 5.15625, 5.318359375, 5.48046875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 9.0, 22.0, 26.0, 49.0, 72.0, 107.0, 177.0, 271.0, 481.0, 731.0, 1291.0, 2118.0, 3515.0, 5804.0, 9666.0, 16200.0, 27074.0, 44241.0, 71532.0, 113834.0, 172312.0, 249372.0, 341674.0, 426890.0, 489286.0, 500957.0, 462004.0, 384676.0, 292543.0, 206408.0, 139017.0, 89568.0, 56511.0, 34265.0, 20720.0, 12380.0, 7433.0, 4313.0, 2629.0, 1562.0, 1013.0, 554.0, 367.0, 208.0, 158.0, 91.0, 51.0, 37.0, 19.0, 16.0, 11.0, 8.0, 4.0, 3.0, 1.0, 2.0], "bins": [-5.875, -5.6982421875, -5.521484375, -5.3447265625, -5.16796875, -4.9912109375, -4.814453125, -4.6376953125, -4.4609375, -4.2841796875, -4.107421875, -3.9306640625, -3.75390625, -3.5771484375, -3.400390625, -3.2236328125, -3.046875, -2.8701171875, -2.693359375, -2.5166015625, -2.33984375, -2.1630859375, -1.986328125, -1.8095703125, -1.6328125, -1.4560546875, -1.279296875, -1.1025390625, -0.92578125, -0.7490234375, -0.572265625, -0.3955078125, -0.21875, -0.0419921875, 0.134765625, 0.3115234375, 0.48828125, 0.6650390625, 0.841796875, 1.0185546875, 1.1953125, 1.3720703125, 1.548828125, 1.7255859375, 1.90234375, 2.0791015625, 2.255859375, 2.4326171875, 2.609375, 2.7861328125, 2.962890625, 3.1396484375, 3.31640625, 3.4931640625, 3.669921875, 3.8466796875, 4.0234375, 4.2001953125, 4.376953125, 4.5537109375, 4.73046875, 4.9072265625, 5.083984375, 5.2607421875, 5.4375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 8.0, 12.0, 14.0, 12.0, 19.0, 15.0, 32.0, 34.0, 47.0, 55.0, 60.0, 69.0, 95.0, 111.0, 121.0, 128.0, 153.0, 152.0, 152.0, 175.0, 172.0, 187.0, 203.0, 198.0, 188.0, 175.0, 173.0, 159.0, 171.0, 145.0, 128.0, 104.0, 88.0, 95.0, 73.0, 59.0, 65.0, 53.0, 45.0, 26.0, 25.0, 24.0, 13.0, 15.0, 9.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0], "bins": [-2.533203125, -2.458160400390625, -2.38311767578125, -2.308074951171875, -2.2330322265625, -2.157989501953125, -2.08294677734375, -2.007904052734375, -1.932861328125, -1.857818603515625, -1.78277587890625, -1.707733154296875, -1.6326904296875, -1.557647705078125, -1.48260498046875, -1.407562255859375, -1.33251953125, -1.257476806640625, -1.18243408203125, -1.107391357421875, -1.0323486328125, -0.957305908203125, -0.88226318359375, -0.807220458984375, -0.732177734375, -0.657135009765625, -0.58209228515625, -0.507049560546875, -0.4320068359375, -0.356964111328125, -0.28192138671875, -0.206878662109375, -0.1318359375, -0.056793212890625, 0.01824951171875, 0.093292236328125, 0.1683349609375, 0.243377685546875, 0.31842041015625, 0.393463134765625, 0.468505859375, 0.543548583984375, 0.61859130859375, 0.693634033203125, 0.7686767578125, 0.843719482421875, 0.91876220703125, 0.993804931640625, 1.06884765625, 1.143890380859375, 1.21893310546875, 1.293975830078125, 1.3690185546875, 1.444061279296875, 1.51910400390625, 1.594146728515625, 1.669189453125, 1.744232177734375, 1.81927490234375, 1.894317626953125, 1.9693603515625, 2.044403076171875, 2.11944580078125, 2.194488525390625, 2.26953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 7.0, 5.0, 12.0, 4.0, 15.0, 15.0, 11.0, 18.0, 20.0, 26.0, 26.0, 23.0, 46.0, 32.0, 38.0, 33.0, 34.0, 40.0, 30.0, 55.0, 37.0, 35.0, 30.0, 36.0, 42.0, 39.0, 37.0, 32.0, 29.0, 35.0, 22.0, 24.0, 19.0, 13.0, 14.0, 12.0, 8.0, 9.0, 14.0, 4.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.971009254455566, -5.765902519226074, -5.560795307159424, -5.355688571929932, -5.150581359863281, -4.945474624633789, -4.740367889404297, -4.5352606773376465, -4.330153465270996, -4.125046730041504, -3.9199395179748535, -3.7148327827453613, -3.509725570678711, -3.3046188354492188, -3.0995118618011475, -2.894404888153076, -2.689298152923584, -2.4841911792755127, -2.2790842056274414, -2.073977470397949, -1.8688703775405884, -1.663763403892517, -1.4586565494537354, -1.253549575805664, -1.0484426021575928, -0.8433356285095215, -0.638228714466095, -0.43312180042266846, -0.22801482677459717, -0.02290785312652588, 0.18219900131225586, 0.38730597496032715, 0.5924124717712402, 0.7975194454193115, 1.0026264190673828, 1.2077332735061646, 1.4128402471542358, 1.6179472208023071, 1.8230540752410889, 2.02816104888916, 2.2332680225372314, 2.4383749961853027, 2.643481969833374, 2.8485889434814453, 3.0536956787109375, 3.258802890777588, 3.46390962600708, 3.6690165996551514, 3.8741235733032227, 4.079230308532715, 4.284337520599365, 4.489444255828857, 4.694551467895508, 4.899658203125, 5.104764938354492, 5.309872150421143, 5.514979362487793, 5.720086097717285, 5.9251933097839355, 6.130300045013428, 6.335407257080078, 6.54051399230957, 6.7456207275390625, 6.950727939605713, 7.155834674835205]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 8.0, 17.0, 19.0, 18.0, 21.0, 24.0, 26.0, 32.0, 37.0, 39.0, 43.0, 49.0, 35.0, 45.0, 45.0, 50.0, 57.0, 36.0, 39.0, 39.0, 47.0, 29.0, 36.0, 25.0, 25.0, 25.0, 25.0, 18.0, 16.0, 10.0, 7.0, 14.0, 6.0, 5.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.6981635093688965, -7.480841159820557, -7.263519287109375, -7.046196937561035, -6.8288750648498535, -6.611552715301514, -6.394230842590332, -6.176908493041992, -5.959586143493652, -5.7422637939453125, -5.524941921234131, -5.307619571685791, -5.090297698974609, -4.8729753494262695, -4.65565299987793, -4.438331127166748, -4.221009254455566, -4.003686904907227, -3.786365032196045, -3.569042682647705, -3.3517208099365234, -3.1343984603881836, -2.917076349258423, -2.699754238128662, -2.4824321269989014, -2.2651100158691406, -2.04778790473938, -1.8304656744003296, -1.6131435632705688, -1.395821452140808, -1.1784992218017578, -0.9611771106719971, -0.7438549995422363, -0.5265328884124756, -0.30921071767807007, -0.09188854694366455, 0.1254335641860962, 0.34275567531585693, 0.5600779056549072, 0.777400016784668, 0.9947221279144287, 1.2120442390441895, 1.4293663501739502, 1.6466885805130005, 1.8640106916427612, 2.0813326835632324, 2.2986550331115723, 2.515977144241333, 2.7332992553710938, 2.9506213665008545, 3.1679434776306152, 3.385265827178955, 3.6025876998901367, 3.8199100494384766, 4.037232398986816, 4.254554271697998, 4.47187614440918, 4.6891984939575195, 4.906520366668701, 5.123842716217041, 5.341164588928223, 5.5584869384765625, 5.775809288024902, 5.993131160736084, 6.210453510284424]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 7.0, 16.0, 10.0, 16.0, 26.0, 46.0, 30.0, 57.0, 87.0, 112.0, 146.0, 232.0, 309.0, 633.0, 1143.0, 2161.0, 5053.0, 12342.0, 31300.0, 74814.0, 155189.0, 240988.0, 239847.0, 155168.0, 74942.0, 31369.0, 12424.0, 4956.0, 2234.0, 1075.0, 651.0, 325.0, 262.0, 163.0, 111.0, 74.0, 61.0, 47.0, 30.0, 20.0, 26.0, 14.0, 9.0, 8.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-5.11328125, -4.962890625, -4.8125, -4.662109375, -4.51171875, -4.361328125, -4.2109375, -4.060546875, -3.91015625, -3.759765625, -3.609375, -3.458984375, -3.30859375, -3.158203125, -3.0078125, -2.857421875, -2.70703125, -2.556640625, -2.40625, -2.255859375, -2.10546875, -1.955078125, -1.8046875, -1.654296875, -1.50390625, -1.353515625, -1.203125, -1.052734375, -0.90234375, -0.751953125, -0.6015625, -0.451171875, -0.30078125, -0.150390625, 0.0, 0.150390625, 0.30078125, 0.451171875, 0.6015625, 0.751953125, 0.90234375, 1.052734375, 1.203125, 1.353515625, 1.50390625, 1.654296875, 1.8046875, 1.955078125, 2.10546875, 2.255859375, 2.40625, 2.556640625, 2.70703125, 2.857421875, 3.0078125, 3.158203125, 3.30859375, 3.458984375, 3.609375, 3.759765625, 3.91015625, 4.060546875, 4.2109375, 4.361328125, 4.51171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 9.0, 4.0, 2.0, 6.0, 15.0, 14.0, 21.0, 26.0, 24.0, 23.0, 35.0, 30.0, 44.0, 32.0, 50.0, 38.0, 47.0, 40.0, 53.0, 53.0, 54.0, 56.0, 41.0, 34.0, 28.0, 34.0, 36.0, 22.0, 22.0, 24.0, 15.0, 16.0, 10.0, 14.0, 8.0, 5.0, 2.0, 7.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.09375, -7.8519287109375, -7.610107421875, -7.3682861328125, -7.12646484375, -6.8846435546875, -6.642822265625, -6.4010009765625, -6.1591796875, -5.9173583984375, -5.675537109375, -5.4337158203125, -5.19189453125, -4.9500732421875, -4.708251953125, -4.4664306640625, -4.224609375, -3.9827880859375, -3.740966796875, -3.4991455078125, -3.25732421875, -3.0155029296875, -2.773681640625, -2.5318603515625, -2.2900390625, -2.0482177734375, -1.806396484375, -1.5645751953125, -1.32275390625, -1.0809326171875, -0.839111328125, -0.5972900390625, -0.35546875, -0.1136474609375, 0.128173828125, 0.3699951171875, 0.61181640625, 0.8536376953125, 1.095458984375, 1.3372802734375, 1.5791015625, 1.8209228515625, 2.062744140625, 2.3045654296875, 2.54638671875, 2.7882080078125, 3.030029296875, 3.2718505859375, 3.513671875, 3.7554931640625, 3.997314453125, 4.2391357421875, 4.48095703125, 4.7227783203125, 4.964599609375, 5.2064208984375, 5.4482421875, 5.6900634765625, 5.931884765625, 6.1737060546875, 6.41552734375, 6.6573486328125, 6.899169921875, 7.1409912109375, 7.3828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 6.0, 3.0, 7.0, 4.0, 5.0, 4.0, 14.0, 18.0, 29.0, 22.0, 49.0, 46.0, 57.0, 80.0, 109.0, 183.0, 305.0, 470.0, 795.0, 1426.0, 2840.0, 5911.0, 13474.0, 32937.0, 84607.0, 196841.0, 305393.0, 228568.0, 103276.0, 40356.0, 16356.0, 7002.0, 3323.0, 1668.0, 861.0, 493.0, 296.0, 214.0, 136.0, 97.0, 80.0, 56.0, 37.0, 30.0, 21.0, 14.0, 11.0, 11.0, 6.0, 8.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21484375, -5.99761962890625, -5.7803955078125, -5.56317138671875, -5.345947265625, -5.12872314453125, -4.9114990234375, -4.69427490234375, -4.47705078125, -4.25982666015625, -4.0426025390625, -3.82537841796875, -3.608154296875, -3.39093017578125, -3.1737060546875, -2.95648193359375, -2.7392578125, -2.52203369140625, -2.3048095703125, -2.08758544921875, -1.870361328125, -1.65313720703125, -1.4359130859375, -1.21868896484375, -1.00146484375, -0.78424072265625, -0.5670166015625, -0.34979248046875, -0.132568359375, 0.08465576171875, 0.3018798828125, 0.51910400390625, 0.736328125, 0.95355224609375, 1.1707763671875, 1.38800048828125, 1.605224609375, 1.82244873046875, 2.0396728515625, 2.25689697265625, 2.47412109375, 2.69134521484375, 2.9085693359375, 3.12579345703125, 3.343017578125, 3.56024169921875, 3.7774658203125, 3.99468994140625, 4.2119140625, 4.42913818359375, 4.6463623046875, 4.86358642578125, 5.080810546875, 5.29803466796875, 5.5152587890625, 5.73248291015625, 5.94970703125, 6.16693115234375, 6.3841552734375, 6.60137939453125, 6.818603515625, 7.03582763671875, 7.2530517578125, 7.47027587890625, 7.6875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 2.0, 8.0, 10.0, 7.0, 23.0, 20.0, 13.0, 38.0, 27.0, 33.0, 36.0, 26.0, 46.0, 46.0, 48.0, 45.0, 41.0, 55.0, 44.0, 47.0, 49.0, 45.0, 49.0, 42.0, 39.0, 16.0, 33.0, 15.0, 19.0, 14.0, 10.0, 12.0, 6.0, 4.0, 7.0, 6.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.41796875, -5.2664794921875, -5.114990234375, -4.9635009765625, -4.81201171875, -4.6605224609375, -4.509033203125, -4.3575439453125, -4.2060546875, -4.0545654296875, -3.903076171875, -3.7515869140625, -3.60009765625, -3.4486083984375, -3.297119140625, -3.1456298828125, -2.994140625, -2.8426513671875, -2.691162109375, -2.5396728515625, -2.38818359375, -2.2366943359375, -2.085205078125, -1.9337158203125, -1.7822265625, -1.6307373046875, -1.479248046875, -1.3277587890625, -1.17626953125, -1.0247802734375, -0.873291015625, -0.7218017578125, -0.5703125, -0.4188232421875, -0.267333984375, -0.1158447265625, 0.03564453125, 0.1871337890625, 0.338623046875, 0.4901123046875, 0.6416015625, 0.7930908203125, 0.944580078125, 1.0960693359375, 1.24755859375, 1.3990478515625, 1.550537109375, 1.7020263671875, 1.853515625, 2.0050048828125, 2.156494140625, 2.3079833984375, 2.45947265625, 2.6109619140625, 2.762451171875, 2.9139404296875, 3.0654296875, 3.2169189453125, 3.368408203125, 3.5198974609375, 3.67138671875, 3.8228759765625, 3.974365234375, 4.1258544921875, 4.27734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 8.0, 20.0, 24.0, 20.0, 32.0, 72.0, 103.0, 158.0, 242.0, 397.0, 625.0, 972.0, 1738.0, 2787.0, 4733.0, 8207.0, 13806.0, 23590.0, 40079.0, 66192.0, 103170.0, 146114.0, 171284.0, 157148.0, 116710.0, 76113.0, 46480.0, 27941.0, 16212.0, 9347.0, 5635.0, 3400.0, 1980.0, 1217.0, 737.0, 459.0, 302.0, 182.0, 112.0, 67.0, 49.0, 31.0, 18.0, 13.0, 13.0, 13.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.435546875, -1.3887176513671875, -1.341888427734375, -1.2950592041015625, -1.24822998046875, -1.2014007568359375, -1.154571533203125, -1.1077423095703125, -1.0609130859375, -1.0140838623046875, -0.967254638671875, -0.9204254150390625, -0.87359619140625, -0.8267669677734375, -0.779937744140625, -0.7331085205078125, -0.686279296875, -0.6394500732421875, -0.592620849609375, -0.5457916259765625, -0.49896240234375, -0.4521331787109375, -0.405303955078125, -0.3584747314453125, -0.3116455078125, -0.2648162841796875, -0.217987060546875, -0.1711578369140625, -0.12432861328125, -0.0774993896484375, -0.030670166015625, 0.0161590576171875, 0.06298828125, 0.1098175048828125, 0.156646728515625, 0.2034759521484375, 0.25030517578125, 0.2971343994140625, 0.343963623046875, 0.3907928466796875, 0.4376220703125, 0.4844512939453125, 0.531280517578125, 0.5781097412109375, 0.62493896484375, 0.6717681884765625, 0.718597412109375, 0.7654266357421875, 0.812255859375, 0.8590850830078125, 0.905914306640625, 0.9527435302734375, 0.99957275390625, 1.0464019775390625, 1.093231201171875, 1.1400604248046875, 1.1868896484375, 1.2337188720703125, 1.280548095703125, 1.3273773193359375, 1.37420654296875, 1.4210357666015625, 1.467864990234375, 1.5146942138671875, 1.5615234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 7.0, 6.0, 6.0, 9.0, 13.0, 26.0, 23.0, 20.0, 31.0, 32.0, 43.0, 50.0, 46.0, 52.0, 59.0, 60.0, 51.0, 53.0, 62.0, 56.0, 36.0, 38.0, 38.0, 27.0, 32.0, 21.0, 21.0, 18.0, 13.0, 10.0, 8.0, 2.0, 7.0, 6.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.334087371826172e-05, -9.061302989721298e-05, -8.788518607616425e-05, -8.515734225511551e-05, -8.242949843406677e-05, -7.970165461301804e-05, -7.69738107919693e-05, -7.424596697092056e-05, -7.151812314987183e-05, -6.879027932882309e-05, -6.606243550777435e-05, -6.333459168672562e-05, -6.060674786567688e-05, -5.787890404462814e-05, -5.515106022357941e-05, -5.242321640253067e-05, -4.9695372581481934e-05, -4.69675287604332e-05, -4.423968493938446e-05, -4.1511841118335724e-05, -3.878399729728699e-05, -3.605615347623825e-05, -3.3328309655189514e-05, -3.060046583414078e-05, -2.787262201309204e-05, -2.5144778192043304e-05, -2.2416934370994568e-05, -1.968909054994583e-05, -1.6961246728897095e-05, -1.4233402907848358e-05, -1.1505559086799622e-05, -8.777715265750885e-06, -6.0498714447021484e-06, -3.322027623653412e-06, -5.941838026046753e-07, 2.1336600184440613e-06, 4.861503839492798e-06, 7.5893476605415344e-06, 1.0317191481590271e-05, 1.3045035302639008e-05, 1.5772879123687744e-05, 1.850072294473648e-05, 2.1228566765785217e-05, 2.3956410586833954e-05, 2.668425440788269e-05, 2.9412098228931427e-05, 3.2139942049980164e-05, 3.48677858710289e-05, 3.759562969207764e-05, 4.032347351312637e-05, 4.305131733417511e-05, 4.5779161155223846e-05, 4.850700497627258e-05, 5.123484879732132e-05, 5.3962692618370056e-05, 5.669053643941879e-05, 5.941838026046753e-05, 6.214622408151627e-05, 6.4874067902565e-05, 6.760191172361374e-05, 7.032975554466248e-05, 7.305759936571121e-05, 7.578544318675995e-05, 7.851328700780869e-05, 8.124113082885742e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 7.0, 2.0, 5.0, 6.0, 13.0, 6.0, 21.0, 41.0, 38.0, 54.0, 68.0, 93.0, 121.0, 207.0, 300.0, 443.0, 680.0, 1072.0, 1814.0, 2770.0, 4721.0, 8290.0, 14201.0, 24115.0, 41007.0, 66921.0, 101961.0, 138732.0, 160337.0, 152432.0, 119144.0, 81914.0, 51934.0, 30933.0, 17703.0, 10469.0, 6246.0, 3580.0, 2188.0, 1353.0, 871.0, 563.0, 339.0, 247.0, 186.0, 127.0, 68.0, 70.0, 50.0, 35.0, 19.0, 21.0, 13.0, 6.0, 6.0, 1.0, 1.0, 3.0, 2.0, 3.0], "bins": [-1.9716796875, -1.91143798828125, -1.8511962890625, -1.79095458984375, -1.730712890625, -1.67047119140625, -1.6102294921875, -1.54998779296875, -1.48974609375, -1.42950439453125, -1.3692626953125, -1.30902099609375, -1.248779296875, -1.18853759765625, -1.1282958984375, -1.06805419921875, -1.0078125, -0.94757080078125, -0.8873291015625, -0.82708740234375, -0.766845703125, -0.70660400390625, -0.6463623046875, -0.58612060546875, -0.52587890625, -0.46563720703125, -0.4053955078125, -0.34515380859375, -0.284912109375, -0.22467041015625, -0.1644287109375, -0.10418701171875, -0.0439453125, 0.01629638671875, 0.0765380859375, 0.13677978515625, 0.197021484375, 0.25726318359375, 0.3175048828125, 0.37774658203125, 0.43798828125, 0.49822998046875, 0.5584716796875, 0.61871337890625, 0.678955078125, 0.73919677734375, 0.7994384765625, 0.85968017578125, 0.919921875, 0.98016357421875, 1.0404052734375, 1.10064697265625, 1.160888671875, 1.22113037109375, 1.2813720703125, 1.34161376953125, 1.40185546875, 1.46209716796875, 1.5223388671875, 1.58258056640625, 1.642822265625, 1.70306396484375, 1.7633056640625, 1.82354736328125, 1.8837890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 3.0, 3.0, 6.0, 3.0, 4.0, 4.0, 7.0, 9.0, 17.0, 15.0, 17.0, 25.0, 28.0, 29.0, 46.0, 52.0, 38.0, 47.0, 58.0, 54.0, 53.0, 52.0, 68.0, 47.0, 47.0, 30.0, 39.0, 36.0, 23.0, 23.0, 23.0, 15.0, 22.0, 11.0, 11.0, 7.0, 6.0, 8.0, 3.0, 3.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.64599609375, -0.624237060546875, -0.60247802734375, -0.580718994140625, -0.5589599609375, -0.537200927734375, -0.51544189453125, -0.493682861328125, -0.471923828125, -0.450164794921875, -0.42840576171875, -0.406646728515625, -0.3848876953125, -0.363128662109375, -0.34136962890625, -0.319610595703125, -0.2978515625, -0.276092529296875, -0.25433349609375, -0.232574462890625, -0.2108154296875, -0.189056396484375, -0.16729736328125, -0.145538330078125, -0.123779296875, -0.102020263671875, -0.08026123046875, -0.058502197265625, -0.0367431640625, -0.014984130859375, 0.00677490234375, 0.028533935546875, 0.05029296875, 0.072052001953125, 0.09381103515625, 0.115570068359375, 0.1373291015625, 0.159088134765625, 0.18084716796875, 0.202606201171875, 0.224365234375, 0.246124267578125, 0.26788330078125, 0.289642333984375, 0.3114013671875, 0.333160400390625, 0.35491943359375, 0.376678466796875, 0.3984375, 0.420196533203125, 0.44195556640625, 0.463714599609375, 0.4854736328125, 0.507232666015625, 0.52899169921875, 0.550750732421875, 0.572509765625, 0.594268798828125, 0.61602783203125, 0.637786865234375, 0.6595458984375, 0.681304931640625, 0.70306396484375, 0.724822998046875, 0.74658203125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 3.0, 8.0, 6.0, 10.0, 17.0, 10.0, 9.0, 17.0, 17.0, 22.0, 24.0, 37.0, 30.0, 36.0, 38.0, 34.0, 42.0, 32.0, 34.0, 44.0, 48.0, 35.0, 37.0, 32.0, 42.0, 32.0, 50.0, 32.0, 26.0, 36.0, 25.0, 26.0, 14.0, 18.0, 11.0, 13.0, 10.0, 9.0, 12.0, 7.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.94512414932251, -5.736369609832764, -5.527614593505859, -5.318860054016113, -5.110105514526367, -4.901350975036621, -4.692595958709717, -4.483841419219971, -4.275086402893066, -4.06633186340332, -3.857577085494995, -3.64882230758667, -3.440067768096924, -3.2313129901885986, -3.0225582122802734, -2.8138036727905273, -2.6050491333007812, -2.396294355392456, -2.18753981590271, -1.9787850379943848, -1.7700303792953491, -1.5612757205963135, -1.3525209426879883, -1.1437662839889526, -0.935011625289917, -0.7262569665908813, -0.5175022482872009, -0.3087475299835205, -0.09999287128448486, 0.10876178741455078, 0.317516565322876, 0.5262712240219116, 0.7350263595581055, 0.9437810182571411, 1.1525356769561768, 1.361290454864502, 1.5700451135635376, 1.7787997722625732, 1.9875545501708984, 2.1963090896606445, 2.4050638675689697, 2.613818645477295, 2.822573184967041, 3.031327962875366, 3.2400827407836914, 3.4488372802734375, 3.6575920581817627, 3.866346836090088, 4.075101375579834, 4.28385591506958, 4.492610931396484, 4.7013654708862305, 4.910120010375977, 5.118874549865723, 5.327629566192627, 5.536384105682373, 5.745139122009277, 5.953893661499023, 6.162648677825928, 6.371403217315674, 6.58015775680542, 6.788912773132324, 6.99766731262207, 7.206421852111816, 7.4151763916015625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 8.0, 2.0, 7.0, 12.0, 17.0, 17.0, 20.0, 22.0, 19.0, 29.0, 27.0, 37.0, 44.0, 38.0, 40.0, 50.0, 42.0, 49.0, 41.0, 50.0, 47.0, 37.0, 40.0, 34.0, 39.0, 31.0, 28.0, 25.0, 28.0, 14.0, 21.0, 21.0, 10.0, 10.0, 14.0, 7.0, 6.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-7.611947059631348, -7.398141384124756, -7.184335708618164, -6.9705305099487305, -6.756724834442139, -6.542919158935547, -6.329113483428955, -6.115307807922363, -5.9015021324157715, -5.68769645690918, -5.473890781402588, -5.260085105895996, -5.0462799072265625, -4.832474231719971, -4.618668556213379, -4.404862880706787, -4.191057205200195, -3.9772515296936035, -3.763446092605591, -3.549640417098999, -3.3358347415924072, -3.1220293045043945, -2.9082236289978027, -2.694417953491211, -2.4806127548217773, -2.2668070793151855, -2.053001642227173, -1.839195966720581, -1.6253902912139893, -1.411584734916687, -1.1977791786193848, -0.983973503112793, -0.7701678276062012, -0.5563622117042542, -0.3425566256046295, -0.12875103950500488, 0.08505457639694214, 0.29886019229888916, 0.5126657485961914, 0.7264714241027832, 0.9402769804000854, 1.1540825366973877, 1.3678882122039795, 1.5816937685012817, 1.795499324798584, 2.009305000305176, 2.2231106758117676, 2.4369163513183594, 2.650721788406372, 2.864527463912964, 3.0783329010009766, 3.2921385765075684, 3.50594425201416, 3.719749927520752, 3.9335553646087646, 4.147360801696777, 4.361166477203369, 4.574972152709961, 4.788777828216553, 5.0025835037231445, 5.216388702392578, 5.43019437789917, 5.644000053405762, 5.8578057289123535, 6.071611404418945]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 10.0, 3.0, 11.0, 30.0, 33.0, 64.0, 94.0, 158.0, 233.0, 376.0, 574.0, 936.0, 1467.0, 2336.0, 3429.0, 5453.0, 8656.0, 13308.0, 19685.0, 29118.0, 42039.0, 56987.0, 74241.0, 90938.0, 104558.0, 108800.0, 106928.0, 95167.0, 79143.0, 62074.0, 45741.0, 32039.0, 22226.0, 14817.0, 9612.0, 6221.0, 3963.0, 2590.0, 1619.0, 1095.0, 711.0, 391.0, 277.0, 155.0, 106.0, 59.0, 31.0, 27.0, 19.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.890625, -3.77496337890625, -3.6593017578125, -3.54364013671875, -3.427978515625, -3.31231689453125, -3.1966552734375, -3.08099365234375, -2.96533203125, -2.84967041015625, -2.7340087890625, -2.61834716796875, -2.502685546875, -2.38702392578125, -2.2713623046875, -2.15570068359375, -2.0400390625, -1.92437744140625, -1.8087158203125, -1.69305419921875, -1.577392578125, -1.46173095703125, -1.3460693359375, -1.23040771484375, -1.11474609375, -0.99908447265625, -0.8834228515625, -0.76776123046875, -0.652099609375, -0.53643798828125, -0.4207763671875, -0.30511474609375, -0.189453125, -0.07379150390625, 0.0418701171875, 0.15753173828125, 0.273193359375, 0.38885498046875, 0.5045166015625, 0.62017822265625, 0.73583984375, 0.85150146484375, 0.9671630859375, 1.08282470703125, 1.198486328125, 1.31414794921875, 1.4298095703125, 1.54547119140625, 1.6611328125, 1.77679443359375, 1.8924560546875, 2.00811767578125, 2.123779296875, 2.23944091796875, 2.3551025390625, 2.47076416015625, 2.58642578125, 2.70208740234375, 2.8177490234375, 2.93341064453125, 3.049072265625, 3.16473388671875, 3.2803955078125, 3.39605712890625, 3.51171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 6.0, 10.0, 13.0, 15.0, 13.0, 23.0, 18.0, 24.0, 29.0, 40.0, 37.0, 42.0, 51.0, 38.0, 48.0, 50.0, 48.0, 45.0, 51.0, 45.0, 44.0, 26.0, 43.0, 35.0, 24.0, 40.0, 22.0, 20.0, 14.0, 11.0, 18.0, 11.0, 6.0, 9.0, 9.0, 7.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.875, -7.6492919921875, -7.423583984375, -7.1978759765625, -6.97216796875, -6.7464599609375, -6.520751953125, -6.2950439453125, -6.0693359375, -5.8436279296875, -5.617919921875, -5.3922119140625, -5.16650390625, -4.9407958984375, -4.715087890625, -4.4893798828125, -4.263671875, -4.0379638671875, -3.812255859375, -3.5865478515625, -3.36083984375, -3.1351318359375, -2.909423828125, -2.6837158203125, -2.4580078125, -2.2322998046875, -2.006591796875, -1.7808837890625, -1.55517578125, -1.3294677734375, -1.103759765625, -0.8780517578125, -0.65234375, -0.4266357421875, -0.200927734375, 0.0247802734375, 0.25048828125, 0.4761962890625, 0.701904296875, 0.9276123046875, 1.1533203125, 1.3790283203125, 1.604736328125, 1.8304443359375, 2.05615234375, 2.2818603515625, 2.507568359375, 2.7332763671875, 2.958984375, 3.1846923828125, 3.410400390625, 3.6361083984375, 3.86181640625, 4.0875244140625, 4.313232421875, 4.5389404296875, 4.7646484375, 4.9903564453125, 5.216064453125, 5.4417724609375, 5.66748046875, 5.8931884765625, 6.118896484375, 6.3446044921875, 6.5703125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 13.0, 19.0, 23.0, 31.0, 69.0, 96.0, 143.0, 240.0, 387.0, 583.0, 1018.0, 1667.0, 2613.0, 4266.0, 7042.0, 11552.0, 18847.0, 30024.0, 47156.0, 70059.0, 96616.0, 120474.0, 133762.0, 131147.0, 113413.0, 87400.0, 61265.0, 40978.0, 26122.0, 16203.0, 9710.0, 6044.0, 3702.0, 2252.0, 1339.0, 849.0, 520.0, 339.0, 210.0, 138.0, 92.0, 58.0, 34.0, 17.0, 11.0, 12.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.78515625, -5.61907958984375, -5.4530029296875, -5.28692626953125, -5.120849609375, -4.95477294921875, -4.7886962890625, -4.62261962890625, -4.45654296875, -4.29046630859375, -4.1243896484375, -3.95831298828125, -3.792236328125, -3.62615966796875, -3.4600830078125, -3.29400634765625, -3.1279296875, -2.96185302734375, -2.7957763671875, -2.62969970703125, -2.463623046875, -2.29754638671875, -2.1314697265625, -1.96539306640625, -1.79931640625, -1.63323974609375, -1.4671630859375, -1.30108642578125, -1.135009765625, -0.96893310546875, -0.8028564453125, -0.63677978515625, -0.470703125, -0.30462646484375, -0.1385498046875, 0.02752685546875, 0.193603515625, 0.35968017578125, 0.5257568359375, 0.69183349609375, 0.85791015625, 1.02398681640625, 1.1900634765625, 1.35614013671875, 1.522216796875, 1.68829345703125, 1.8543701171875, 2.02044677734375, 2.1865234375, 2.35260009765625, 2.5186767578125, 2.68475341796875, 2.850830078125, 3.01690673828125, 3.1829833984375, 3.34906005859375, 3.51513671875, 3.68121337890625, 3.8472900390625, 4.01336669921875, 4.179443359375, 4.34552001953125, 4.5115966796875, 4.67767333984375, 4.84375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 0.0, 3.0, 5.0, 5.0, 8.0, 14.0, 8.0, 12.0, 9.0, 21.0, 17.0, 25.0, 22.0, 25.0, 27.0, 33.0, 28.0, 30.0, 34.0, 36.0, 32.0, 34.0, 51.0, 34.0, 32.0, 40.0, 29.0, 27.0, 46.0, 26.0, 37.0, 33.0, 25.0, 26.0, 21.0, 11.0, 25.0, 20.0, 12.0, 14.0, 12.0, 9.0, 7.0, 4.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.775390625, -3.65643310546875, -3.5374755859375, -3.41851806640625, -3.299560546875, -3.18060302734375, -3.0616455078125, -2.94268798828125, -2.82373046875, -2.70477294921875, -2.5858154296875, -2.46685791015625, -2.347900390625, -2.22894287109375, -2.1099853515625, -1.99102783203125, -1.8720703125, -1.75311279296875, -1.6341552734375, -1.51519775390625, -1.396240234375, -1.27728271484375, -1.1583251953125, -1.03936767578125, -0.92041015625, -0.80145263671875, -0.6824951171875, -0.56353759765625, -0.444580078125, -0.32562255859375, -0.2066650390625, -0.08770751953125, 0.03125, 0.15020751953125, 0.2691650390625, 0.38812255859375, 0.507080078125, 0.62603759765625, 0.7449951171875, 0.86395263671875, 0.98291015625, 1.10186767578125, 1.2208251953125, 1.33978271484375, 1.458740234375, 1.57769775390625, 1.6966552734375, 1.81561279296875, 1.9345703125, 2.05352783203125, 2.1724853515625, 2.29144287109375, 2.410400390625, 2.52935791015625, 2.6483154296875, 2.76727294921875, 2.88623046875, 3.00518798828125, 3.1241455078125, 3.24310302734375, 3.362060546875, 3.48101806640625, 3.5999755859375, 3.71893310546875, 3.837890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 8.0, 5.0, 4.0, 11.0, 24.0, 28.0, 43.0, 59.0, 113.0, 166.0, 265.0, 441.0, 604.0, 923.0, 1651.0, 2680.0, 4802.0, 8809.0, 17263.0, 34891.0, 68686.0, 121267.0, 177950.0, 200804.0, 169988.0, 110476.0, 61430.0, 31217.0, 15366.0, 7950.0, 4239.0, 2435.0, 1461.0, 892.0, 583.0, 356.0, 221.0, 158.0, 104.0, 60.0, 54.0, 29.0, 14.0, 13.0, 9.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.9609375, -3.849090576171875, -3.73724365234375, -3.625396728515625, -3.5135498046875, -3.401702880859375, -3.28985595703125, -3.178009033203125, -3.066162109375, -2.954315185546875, -2.84246826171875, -2.730621337890625, -2.6187744140625, -2.506927490234375, -2.39508056640625, -2.283233642578125, -2.17138671875, -2.059539794921875, -1.94769287109375, -1.835845947265625, -1.7239990234375, -1.612152099609375, -1.50030517578125, -1.388458251953125, -1.276611328125, -1.164764404296875, -1.05291748046875, -0.941070556640625, -0.8292236328125, -0.717376708984375, -0.60552978515625, -0.493682861328125, -0.3818359375, -0.269989013671875, -0.15814208984375, -0.046295166015625, 0.0655517578125, 0.177398681640625, 0.28924560546875, 0.401092529296875, 0.512939453125, 0.624786376953125, 0.73663330078125, 0.848480224609375, 0.9603271484375, 1.072174072265625, 1.18402099609375, 1.295867919921875, 1.40771484375, 1.519561767578125, 1.63140869140625, 1.743255615234375, 1.8551025390625, 1.966949462890625, 2.07879638671875, 2.190643310546875, 2.302490234375, 2.414337158203125, 2.52618408203125, 2.638031005859375, 2.7498779296875, 2.861724853515625, 2.97357177734375, 3.085418701171875, 3.197265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 6.0, 5.0, 5.0, 13.0, 10.0, 8.0, 17.0, 17.0, 21.0, 51.0, 30.0, 52.0, 55.0, 63.0, 57.0, 81.0, 64.0, 56.0, 58.0, 65.0, 57.0, 50.0, 41.0, 27.0, 30.0, 17.0, 14.0, 11.0, 11.0, 4.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003275871276855469, -0.0003171004354953766, -0.0003066137433052063, -0.000296127051115036, -0.0002856403589248657, -0.00027515366673469543, -0.00026466697454452515, -0.00025418028235435486, -0.00024369359016418457, -0.00023320689797401428, -0.000222720205783844, -0.0002122335135936737, -0.00020174682140350342, -0.00019126012921333313, -0.00018077343702316284, -0.00017028674483299255, -0.00015980005264282227, -0.00014931336045265198, -0.0001388266682624817, -0.0001283399760723114, -0.00011785328388214111, -0.00010736659169197083, -9.687989950180054e-05, -8.639320731163025e-05, -7.590651512145996e-05, -6.541982293128967e-05, -5.4933130741119385e-05, -4.44464385509491e-05, -3.395974636077881e-05, -2.347305417060852e-05, -1.2986361980438232e-05, -2.4996697902679443e-06, 7.987022399902344e-06, 1.8473714590072632e-05, 2.896040678024292e-05, 3.944709897041321e-05, 4.9933791160583496e-05, 6.0420483350753784e-05, 7.090717554092407e-05, 8.139386773109436e-05, 9.188055992126465e-05, 0.00010236725211143494, 0.00011285394430160522, 0.0001233406364917755, 0.0001338273286819458, 0.0001443140208721161, 0.00015480071306228638, 0.00016528740525245667, 0.00017577409744262695, 0.00018626078963279724, 0.00019674748182296753, 0.00020723417401313782, 0.0002177208662033081, 0.0002282075583934784, 0.00023869425058364868, 0.00024918094277381897, 0.00025966763496398926, 0.00027015432715415955, 0.00028064101934432983, 0.0002911277115345001, 0.0003016144037246704, 0.0003121010959148407, 0.000322587788105011, 0.0003330744802951813, 0.00034356117248535156]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 10.0, 15.0, 27.0, 38.0, 60.0, 83.0, 139.0, 235.0, 488.0, 808.0, 1504.0, 3133.0, 6463.0, 14508.0, 34007.0, 77509.0, 155656.0, 234499.0, 231620.0, 152298.0, 75695.0, 32954.0, 13874.0, 6515.0, 3058.0, 1515.0, 760.0, 427.0, 256.0, 151.0, 95.0, 48.0, 29.0, 28.0, 14.0, 14.0, 5.0, 2.0, 3.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.583251953125, -4.43994140625, -4.296630859375, -4.1533203125, -4.010009765625, -3.86669921875, -3.723388671875, -3.580078125, -3.436767578125, -3.29345703125, -3.150146484375, -3.0068359375, -2.863525390625, -2.72021484375, -2.576904296875, -2.43359375, -2.290283203125, -2.14697265625, -2.003662109375, -1.8603515625, -1.717041015625, -1.57373046875, -1.430419921875, -1.287109375, -1.143798828125, -1.00048828125, -0.857177734375, -0.7138671875, -0.570556640625, -0.42724609375, -0.283935546875, -0.140625, 0.002685546875, 0.14599609375, 0.289306640625, 0.4326171875, 0.575927734375, 0.71923828125, 0.862548828125, 1.005859375, 1.149169921875, 1.29248046875, 1.435791015625, 1.5791015625, 1.722412109375, 1.86572265625, 2.009033203125, 2.15234375, 2.295654296875, 2.43896484375, 2.582275390625, 2.7255859375, 2.868896484375, 3.01220703125, 3.155517578125, 3.298828125, 3.442138671875, 3.58544921875, 3.728759765625, 3.8720703125, 4.015380859375, 4.15869140625, 4.302001953125, 4.4453125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 8.0, 6.0, 13.0, 22.0, 34.0, 30.0, 45.0, 52.0, 44.0, 62.0, 79.0, 70.0, 61.0, 72.0, 71.0, 62.0, 54.0, 38.0, 47.0, 41.0, 24.0, 11.0, 13.0, 14.0, 7.0, 6.0, 6.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0029296875, -0.96502685546875, -0.9271240234375, -0.88922119140625, -0.851318359375, -0.81341552734375, -0.7755126953125, -0.73760986328125, -0.69970703125, -0.66180419921875, -0.6239013671875, -0.58599853515625, -0.548095703125, -0.51019287109375, -0.4722900390625, -0.43438720703125, -0.396484375, -0.35858154296875, -0.3206787109375, -0.28277587890625, -0.244873046875, -0.20697021484375, -0.1690673828125, -0.13116455078125, -0.09326171875, -0.05535888671875, -0.0174560546875, 0.02044677734375, 0.058349609375, 0.09625244140625, 0.1341552734375, 0.17205810546875, 0.2099609375, 0.24786376953125, 0.2857666015625, 0.32366943359375, 0.361572265625, 0.39947509765625, 0.4373779296875, 0.47528076171875, 0.51318359375, 0.55108642578125, 0.5889892578125, 0.62689208984375, 0.664794921875, 0.70269775390625, 0.7406005859375, 0.77850341796875, 0.81640625, 0.85430908203125, 0.8922119140625, 0.93011474609375, 0.968017578125, 1.00592041015625, 1.0438232421875, 1.08172607421875, 1.11962890625, 1.15753173828125, 1.1954345703125, 1.23333740234375, 1.271240234375, 1.30914306640625, 1.3470458984375, 1.38494873046875, 1.4228515625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 8.0, 6.0, 6.0, 12.0, 14.0, 11.0, 22.0, 21.0, 22.0, 21.0, 31.0, 32.0, 27.0, 36.0, 39.0, 38.0, 40.0, 38.0, 47.0, 36.0, 45.0, 43.0, 54.0, 36.0, 56.0, 31.0, 40.0, 24.0, 35.0, 25.0, 15.0, 17.0, 17.0, 13.0, 15.0, 6.0, 11.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.055531978607178, -5.817721366882324, -5.579910755157471, -5.342100143432617, -5.104289531707764, -4.86647891998291, -4.628668308258057, -4.390857696533203, -4.15304708480835, -3.915236473083496, -3.6774258613586426, -3.439615249633789, -3.2018046379089355, -2.963994026184082, -2.7261834144592285, -2.488372802734375, -2.2505621910095215, -2.012751579284668, -1.7749409675598145, -1.537130355834961, -1.2993197441101074, -1.061509132385254, -0.8236985206604004, -0.5858879089355469, -0.34807729721069336, -0.11026668548583984, 0.12754392623901367, 0.3653545379638672, 0.6031651496887207, 0.8409757614135742, 1.0787863731384277, 1.3165969848632812, 1.5544071197509766, 1.79221773147583, 2.0300283432006836, 2.267838954925537, 2.5056495666503906, 2.743460178375244, 2.9812707901000977, 3.219081401824951, 3.4568920135498047, 3.694702625274658, 3.9325132369995117, 4.170323848724365, 4.408134460449219, 4.645945072174072, 4.883755683898926, 5.121566295623779, 5.359376907348633, 5.597187519073486, 5.83499813079834, 6.072808742523193, 6.310619354248047, 6.5484299659729, 6.786240577697754, 7.024051189422607, 7.261861801147461, 7.4996724128723145, 7.737483024597168, 7.9752936363220215, 8.213104248046875, 8.45091438293457, 8.688725471496582, 8.926536560058594, 9.164346694946289]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 7.0, 4.0, 11.0, 11.0, 8.0, 13.0, 16.0, 18.0, 29.0, 24.0, 24.0, 25.0, 30.0, 31.0, 27.0, 35.0, 36.0, 42.0, 45.0, 49.0, 39.0, 40.0, 48.0, 24.0, 40.0, 31.0, 35.0, 26.0, 36.0, 39.0, 24.0, 16.0, 19.0, 18.0, 8.0, 17.0, 12.0, 12.0, 6.0, 5.0, 5.0, 7.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.899270057678223, -7.664230823516846, -7.429192066192627, -7.19415283203125, -6.959113597869873, -6.724074363708496, -6.489035606384277, -6.2539963722229, -6.018957138061523, -5.7839179039001465, -5.548879146575928, -5.313839912414551, -5.078800678253174, -4.843761444091797, -4.608722686767578, -4.373683452606201, -4.138644695281982, -3.9036056995391846, -3.6685664653778076, -3.4335274696350098, -3.198488235473633, -2.963449239730835, -2.728410243988037, -2.49337100982666, -2.2583320140838623, -2.0232930183410645, -1.7882537841796875, -1.5532147884368896, -1.3181756734848022, -1.0831365585327148, -0.848097562789917, -0.6130584478378296, -0.3780193328857422, -0.14298024773597717, 0.09205883741378784, 0.32709789276123047, 0.5621370077133179, 0.7971761226654053, 1.0322151184082031, 1.2672542333602905, 1.502293348312378, 1.7373324632644653, 1.9723715782165527, 2.2074105739593506, 2.4424495697021484, 2.6774888038635254, 2.9125277996063232, 3.147566795349121, 3.382606029510498, 3.617645025253296, 3.852684259414673, 4.087723255157471, 4.322762489318848, 4.557801246643066, 4.792840480804443, 5.02787971496582, 5.262918472290039, 5.497957706451416, 5.732996463775635, 5.968035697937012, 6.203074932098389, 6.438114166259766, 6.673152923583984, 6.908192157745361, 7.143231391906738]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 5.0, 13.0, 12.0, 15.0, 7.0, 25.0, 29.0, 44.0, 61.0, 72.0, 129.0, 177.0, 211.0, 319.0, 490.0, 724.0, 1082.0, 1763.0, 3046.0, 5461.0, 10740.0, 1010745.0, 6248.0, 3472.0, 1982.0, 1228.0, 786.0, 470.0, 352.0, 233.0, 169.0, 135.0, 93.0, 77.0, 48.0, 28.0, 23.0, 23.0, 12.0, 11.0, 10.0, 11.0, 3.0, 3.0, 7.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-113.6257553100586, -110.08724212646484, -106.5487289428711, -103.01021575927734, -99.4717025756836, -95.93318939208984, -92.39466857910156, -88.85615539550781, -85.31764221191406, -81.77912902832031, -78.24061584472656, -74.70210266113281, -71.16358947753906, -67.62507629394531, -64.08656311035156, -60.54804611206055, -57.00953674316406, -53.47102355957031, -49.93251037597656, -46.39399719238281, -42.85548400878906, -39.31697082519531, -35.7784538269043, -32.23994064331055, -28.701427459716797, -25.162914276123047, -21.624401092529297, -18.085886001586914, -14.547372817993164, -11.008859634399414, -7.470344543457031, -3.9318313598632812, -0.3933258056640625, 3.1451878547668457, 6.683701515197754, 10.22221565246582, 13.76072883605957, 17.29924201965332, 20.837757110595703, 24.376270294189453, 27.914783477783203, 31.453296661376953, 34.9918098449707, 38.53032684326172, 42.06884002685547, 45.60735321044922, 49.14586639404297, 52.68437957763672, 56.22289276123047, 59.76140594482422, 63.29991912841797, 66.83843231201172, 70.37694549560547, 73.91545867919922, 77.4539794921875, 80.99249267578125, 84.531005859375, 88.06951904296875, 91.6080322265625, 95.14654541015625, 98.68505859375, 102.22357177734375, 105.7620849609375, 109.30059814453125, 112.839111328125]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 6.0, 6.0, 16.0, 11.0, 17.0, 34.0, 33.0, 54.0, 89.0, 114.0, 181.0, 262.0, 418.0, 637.0, 1049.0, 1705.0, 2605.0, 3972.0, 5866.0, 8469.0, 13056.0, 26909.0, 51286348.0, 70024.0, 17767.0, 10633.0, 7118.0, 4911.0, 3176.0, 2134.0, 1381.0, 825.0, 538.0, 315.0, 232.0, 139.0, 84.0, 56.0, 40.0, 32.0, 28.0, 12.0, 14.0, 14.0, 9.0, 7.0, 5.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-120.25455474853516, -116.69275665283203, -113.13096618652344, -109.56916809082031, -106.00736999511719, -102.44557189941406, -98.88378143310547, -95.32198333740234, -91.76019287109375, -88.19839477539062, -84.63660430908203, -81.0748062133789, -77.51300811767578, -73.95121765136719, -70.38941955566406, -66.82762145996094, -63.26582336425781, -59.70402908325195, -56.14223098754883, -52.58043670654297, -49.018638610839844, -45.456844329833984, -41.895050048828125, -38.333251953125, -34.77145767211914, -31.20966148376465, -27.647865295410156, -24.086071014404297, -20.524274826049805, -16.962478637695312, -13.400684356689453, -9.838888168334961, -6.2770843505859375, -2.7152886390686035, 0.8465070724487305, 4.408302307128906, 7.970098495483398, 11.53189468383789, 15.09368896484375, 18.655485153198242, 22.217281341552734, 25.779077529907227, 29.34087371826172, 32.90266799926758, 36.46446228027344, 40.02626037597656, 43.58805465698242, 47.14984893798828, 50.711647033691406, 54.273441314697266, 57.83523941040039, 61.39703369140625, 64.95883178710938, 68.5206298828125, 72.0824203491211, 75.64421844482422, 79.20600891113281, 82.76780700683594, 86.32959747314453, 89.89139556884766, 93.45319366455078, 97.01498413085938, 100.5767822265625, 104.13858032226562, 107.70037841796875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 9.0, 14.0, 19.0, 24.0, 28.0, 58.0, 107.0, 149.0, 292.0, 563.0, 958.0, 1791.0, 3706.0, 8168.0, 20475.0, 55699.0, 179703.0, 737063.0, 3538914.0, 1330964.0, 281529.0, 81457.0, 28347.0, 11418.0, 5000.0, 2325.0, 1181.0, 635.0, 377.0, 169.0, 132.0, 59.0, 34.0, 27.0, 15.0, 16.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.90625, -45.59130859375, -44.2763671875, -42.96142578125, -41.646484375, -40.33154296875, -39.0166015625, -37.70166015625, -36.38671875, -35.07177734375, -33.7568359375, -32.44189453125, -31.126953125, -29.81201171875, -28.4970703125, -27.18212890625, -25.8671875, -24.55224609375, -23.2373046875, -21.92236328125, -20.607421875, -19.29248046875, -17.9775390625, -16.66259765625, -15.34765625, -14.03271484375, -12.7177734375, -11.40283203125, -10.087890625, -8.77294921875, -7.4580078125, -6.14306640625, -4.828125, -3.51318359375, -2.1982421875, -0.88330078125, 0.431640625, 1.74658203125, 3.0615234375, 4.37646484375, 5.69140625, 7.00634765625, 8.3212890625, 9.63623046875, 10.951171875, 12.26611328125, 13.5810546875, 14.89599609375, 16.2109375, 17.52587890625, 18.8408203125, 20.15576171875, 21.470703125, 22.78564453125, 24.1005859375, 25.41552734375, 26.73046875, 28.04541015625, 29.3603515625, 30.67529296875, 31.990234375, 33.30517578125, 34.6201171875, 35.93505859375, 37.25]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 7.0, 5.0, 3.0, 6.0, 6.0, 16.0, 15.0, 10.0, 16.0, 24.0, 25.0, 28.0, 41.0, 47.0, 67.0, 63.0, 69.0, 95.0, 127.0, 171.0, 188.0, 168.0, 155.0, 120.0, 106.0, 70.0, 82.0, 53.0, 44.0, 31.0, 43.0, 27.0, 20.0, 19.0, 19.0, 13.0, 6.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.1796875, -8.901123046875, -8.62255859375, -8.343994140625, -8.0654296875, -7.786865234375, -7.50830078125, -7.229736328125, -6.951171875, -6.672607421875, -6.39404296875, -6.115478515625, -5.8369140625, -5.558349609375, -5.27978515625, -5.001220703125, -4.72265625, -4.444091796875, -4.16552734375, -3.886962890625, -3.6083984375, -3.329833984375, -3.05126953125, -2.772705078125, -2.494140625, -2.215576171875, -1.93701171875, -1.658447265625, -1.3798828125, -1.101318359375, -0.82275390625, -0.544189453125, -0.265625, 0.012939453125, 0.29150390625, 0.570068359375, 0.8486328125, 1.127197265625, 1.40576171875, 1.684326171875, 1.962890625, 2.241455078125, 2.52001953125, 2.798583984375, 3.0771484375, 3.355712890625, 3.63427734375, 3.912841796875, 4.19140625, 4.469970703125, 4.74853515625, 5.027099609375, 5.3056640625, 5.584228515625, 5.86279296875, 6.141357421875, 6.419921875, 6.698486328125, 6.97705078125, 7.255615234375, 7.5341796875, 7.812744140625, 8.09130859375, 8.369873046875, 8.6484375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 7.0, 8.0, 10.0, 13.0, 32.0, 44.0, 54.0, 120.0, 189.0, 272.0, 416.0, 797.0, 1287.0, 2016.0, 3475.0, 5708.0, 9554.0, 16006.0, 26165.0, 44055.0, 73163.0, 119960.0, 196195.0, 321093.0, 602768.0, 1709161.0, 1727224.0, 608314.0, 324034.0, 196262.0, 119738.0, 73069.0, 44054.0, 26504.0, 15750.0, 9571.0, 5623.0, 3381.0, 2090.0, 1210.0, 792.0, 472.0, 285.0, 180.0, 110.0, 85.0, 43.0, 27.0, 15.0, 13.0, 12.0, 8.0, 5.0, 3.0, 4.0, 2.0, 1.0], "bins": [-9.640625, -9.3485107421875, -9.056396484375, -8.7642822265625, -8.47216796875, -8.1800537109375, -7.887939453125, -7.5958251953125, -7.3037109375, -7.0115966796875, -6.719482421875, -6.4273681640625, -6.13525390625, -5.8431396484375, -5.551025390625, -5.2589111328125, -4.966796875, -4.6746826171875, -4.382568359375, -4.0904541015625, -3.79833984375, -3.5062255859375, -3.214111328125, -2.9219970703125, -2.6298828125, -2.3377685546875, -2.045654296875, -1.7535400390625, -1.46142578125, -1.1693115234375, -0.877197265625, -0.5850830078125, -0.29296875, -0.0008544921875, 0.291259765625, 0.5833740234375, 0.87548828125, 1.1676025390625, 1.459716796875, 1.7518310546875, 2.0439453125, 2.3360595703125, 2.628173828125, 2.9202880859375, 3.21240234375, 3.5045166015625, 3.796630859375, 4.0887451171875, 4.380859375, 4.6729736328125, 4.965087890625, 5.2572021484375, 5.54931640625, 5.8414306640625, 6.133544921875, 6.4256591796875, 6.7177734375, 7.0098876953125, 7.302001953125, 7.5941162109375, 7.88623046875, 8.1783447265625, 8.470458984375, 8.7625732421875, 9.0546875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 6.0, 5.0, 2.0, 12.0, 10.0, 14.0, 15.0, 15.0, 20.0, 30.0, 26.0, 38.0, 37.0, 50.0, 64.0, 95.0, 140.0, 199.0, 307.0, 242.0, 176.0, 102.0, 71.0, 65.0, 41.0, 34.0, 19.0, 34.0, 28.0, 24.0, 16.0, 15.0, 14.0, 7.0, 15.0, 4.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.4765625, -12.084228515625, -11.69189453125, -11.299560546875, -10.9072265625, -10.514892578125, -10.12255859375, -9.730224609375, -9.337890625, -8.945556640625, -8.55322265625, -8.160888671875, -7.7685546875, -7.376220703125, -6.98388671875, -6.591552734375, -6.19921875, -5.806884765625, -5.41455078125, -5.022216796875, -4.6298828125, -4.237548828125, -3.84521484375, -3.452880859375, -3.060546875, -2.668212890625, -2.27587890625, -1.883544921875, -1.4912109375, -1.098876953125, -0.70654296875, -0.314208984375, 0.078125, 0.470458984375, 0.86279296875, 1.255126953125, 1.6474609375, 2.039794921875, 2.43212890625, 2.824462890625, 3.216796875, 3.609130859375, 4.00146484375, 4.393798828125, 4.7861328125, 5.178466796875, 5.57080078125, 5.963134765625, 6.35546875, 6.747802734375, 7.14013671875, 7.532470703125, 7.9248046875, 8.317138671875, 8.70947265625, 9.101806640625, 9.494140625, 9.886474609375, 10.27880859375, 10.671142578125, 11.0634765625, 11.455810546875, 11.84814453125, 12.240478515625, 12.6328125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 8.0, 13.0, 27.0, 35.0, 35.0, 36.0, 58.0, 117.0, 179.0, 285.0, 391.0, 657.0, 1041.0, 1739.0, 2972.0, 5707.0, 10804.0, 20970.0, 41446.0, 83681.0, 273678.0, 5568083.0, 148798.0, 63345.0, 31976.0, 16345.0, 8446.0, 4386.0, 2416.0, 1427.0, 821.0, 506.0, 338.0, 201.0, 140.0, 91.0, 66.0, 43.0, 48.0, 26.0, 24.0, 10.0, 7.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.859375, -24.01123046875, -23.1630859375, -22.31494140625, -21.466796875, -20.61865234375, -19.7705078125, -18.92236328125, -18.07421875, -17.22607421875, -16.3779296875, -15.52978515625, -14.681640625, -13.83349609375, -12.9853515625, -12.13720703125, -11.2890625, -10.44091796875, -9.5927734375, -8.74462890625, -7.896484375, -7.04833984375, -6.2001953125, -5.35205078125, -4.50390625, -3.65576171875, -2.8076171875, -1.95947265625, -1.111328125, -0.26318359375, 0.5849609375, 1.43310546875, 2.28125, 3.12939453125, 3.9775390625, 4.82568359375, 5.673828125, 6.52197265625, 7.3701171875, 8.21826171875, 9.06640625, 9.91455078125, 10.7626953125, 11.61083984375, 12.458984375, 13.30712890625, 14.1552734375, 15.00341796875, 15.8515625, 16.69970703125, 17.5478515625, 18.39599609375, 19.244140625, 20.09228515625, 20.9404296875, 21.78857421875, 22.63671875, 23.48486328125, 24.3330078125, 25.18115234375, 26.029296875, 26.87744140625, 27.7255859375, 28.57373046875, 29.421875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 3.0, 3.0, 3.0, 2.0, 7.0, 7.0, 12.0, 13.0, 18.0, 17.0, 21.0, 22.0, 23.0, 26.0, 26.0, 34.0, 39.0, 42.0, 49.0, 70.0, 162.0, 304.0, 346.0, 244.0, 117.0, 61.0, 59.0, 28.0, 31.0, 38.0, 31.0, 25.0, 22.0, 20.0, 17.0, 16.0, 15.0, 11.0, 9.0, 11.0, 4.0, 4.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.53125, -21.89404296875, -21.2568359375, -20.61962890625, -19.982421875, -19.34521484375, -18.7080078125, -18.07080078125, -17.43359375, -16.79638671875, -16.1591796875, -15.52197265625, -14.884765625, -14.24755859375, -13.6103515625, -12.97314453125, -12.3359375, -11.69873046875, -11.0615234375, -10.42431640625, -9.787109375, -9.14990234375, -8.5126953125, -7.87548828125, -7.23828125, -6.60107421875, -5.9638671875, -5.32666015625, -4.689453125, -4.05224609375, -3.4150390625, -2.77783203125, -2.140625, -1.50341796875, -0.8662109375, -0.22900390625, 0.408203125, 1.04541015625, 1.6826171875, 2.31982421875, 2.95703125, 3.59423828125, 4.2314453125, 4.86865234375, 5.505859375, 6.14306640625, 6.7802734375, 7.41748046875, 8.0546875, 8.69189453125, 9.3291015625, 9.96630859375, 10.603515625, 11.24072265625, 11.8779296875, 12.51513671875, 13.15234375, 13.78955078125, 14.4267578125, 15.06396484375, 15.701171875, 16.33837890625, 16.9755859375, 17.61279296875, 18.25]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 9.0, 12.0, 20.0, 37.0, 58.0, 87.0, 139.0, 270.0, 144.0, 73.0, 53.0, 44.0, 27.0, 16.0, 12.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-944.30517578125, -918.5018310546875, -892.6985473632812, -866.8952026367188, -841.0919189453125, -815.28857421875, -789.4852905273438, -763.6819458007812, -737.878662109375, -712.0753173828125, -686.2720336914062, -660.4686889648438, -634.6654052734375, -608.862060546875, -583.0587768554688, -557.2554321289062, -531.4521484375, -505.6488342285156, -479.84552001953125, -454.0422058105469, -428.2388916015625, -402.435546875, -376.63226318359375, -350.82891845703125, -325.02557373046875, -299.2222595214844, -273.4189453125, -247.61563110351562, -221.81231689453125, -196.0089874267578, -170.20567321777344, -144.40235900878906, -118.59906005859375, -92.79574584960938, -66.992431640625, -41.189109802246094, -15.385795593261719, 10.417526245117188, 36.22084045410156, 62.02415466308594, 87.82746887207031, 113.63078308105469, 139.43409729003906, 165.2374267578125, 191.04074096679688, 216.84405517578125, 242.64736938476562, 268.45068359375, 294.2539978027344, 320.05731201171875, 345.8606262207031, 371.6639404296875, 397.4672546386719, 423.27056884765625, 449.07391357421875, 474.877197265625, 500.6805419921875, 526.48388671875, 552.2871704101562, 578.0905151367188, 603.893798828125, 629.6971435546875, 655.5004272460938, 681.3037719726562, 707.1070556640625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 3.0, 3.0, 3.0, 11.0, 9.0, 9.0, 8.0, 10.0, 9.0, 18.0, 17.0, 18.0, 26.0, 35.0, 38.0, 34.0, 34.0, 63.0, 71.0, 88.0, 107.0, 77.0, 43.0, 30.0, 39.0, 30.0, 25.0, 19.0, 24.0, 17.0, 15.0, 17.0, 17.0, 13.0, 5.0, 6.0, 6.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-453.8227844238281, -440.02593994140625, -426.22906494140625, -412.4322204589844, -398.6353454589844, -384.8385009765625, -371.0416259765625, -357.2447814941406, -343.44793701171875, -329.6510925292969, -315.8542175292969, -302.057373046875, -288.260498046875, -274.4636535644531, -260.66680908203125, -246.86993408203125, -233.07305908203125, -219.2761993408203, -205.47933959960938, -191.6824951171875, -177.8856201171875, -164.08877563476562, -150.2919158935547, -136.49505615234375, -122.69819641113281, -108.90133666992188, -95.10447692871094, -81.30762481689453, -67.5107650756836, -53.713905334472656, -39.91705322265625, -26.120193481445312, -12.32330322265625, 1.4735546112060547, 15.27041244506836, 29.06726837158203, 42.86412811279297, 56.660987854003906, 70.45783996582031, 84.25469970703125, 98.05155944824219, 111.84841918945312, 125.64527893066406, 139.442138671875, 153.23898315429688, 167.03585815429688, 180.83270263671875, 194.6295623779297, 208.42642211914062, 222.22328186035156, 236.0201416015625, 249.81698608398438, 263.6138610839844, 277.41070556640625, 291.20758056640625, 305.0044250488281, 318.80126953125, 332.5981140136719, 346.3949890136719, 360.19183349609375, 373.98870849609375, 387.7855529785156, 401.5823974609375, 415.3792724609375, 429.1761474609375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 8.0, 9.0, 9.0, 20.0, 33.0, 57.0, 76.0, 143.0, 203.0, 329.0, 519.0, 964.0, 1680.0, 3204.0, 6199.0, 13261.0, 33087.0, 123500.0, 2818564.0, 1056227.0, 90080.0, 25736.0, 10422.0, 4680.0, 2350.0, 1233.0, 698.0, 351.0, 222.0, 140.0, 94.0, 56.0, 34.0, 33.0, 22.0, 12.0, 12.0, 7.0, 5.0, 5.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.48046875, -4.34429931640625, -4.2081298828125, -4.07196044921875, -3.935791015625, -3.79962158203125, -3.6634521484375, -3.52728271484375, -3.39111328125, -3.25494384765625, -3.1187744140625, -2.98260498046875, -2.846435546875, -2.71026611328125, -2.5740966796875, -2.43792724609375, -2.3017578125, -2.16558837890625, -2.0294189453125, -1.89324951171875, -1.757080078125, -1.62091064453125, -1.4847412109375, -1.34857177734375, -1.21240234375, -1.07623291015625, -0.9400634765625, -0.80389404296875, -0.667724609375, -0.53155517578125, -0.3953857421875, -0.25921630859375, -0.123046875, 0.01312255859375, 0.1492919921875, 0.28546142578125, 0.421630859375, 0.55780029296875, 0.6939697265625, 0.83013916015625, 0.96630859375, 1.10247802734375, 1.2386474609375, 1.37481689453125, 1.510986328125, 1.64715576171875, 1.7833251953125, 1.91949462890625, 2.0556640625, 2.19183349609375, 2.3280029296875, 2.46417236328125, 2.600341796875, 2.73651123046875, 2.8726806640625, 3.00885009765625, 3.14501953125, 3.28118896484375, 3.4173583984375, 3.55352783203125, 3.689697265625, 3.82586669921875, 3.9620361328125, 4.09820556640625, 4.234375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 10.0, 7.0, 10.0, 15.0, 23.0, 44.0, 78.0, 147.0, 218.0, 184.0, 118.0, 50.0, 29.0, 16.0, 12.0, 11.0, 4.0, 2.0, 3.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6787109375, -0.65655517578125, -0.6343994140625, -0.61224365234375, -0.590087890625, -0.56793212890625, -0.5457763671875, -0.52362060546875, -0.50146484375, -0.47930908203125, -0.4571533203125, -0.43499755859375, -0.412841796875, -0.39068603515625, -0.3685302734375, -0.34637451171875, -0.32421875, -0.30206298828125, -0.2799072265625, -0.25775146484375, -0.235595703125, -0.21343994140625, -0.1912841796875, -0.16912841796875, -0.14697265625, -0.12481689453125, -0.1026611328125, -0.08050537109375, -0.058349609375, -0.03619384765625, -0.0140380859375, 0.00811767578125, 0.0302734375, 0.05242919921875, 0.0745849609375, 0.09674072265625, 0.118896484375, 0.14105224609375, 0.1632080078125, 0.18536376953125, 0.20751953125, 0.22967529296875, 0.2518310546875, 0.27398681640625, 0.296142578125, 0.31829833984375, 0.3404541015625, 0.36260986328125, 0.384765625, 0.40692138671875, 0.4290771484375, 0.45123291015625, 0.473388671875, 0.49554443359375, 0.5177001953125, 0.53985595703125, 0.56201171875, 0.58416748046875, 0.6063232421875, 0.62847900390625, 0.650634765625, 0.67279052734375, 0.6949462890625, 0.71710205078125, 0.7392578125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 5.0, 6.0, 6.0, 10.0, 17.0, 26.0, 25.0, 43.0, 72.0, 91.0, 135.0, 207.0, 346.0, 547.0, 903.0, 1650.0, 3157.0, 6278.0, 12997.0, 29329.0, 74411.0, 208326.0, 669435.0, 2021681.0, 785885.0, 236529.0, 82728.0, 31874.0, 13700.0, 6458.0, 3164.0, 1732.0, 963.0, 560.0, 318.0, 210.0, 158.0, 96.0, 64.0, 46.0, 32.0, 23.0, 11.0, 5.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.20703125, -2.13482666015625, -2.0626220703125, -1.99041748046875, -1.918212890625, -1.84600830078125, -1.7738037109375, -1.70159912109375, -1.62939453125, -1.55718994140625, -1.4849853515625, -1.41278076171875, -1.340576171875, -1.26837158203125, -1.1961669921875, -1.12396240234375, -1.0517578125, -0.97955322265625, -0.9073486328125, -0.83514404296875, -0.762939453125, -0.69073486328125, -0.6185302734375, -0.54632568359375, -0.47412109375, -0.40191650390625, -0.3297119140625, -0.25750732421875, -0.185302734375, -0.11309814453125, -0.0408935546875, 0.03131103515625, 0.103515625, 0.17572021484375, 0.2479248046875, 0.32012939453125, 0.392333984375, 0.46453857421875, 0.5367431640625, 0.60894775390625, 0.68115234375, 0.75335693359375, 0.8255615234375, 0.89776611328125, 0.969970703125, 1.04217529296875, 1.1143798828125, 1.18658447265625, 1.2587890625, 1.33099365234375, 1.4031982421875, 1.47540283203125, 1.547607421875, 1.61981201171875, 1.6920166015625, 1.76422119140625, 1.83642578125, 1.90863037109375, 1.9808349609375, 2.05303955078125, 2.125244140625, 2.19744873046875, 2.2696533203125, 2.34185791015625, 2.4140625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 4.0, 7.0, 11.0, 11.0, 11.0, 19.0, 31.0, 36.0, 27.0, 48.0, 57.0, 78.0, 79.0, 120.0, 147.0, 195.0, 234.0, 288.0, 400.0, 537.0, 392.0, 301.0, 228.0, 189.0, 125.0, 108.0, 95.0, 62.0, 58.0, 37.0, 30.0, 27.0, 19.0, 14.0, 10.0, 9.0, 5.0, 5.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.88330078125, -0.8577423095703125, -0.832183837890625, -0.8066253662109375, -0.78106689453125, -0.7555084228515625, -0.729949951171875, -0.7043914794921875, -0.6788330078125, -0.6532745361328125, -0.627716064453125, -0.6021575927734375, -0.57659912109375, -0.5510406494140625, -0.525482177734375, -0.4999237060546875, -0.474365234375, -0.4488067626953125, -0.423248291015625, -0.3976898193359375, -0.37213134765625, -0.3465728759765625, -0.321014404296875, -0.2954559326171875, -0.2698974609375, -0.2443389892578125, -0.218780517578125, -0.1932220458984375, -0.16766357421875, -0.1421051025390625, -0.116546630859375, -0.0909881591796875, -0.0654296875, -0.0398712158203125, -0.014312744140625, 0.0112457275390625, 0.03680419921875, 0.0623626708984375, 0.087921142578125, 0.1134796142578125, 0.1390380859375, 0.1645965576171875, 0.190155029296875, 0.2157135009765625, 0.24127197265625, 0.2668304443359375, 0.292388916015625, 0.3179473876953125, 0.343505859375, 0.3690643310546875, 0.394622802734375, 0.4201812744140625, 0.44573974609375, 0.4712982177734375, 0.496856689453125, 0.5224151611328125, 0.5479736328125, 0.5735321044921875, 0.599090576171875, 0.6246490478515625, 0.65020751953125, 0.6757659912109375, 0.701324462890625, 0.7268829345703125, 0.75244140625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 4.0, 17.0, 29.0, 41.0, 79.0, 147.0, 195.0, 174.0, 150.0, 83.0, 36.0, 29.0, 3.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.308292388916016, -15.845664978027344, -15.383036613464355, -14.920409202575684, -14.457781791687012, -13.995153427124023, -13.532526016235352, -13.06989860534668, -12.607271194458008, -12.144643783569336, -11.682015419006348, -11.219388008117676, -10.756760597229004, -10.294132232666016, -9.831504821777344, -9.368877410888672, -8.906249046325684, -8.443621635437012, -7.980993747711182, -7.518365859985352, -7.05573844909668, -6.59311056137085, -6.1304826736450195, -5.667855262756348, -5.205227375030518, -4.7425994873046875, -4.279972076416016, -3.8173441886901855, -3.3547165393829346, -2.8920888900756836, -2.4294610023498535, -1.9668333530426025, -1.5042057037353516, -1.0415780544281006, -0.5789502859115601, -0.11632251739501953, 0.34630513191223145, 0.8089327812194824, 1.2715606689453125, 1.7341883182525635, 2.1968159675598145, 2.6594436168670654, 3.1220712661743164, 3.5846991539001465, 4.047327041625977, 4.509954452514648, 4.9725823402404785, 5.435210227966309, 5.8978376388549805, 6.3604655265808105, 6.823092937469482, 7.2857208251953125, 7.748348236083984, 8.210975646972656, 8.673604011535645, 9.136231422424316, 9.598859786987305, 10.061487197875977, 10.524115562438965, 10.986742973327637, 11.449370384216309, 11.911998748779297, 12.374626159667969, 12.83725357055664, 13.299880981445312]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 4.0, 8.0, 11.0, 17.0, 22.0, 26.0, 27.0, 21.0, 26.0, 27.0, 27.0, 44.0, 46.0, 41.0, 46.0, 48.0, 44.0, 32.0, 52.0, 54.0, 44.0, 40.0, 47.0, 42.0, 29.0, 30.0, 27.0, 23.0, 14.0, 17.0, 16.0, 6.0, 7.0, 5.0, 8.0, 9.0, 6.0, 3.0, 1.0, 3.0], "bins": [-6.9130048751831055, -6.735654354095459, -6.5583038330078125, -6.380952835083008, -6.203602313995361, -6.026251792907715, -5.848901271820068, -5.671550750732422, -5.494199752807617, -5.316849231719971, -5.139498710632324, -4.9621477127075195, -4.784797191619873, -4.607446670532227, -4.43009614944458, -4.252745628356934, -4.075394630432129, -3.8980441093444824, -3.720693349838257, -3.5433428287506104, -3.3659920692443848, -3.1886415481567383, -3.011291027069092, -2.833940267562866, -2.656589984893799, -2.4792394638061523, -2.3018887042999268, -2.1245381832122803, -1.9471874237060547, -1.7698369026184082, -1.5924862623214722, -1.4151356220245361, -1.2377848625183105, -1.0604342222213745, -0.8830835819244385, -0.7057330012321472, -0.5283823609352112, -0.35103172063827515, -0.1736811399459839, 0.0036695003509521484, 0.18102014064788818, 0.3583707809448242, 0.5357214212417603, 0.7130720019340515, 0.8904226422309875, 1.0677733421325684, 1.2451238632202148, 1.4224745035171509, 1.599825143814087, 1.777175784111023, 1.954526424407959, 2.1318769454956055, 2.309227705001831, 2.4865782260894775, 2.663928985595703, 2.8412795066833496, 3.018630027770996, 3.1959805488586426, 3.373331308364868, 3.5506818294525146, 3.7280325889587402, 3.9053831100463867, 4.082733631134033, 4.26008415222168, 4.437435150146484]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 8.0, 10.0, 8.0, 11.0, 23.0, 20.0, 28.0, 43.0, 49.0, 80.0, 110.0, 194.0, 343.0, 650.0, 1170.0, 2112.0, 4215.0, 9236.0, 25147.0, 112656.0, 665536.0, 172920.0, 32671.0, 11006.0, 4820.0, 2489.0, 1278.0, 674.0, 395.0, 237.0, 119.0, 80.0, 66.0, 31.0, 23.0, 20.0, 18.0, 15.0, 14.0, 12.0, 7.0, 1.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.205078125, -2.1431427001953125, -2.081207275390625, -2.0192718505859375, -1.95733642578125, -1.8954010009765625, -1.833465576171875, -1.7715301513671875, -1.7095947265625, -1.6476593017578125, -1.585723876953125, -1.5237884521484375, -1.46185302734375, -1.3999176025390625, -1.337982177734375, -1.2760467529296875, -1.214111328125, -1.1521759033203125, -1.090240478515625, -1.0283050537109375, -0.96636962890625, -0.9044342041015625, -0.842498779296875, -0.7805633544921875, -0.7186279296875, -0.6566925048828125, -0.594757080078125, -0.5328216552734375, -0.47088623046875, -0.4089508056640625, -0.347015380859375, -0.2850799560546875, -0.22314453125, -0.1612091064453125, -0.099273681640625, -0.0373382568359375, 0.02459716796875, 0.0865325927734375, 0.148468017578125, 0.2104034423828125, 0.2723388671875, 0.3342742919921875, 0.396209716796875, 0.4581451416015625, 0.52008056640625, 0.5820159912109375, 0.643951416015625, 0.7058868408203125, 0.767822265625, 0.8297576904296875, 0.891693115234375, 0.9536285400390625, 1.01556396484375, 1.0774993896484375, 1.139434814453125, 1.2013702392578125, 1.2633056640625, 1.3252410888671875, 1.387176513671875, 1.4491119384765625, 1.51104736328125, 1.5729827880859375, 1.634918212890625, 1.6968536376953125, 1.7587890625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 0.0, 6.0, 7.0, 3.0, 8.0, 12.0, 10.0, 15.0, 26.0, 49.0, 77.0, 121.0, 174.0, 173.0, 133.0, 73.0, 53.0, 25.0, 10.0, 11.0, 5.0, 3.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69970703125, -0.6762237548828125, -0.652740478515625, -0.6292572021484375, -0.60577392578125, -0.5822906494140625, -0.558807373046875, -0.5353240966796875, -0.5118408203125, -0.4883575439453125, -0.464874267578125, -0.4413909912109375, -0.41790771484375, -0.3944244384765625, -0.370941162109375, -0.3474578857421875, -0.323974609375, -0.3004913330078125, -0.277008056640625, -0.2535247802734375, -0.23004150390625, -0.2065582275390625, -0.183074951171875, -0.1595916748046875, -0.1361083984375, -0.1126251220703125, -0.089141845703125, -0.0656585693359375, -0.04217529296875, -0.0186920166015625, 0.004791259765625, 0.0282745361328125, 0.0517578125, 0.0752410888671875, 0.098724365234375, 0.1222076416015625, 0.14569091796875, 0.1691741943359375, 0.192657470703125, 0.2161407470703125, 0.2396240234375, 0.2631072998046875, 0.286590576171875, 0.3100738525390625, 0.33355712890625, 0.3570404052734375, 0.380523681640625, 0.4040069580078125, 0.427490234375, 0.4509735107421875, 0.474456787109375, 0.4979400634765625, 0.52142333984375, 0.5449066162109375, 0.568389892578125, 0.5918731689453125, 0.6153564453125, 0.6388397216796875, 0.662322998046875, 0.6858062744140625, 0.70928955078125, 0.7327728271484375, 0.756256103515625, 0.7797393798828125, 0.80322265625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 7.0, 5.0, 5.0, 11.0, 12.0, 27.0, 30.0, 42.0, 50.0, 69.0, 91.0, 170.0, 255.0, 383.0, 625.0, 1011.0, 1684.0, 3062.0, 5297.0, 10017.0, 19382.0, 40717.0, 93149.0, 239459.0, 358562.0, 152119.0, 62805.0, 28271.0, 13853.0, 7393.0, 3976.0, 2342.0, 1397.0, 821.0, 490.0, 323.0, 202.0, 142.0, 94.0, 54.0, 40.0, 33.0, 25.0, 11.0, 18.0, 7.0, 7.0, 5.0, 1.0, 3.0, 5.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.24609375, -1.20623779296875, -1.1663818359375, -1.12652587890625, -1.086669921875, -1.04681396484375, -1.0069580078125, -0.96710205078125, -0.92724609375, -0.88739013671875, -0.8475341796875, -0.80767822265625, -0.767822265625, -0.72796630859375, -0.6881103515625, -0.64825439453125, -0.6083984375, -0.56854248046875, -0.5286865234375, -0.48883056640625, -0.448974609375, -0.40911865234375, -0.3692626953125, -0.32940673828125, -0.28955078125, -0.24969482421875, -0.2098388671875, -0.16998291015625, -0.130126953125, -0.09027099609375, -0.0504150390625, -0.01055908203125, 0.029296875, 0.06915283203125, 0.1090087890625, 0.14886474609375, 0.188720703125, 0.22857666015625, 0.2684326171875, 0.30828857421875, 0.34814453125, 0.38800048828125, 0.4278564453125, 0.46771240234375, 0.507568359375, 0.54742431640625, 0.5872802734375, 0.62713623046875, 0.6669921875, 0.70684814453125, 0.7467041015625, 0.78656005859375, 0.826416015625, 0.86627197265625, 0.9061279296875, 0.94598388671875, 0.98583984375, 1.02569580078125, 1.0655517578125, 1.10540771484375, 1.145263671875, 1.18511962890625, 1.2249755859375, 1.26483154296875, 1.3046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 2.0, 3.0, 7.0, 3.0, 11.0, 8.0, 14.0, 18.0, 16.0, 21.0, 23.0, 26.0, 25.0, 34.0, 23.0, 42.0, 37.0, 37.0, 34.0, 34.0, 36.0, 39.0, 41.0, 25.0, 33.0, 28.0, 37.0, 36.0, 33.0, 44.0, 24.0, 28.0, 26.0, 17.0, 23.0, 16.0, 15.0, 14.0, 19.0, 8.0, 8.0, 5.0, 6.0, 5.0, 8.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.6552734375, -1.6026763916015625, -1.550079345703125, -1.4974822998046875, -1.44488525390625, -1.3922882080078125, -1.339691162109375, -1.2870941162109375, -1.2344970703125, -1.1819000244140625, -1.129302978515625, -1.0767059326171875, -1.02410888671875, -0.9715118408203125, -0.918914794921875, -0.8663177490234375, -0.813720703125, -0.7611236572265625, -0.708526611328125, -0.6559295654296875, -0.60333251953125, -0.5507354736328125, -0.498138427734375, -0.4455413818359375, -0.3929443359375, -0.3403472900390625, -0.287750244140625, -0.2351531982421875, -0.18255615234375, -0.1299591064453125, -0.077362060546875, -0.0247650146484375, 0.02783203125, 0.0804290771484375, 0.133026123046875, 0.1856231689453125, 0.23822021484375, 0.2908172607421875, 0.343414306640625, 0.3960113525390625, 0.4486083984375, 0.5012054443359375, 0.553802490234375, 0.6063995361328125, 0.65899658203125, 0.7115936279296875, 0.764190673828125, 0.8167877197265625, 0.869384765625, 0.9219818115234375, 0.974578857421875, 1.0271759033203125, 1.07977294921875, 1.1323699951171875, 1.184967041015625, 1.2375640869140625, 1.2901611328125, 1.3427581787109375, 1.395355224609375, 1.4479522705078125, 1.50054931640625, 1.5531463623046875, 1.605743408203125, 1.6583404541015625, 1.7109375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 9.0, 13.0, 20.0, 39.0, 57.0, 131.0, 232.0, 595.0, 1649.0, 5941.0, 35902.0, 627723.0, 347064.0, 22601.0, 4339.0, 1303.0, 471.0, 196.0, 112.0, 48.0, 35.0, 17.0, 14.0, 8.0, 7.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.00390625, -2.899932861328125, -2.79595947265625, -2.691986083984375, -2.5880126953125, -2.484039306640625, -2.38006591796875, -2.276092529296875, -2.172119140625, -2.068145751953125, -1.96417236328125, -1.860198974609375, -1.7562255859375, -1.652252197265625, -1.54827880859375, -1.444305419921875, -1.34033203125, -1.236358642578125, -1.13238525390625, -1.028411865234375, -0.9244384765625, -0.820465087890625, -0.71649169921875, -0.612518310546875, -0.508544921875, -0.404571533203125, -0.30059814453125, -0.196624755859375, -0.0926513671875, 0.011322021484375, 0.11529541015625, 0.219268798828125, 0.3232421875, 0.427215576171875, 0.53118896484375, 0.635162353515625, 0.7391357421875, 0.843109130859375, 0.94708251953125, 1.051055908203125, 1.155029296875, 1.259002685546875, 1.36297607421875, 1.466949462890625, 1.5709228515625, 1.674896240234375, 1.77886962890625, 1.882843017578125, 1.98681640625, 2.090789794921875, 2.19476318359375, 2.298736572265625, 2.4027099609375, 2.506683349609375, 2.61065673828125, 2.714630126953125, 2.818603515625, 2.922576904296875, 3.02655029296875, 3.130523681640625, 3.2344970703125, 3.338470458984375, 3.44244384765625, 3.546417236328125, 3.650390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 13.0, 11.0, 22.0, 30.0, 22.0, 43.0, 43.0, 49.0, 66.0, 57.0, 67.0, 64.0, 72.0, 61.0, 63.0, 52.0, 44.0, 33.0, 39.0, 34.0, 19.0, 16.0, 15.0, 13.0, 8.0, 9.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9545040130615234e-05, -5.7742930948734283e-05, -5.594082176685333e-05, -5.413871258497238e-05, -5.233660340309143e-05, -5.053449422121048e-05, -4.873238503932953e-05, -4.693027585744858e-05, -4.512816667556763e-05, -4.3326057493686676e-05, -4.1523948311805725e-05, -3.9721839129924774e-05, -3.791972994804382e-05, -3.611762076616287e-05, -3.431551158428192e-05, -3.251340240240097e-05, -3.071129322052002e-05, -2.890918403863907e-05, -2.7107074856758118e-05, -2.5304965674877167e-05, -2.3502856492996216e-05, -2.1700747311115265e-05, -1.9898638129234314e-05, -1.8096528947353363e-05, -1.6294419765472412e-05, -1.4492310583591461e-05, -1.269020140171051e-05, -1.088809221982956e-05, -9.085983037948608e-06, -7.2838738560676575e-06, -5.4817646741867065e-06, -3.6796554923057556e-06, -1.8775463104248047e-06, -7.543712854385376e-08, 1.7266720533370972e-06, 3.528781235218048e-06, 5.330890417098999e-06, 7.13299959897995e-06, 8.935108780860901e-06, 1.0737217962741852e-05, 1.2539327144622803e-05, 1.4341436326503754e-05, 1.6143545508384705e-05, 1.7945654690265656e-05, 1.9747763872146606e-05, 2.1549873054027557e-05, 2.3351982235908508e-05, 2.515409141778946e-05, 2.695620059967041e-05, 2.875830978155136e-05, 3.056041896343231e-05, 3.236252814531326e-05, 3.4164637327194214e-05, 3.5966746509075165e-05, 3.7768855690956116e-05, 3.957096487283707e-05, 4.137307405471802e-05, 4.317518323659897e-05, 4.497729241847992e-05, 4.677940160036087e-05, 4.858151078224182e-05, 5.038361996412277e-05, 5.218572914600372e-05, 5.3987838327884674e-05, 5.5789947509765625e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 9.0, 5.0, 13.0, 25.0, 46.0, 56.0, 115.0, 204.0, 563.0, 1398.0, 4241.0, 19263.0, 176967.0, 741944.0, 86638.0, 12143.0, 3059.0, 1013.0, 438.0, 184.0, 93.0, 52.0, 32.0, 18.0, 10.0, 7.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.263671875, -2.162445068359375, -2.06121826171875, -1.959991455078125, -1.8587646484375, -1.757537841796875, -1.65631103515625, -1.555084228515625, -1.453857421875, -1.352630615234375, -1.25140380859375, -1.150177001953125, -1.0489501953125, -0.947723388671875, -0.84649658203125, -0.745269775390625, -0.64404296875, -0.542816162109375, -0.44158935546875, -0.340362548828125, -0.2391357421875, -0.137908935546875, -0.03668212890625, 0.064544677734375, 0.165771484375, 0.266998291015625, 0.36822509765625, 0.469451904296875, 0.5706787109375, 0.671905517578125, 0.77313232421875, 0.874359130859375, 0.9755859375, 1.076812744140625, 1.17803955078125, 1.279266357421875, 1.3804931640625, 1.481719970703125, 1.58294677734375, 1.684173583984375, 1.785400390625, 1.886627197265625, 1.98785400390625, 2.089080810546875, 2.1903076171875, 2.291534423828125, 2.39276123046875, 2.493988037109375, 2.59521484375, 2.696441650390625, 2.79766845703125, 2.898895263671875, 3.0001220703125, 3.101348876953125, 3.20257568359375, 3.303802490234375, 3.405029296875, 3.506256103515625, 3.60748291015625, 3.708709716796875, 3.8099365234375, 3.911163330078125, 4.01239013671875, 4.113616943359375, 4.21484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 10.0, 7.0, 8.0, 7.0, 10.0, 13.0, 28.0, 39.0, 40.0, 34.0, 56.0, 59.0, 70.0, 85.0, 73.0, 102.0, 84.0, 64.0, 52.0, 39.0, 38.0, 27.0, 25.0, 8.0, 8.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.900390625, -0.861236572265625, -0.82208251953125, -0.782928466796875, -0.7437744140625, -0.704620361328125, -0.66546630859375, -0.626312255859375, -0.587158203125, -0.548004150390625, -0.50885009765625, -0.469696044921875, -0.4305419921875, -0.391387939453125, -0.35223388671875, -0.313079833984375, -0.27392578125, -0.234771728515625, -0.19561767578125, -0.156463623046875, -0.1173095703125, -0.078155517578125, -0.03900146484375, 0.000152587890625, 0.039306640625, 0.078460693359375, 0.11761474609375, 0.156768798828125, 0.1959228515625, 0.235076904296875, 0.27423095703125, 0.313385009765625, 0.3525390625, 0.391693115234375, 0.43084716796875, 0.470001220703125, 0.5091552734375, 0.548309326171875, 0.58746337890625, 0.626617431640625, 0.665771484375, 0.704925537109375, 0.74407958984375, 0.783233642578125, 0.8223876953125, 0.861541748046875, 0.90069580078125, 0.939849853515625, 0.97900390625, 1.018157958984375, 1.05731201171875, 1.096466064453125, 1.1356201171875, 1.174774169921875, 1.21392822265625, 1.253082275390625, 1.292236328125, 1.331390380859375, 1.37054443359375, 1.409698486328125, 1.4488525390625, 1.488006591796875, 1.52716064453125, 1.566314697265625, 1.60546875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 1.0, 13.0, 25.0, 45.0, 120.0, 292.0, 340.0, 112.0, 28.0, 15.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.98686218261719, -51.78384780883789, -50.58082962036133, -49.37781524658203, -48.17479705810547, -46.97178268432617, -45.76876449584961, -44.56575012207031, -43.36273193359375, -42.15971755981445, -40.95669937133789, -39.753684997558594, -38.55066680908203, -37.347652435302734, -36.14463424682617, -34.941619873046875, -33.73860549926758, -32.53559112548828, -31.33257293701172, -30.12955665588379, -28.92654037475586, -27.723526000976562, -26.520509719848633, -25.317493438720703, -24.114477157592773, -22.911460876464844, -21.708444595336914, -20.505428314208984, -19.302413940429688, -18.099395751953125, -16.896381378173828, -15.693365097045898, -14.490352630615234, -13.287336349487305, -12.084320068359375, -10.881304740905762, -9.678288459777832, -8.475272178649902, -7.272256374359131, -6.069240570068359, -4.86622428894043, -3.663208246231079, -2.4601922035217285, -1.257176160812378, -0.054160118103027344, 1.1488561630249023, 2.351871967315674, 3.5548877716064453, 4.757904052734375, 5.960920333862305, 7.163936138153076, 8.366951942443848, 9.569968223571777, 10.772984504699707, 11.97599983215332, 13.17901611328125, 14.38203239440918, 15.58504867553711, 16.78806495666504, 17.99108123779297, 19.194095611572266, 20.397113800048828, 21.600128173828125, 22.803144454956055, 24.006160736083984]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 5.0, 1.0, 5.0, 4.0, 5.0, 9.0, 7.0, 7.0, 11.0, 20.0, 19.0, 45.0, 94.0, 158.0, 183.0, 149.0, 131.0, 60.0, 38.0, 14.0, 9.0, 4.0, 9.0, 4.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.76251220703125, -23.435897827148438, -22.109285354614258, -20.782670974731445, -19.456058502197266, -18.129444122314453, -16.80282974243164, -15.476217269897461, -14.149603843688965, -12.822990417480469, -11.496376991271973, -10.169763565063477, -8.843149185180664, -7.516536235809326, -6.189922332763672, -4.863308906555176, -3.5366954803466797, -2.2100820541381836, -0.8834683895111084, 0.4431452751159668, 1.769758701324463, 3.096372127532959, 4.422986030578613, 5.749599456787109, 7.0762128829956055, 8.402826309204102, 9.729439735412598, 11.056053161621094, 12.382667541503906, 13.709280014038086, 15.035894393920898, 16.362506866455078, 17.68912124633789, 19.015735626220703, 20.342348098754883, 21.668962478637695, 22.995574951171875, 24.322189331054688, 25.6488037109375, 26.97541618347168, 28.30202865600586, 29.628643035888672, 30.95525550842285, 32.28186798095703, 33.608482360839844, 34.935096740722656, 36.26171112060547, 37.58832550048828, 38.914939880371094, 40.241554260253906, 41.56816864013672, 42.894779205322266, 44.22139358520508, 45.54800796508789, 46.8746223449707, 48.20123291015625, 49.52784729003906, 50.854461669921875, 52.18107604980469, 53.507686614990234, 54.83430099487305, 56.16091537475586, 57.48752975463867, 58.81414031982422, 60.14075469970703]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 8.0, 12.0, 22.0, 25.0, 70.0, 113.0, 281.0, 773.0, 2565.0, 12494.0, 216094.0, 3918671.0, 36461.0, 4831.0, 1153.0, 375.0, 141.0, 71.0, 59.0, 27.0, 12.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5390625, -10.0855712890625, -9.632080078125, -9.1785888671875, -8.72509765625, -8.2716064453125, -7.818115234375, -7.3646240234375, -6.9111328125, -6.4576416015625, -6.004150390625, -5.5506591796875, -5.09716796875, -4.6436767578125, -4.190185546875, -3.7366943359375, -3.283203125, -2.8297119140625, -2.376220703125, -1.9227294921875, -1.46923828125, -1.0157470703125, -0.562255859375, -0.1087646484375, 0.3447265625, 0.7982177734375, 1.251708984375, 1.7052001953125, 2.15869140625, 2.6121826171875, 3.065673828125, 3.5191650390625, 3.97265625, 4.4261474609375, 4.879638671875, 5.3331298828125, 5.78662109375, 6.2401123046875, 6.693603515625, 7.1470947265625, 7.6005859375, 8.0540771484375, 8.507568359375, 8.9610595703125, 9.41455078125, 9.8680419921875, 10.321533203125, 10.7750244140625, 11.228515625, 11.6820068359375, 12.135498046875, 12.5889892578125, 13.04248046875, 13.4959716796875, 13.949462890625, 14.4029541015625, 14.8564453125, 15.3099365234375, 15.763427734375, 16.2169189453125, 16.67041015625, 17.1239013671875, 17.577392578125, 18.0308837890625, 18.484375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 12.0, 8.0, 19.0, 22.0, 35.0, 35.0, 80.0, 91.0, 123.0, 122.0, 125.0, 96.0, 68.0, 62.0, 27.0, 16.0, 10.0, 11.0, 11.0, 2.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41357421875, -0.3951263427734375, -0.376678466796875, -0.3582305908203125, -0.33978271484375, -0.3213348388671875, -0.302886962890625, -0.2844390869140625, -0.2659912109375, -0.2475433349609375, -0.229095458984375, -0.2106475830078125, -0.19219970703125, -0.1737518310546875, -0.155303955078125, -0.1368560791015625, -0.118408203125, -0.0999603271484375, -0.081512451171875, -0.0630645751953125, -0.04461669921875, -0.0261688232421875, -0.007720947265625, 0.0107269287109375, 0.0291748046875, 0.0476226806640625, 0.066070556640625, 0.0845184326171875, 0.10296630859375, 0.1214141845703125, 0.139862060546875, 0.1583099365234375, 0.1767578125, 0.1952056884765625, 0.213653564453125, 0.2321014404296875, 0.25054931640625, 0.2689971923828125, 0.287445068359375, 0.3058929443359375, 0.3243408203125, 0.3427886962890625, 0.361236572265625, 0.3796844482421875, 0.39813232421875, 0.4165802001953125, 0.435028076171875, 0.4534759521484375, 0.471923828125, 0.4903717041015625, 0.508819580078125, 0.5272674560546875, 0.54571533203125, 0.5641632080078125, 0.582611083984375, 0.6010589599609375, 0.6195068359375, 0.6379547119140625, 0.656402587890625, 0.6748504638671875, 0.69329833984375, 0.7117462158203125, 0.730194091796875, 0.7486419677734375, 0.76708984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 6.0, 4.0, 4.0, 4.0, 8.0, 14.0, 18.0, 25.0, 22.0, 44.0, 58.0, 100.0, 194.0, 283.0, 558.0, 1087.0, 2010.0, 4154.0, 9703.0, 25105.0, 79551.0, 364117.0, 3075539.0, 483529.0, 97446.0, 29737.0, 11160.0, 4803.0, 2297.0, 1190.0, 604.0, 365.0, 202.0, 120.0, 84.0, 40.0, 32.0, 24.0, 20.0, 5.0, 8.0, 2.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.703125, -4.56304931640625, -4.4229736328125, -4.28289794921875, -4.142822265625, -4.00274658203125, -3.8626708984375, -3.72259521484375, -3.58251953125, -3.44244384765625, -3.3023681640625, -3.16229248046875, -3.022216796875, -2.88214111328125, -2.7420654296875, -2.60198974609375, -2.4619140625, -2.32183837890625, -2.1817626953125, -2.04168701171875, -1.901611328125, -1.76153564453125, -1.6214599609375, -1.48138427734375, -1.34130859375, -1.20123291015625, -1.0611572265625, -0.92108154296875, -0.781005859375, -0.64093017578125, -0.5008544921875, -0.36077880859375, -0.220703125, -0.08062744140625, 0.0594482421875, 0.19952392578125, 0.339599609375, 0.47967529296875, 0.6197509765625, 0.75982666015625, 0.89990234375, 1.03997802734375, 1.1800537109375, 1.32012939453125, 1.460205078125, 1.60028076171875, 1.7403564453125, 1.88043212890625, 2.0205078125, 2.16058349609375, 2.3006591796875, 2.44073486328125, 2.580810546875, 2.72088623046875, 2.8609619140625, 3.00103759765625, 3.14111328125, 3.28118896484375, 3.4212646484375, 3.56134033203125, 3.701416015625, 3.84149169921875, 3.9815673828125, 4.12164306640625, 4.26171875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 9.0, 3.0, 11.0, 13.0, 20.0, 28.0, 50.0, 67.0, 100.0, 141.0, 227.0, 390.0, 1168.0, 893.0, 326.0, 184.0, 137.0, 80.0, 59.0, 36.0, 34.0, 25.0, 19.0, 15.0, 5.0, 8.0, 3.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60888671875, -0.5854415893554688, -0.5619964599609375, -0.5385513305664062, -0.515106201171875, -0.49166107177734375, -0.4682159423828125, -0.44477081298828125, -0.42132568359375, -0.39788055419921875, -0.3744354248046875, -0.35099029541015625, -0.327545166015625, -0.30410003662109375, -0.2806549072265625, -0.25720977783203125, -0.2337646484375, -0.21031951904296875, -0.1868743896484375, -0.16342926025390625, -0.139984130859375, -0.11653900146484375, -0.0930938720703125, -0.06964874267578125, -0.04620361328125, -0.02275848388671875, 0.0006866455078125, 0.02413177490234375, 0.047576904296875, 0.07102203369140625, 0.0944671630859375, 0.11791229248046875, 0.141357421875, 0.16480255126953125, 0.1882476806640625, 0.21169281005859375, 0.235137939453125, 0.25858306884765625, 0.2820281982421875, 0.30547332763671875, 0.32891845703125, 0.35236358642578125, 0.3758087158203125, 0.39925384521484375, 0.422698974609375, 0.44614410400390625, 0.4695892333984375, 0.49303436279296875, 0.5164794921875, 0.5399246215820312, 0.5633697509765625, 0.5868148803710938, 0.610260009765625, 0.6337051391601562, 0.6571502685546875, 0.6805953979492188, 0.70404052734375, 0.7274856567382812, 0.7509307861328125, 0.7743759155273438, 0.797821044921875, 0.8212661743164062, 0.8447113037109375, 0.8681564331054688, 0.8916015625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 13.0, 37.0, 83.0, 202.0, 278.0, 212.0, 88.0, 52.0, 18.0, 8.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.998159408569336, -5.640466690063477, -5.282773494720459, -4.9250807762146, -4.56738805770874, -4.209694862365723, -3.8520021438598633, -3.494309425354004, -3.1366164684295654, -2.778923511505127, -2.4212307929992676, -2.063537836074829, -1.7058449983596802, -1.3481521606445312, -0.9904592037200928, -0.6327664852142334, -0.2750735282897949, 0.08261933922767639, 0.4403122067451477, 0.7980051040649414, 1.1556979417800903, 1.5133907794952393, 1.8710837364196777, 2.228776454925537, 2.5864694118499756, 2.944162368774414, 3.3018550872802734, 3.659548044204712, 4.01724100112915, 4.37493371963501, 4.732626914978027, 5.090319633483887, 5.448012351989746, 5.8057050704956055, 6.163398265838623, 6.521090984344482, 6.878783702850342, 7.236476898193359, 7.594169616699219, 7.951862335205078, 8.309555053710938, 8.667247772216797, 9.024940490722656, 9.382633209228516, 9.740326881408691, 10.09801959991455, 10.45571231842041, 10.81340503692627, 11.171098709106445, 11.528791427612305, 11.886484146118164, 12.244176864624023, 12.6018705368042, 12.959563255310059, 13.317255973815918, 13.674948692321777, 14.032641410827637, 14.390334129333496, 14.748026847839355, 15.105720520019531, 15.46341323852539, 15.82110595703125, 16.17879867553711, 16.53649139404297, 16.894184112548828]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 14.0, 22.0, 25.0, 40.0, 36.0, 46.0, 71.0, 87.0, 100.0, 92.0, 93.0, 73.0, 82.0, 58.0, 39.0, 38.0, 22.0, 17.0, 13.0, 7.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.600361347198486, -5.441863059997559, -5.283364772796631, -5.124866485595703, -4.966368198394775, -4.807869911193848, -4.64937162399292, -4.490873336791992, -4.332375526428223, -4.173877239227295, -4.015378952026367, -3.8568806648254395, -3.6983823776245117, -3.539884090423584, -3.3813860416412354, -3.2228877544403076, -3.064389228820801, -2.905890941619873, -2.7473926544189453, -2.5888943672180176, -2.43039608001709, -2.271897792816162, -2.1133997440338135, -1.9549014568328857, -1.796403169631958, -1.6379048824310303, -1.4794065952301025, -1.3209084272384644, -1.1624101400375366, -1.0039118528366089, -0.8454136252403259, -0.686915397644043, -0.528416633605957, -0.3699183762073517, -0.21142011880874634, -0.05292186141014099, 0.10557639598846436, 0.2640746831893921, 0.42257291078567505, 0.581071138381958, 0.7395694255828857, 0.8980677127838135, 1.0565659999847412, 1.2150641679763794, 1.3735624551773071, 1.5320607423782349, 1.690558910369873, 1.8490571975708008, 2.0075554847717285, 2.1660537719726562, 2.324552059173584, 2.4830503463745117, 2.6415486335754395, 2.800046920776367, 2.958544969558716, 3.1170432567596436, 3.2755415439605713, 3.434039831161499, 3.5925381183624268, 3.7510364055633545, 3.909534454345703, 4.068032741546631, 4.226531028747559, 4.385029315948486, 4.543527603149414]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 6.0, 7.0, 5.0, 13.0, 16.0, 29.0, 27.0, 37.0, 68.0, 106.0, 148.0, 247.0, 409.0, 755.0, 1459.0, 3028.0, 7369.0, 21725.0, 92201.0, 490112.0, 343754.0, 60332.0, 15656.0, 5690.0, 2461.0, 1175.0, 653.0, 387.0, 225.0, 155.0, 86.0, 77.0, 34.0, 25.0, 19.0, 9.0, 13.0, 6.0, 9.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 3.0], "bins": [-4.5, -4.374542236328125, -4.24908447265625, -4.123626708984375, -3.9981689453125, -3.872711181640625, -3.74725341796875, -3.621795654296875, -3.496337890625, -3.370880126953125, -3.24542236328125, -3.119964599609375, -2.9945068359375, -2.869049072265625, -2.74359130859375, -2.618133544921875, -2.49267578125, -2.367218017578125, -2.24176025390625, -2.116302490234375, -1.9908447265625, -1.865386962890625, -1.73992919921875, -1.614471435546875, -1.489013671875, -1.363555908203125, -1.23809814453125, -1.112640380859375, -0.9871826171875, -0.861724853515625, -0.73626708984375, -0.610809326171875, -0.4853515625, -0.359893798828125, -0.23443603515625, -0.108978271484375, 0.0164794921875, 0.141937255859375, 0.26739501953125, 0.392852783203125, 0.518310546875, 0.643768310546875, 0.76922607421875, 0.894683837890625, 1.0201416015625, 1.145599365234375, 1.27105712890625, 1.396514892578125, 1.52197265625, 1.647430419921875, 1.77288818359375, 1.898345947265625, 2.0238037109375, 2.149261474609375, 2.27471923828125, 2.400177001953125, 2.525634765625, 2.651092529296875, 2.77655029296875, 2.902008056640625, 3.0274658203125, 3.152923583984375, 3.27838134765625, 3.403839111328125, 3.529296875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 1.0, 4.0, 5.0, 17.0, 22.0, 36.0, 54.0, 63.0, 101.0, 109.0, 126.0, 97.0, 115.0, 77.0, 53.0, 40.0, 27.0, 14.0, 15.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4384765625, -0.4199371337890625, -0.401397705078125, -0.3828582763671875, -0.36431884765625, -0.3457794189453125, -0.327239990234375, -0.3087005615234375, -0.2901611328125, -0.2716217041015625, -0.253082275390625, -0.2345428466796875, -0.21600341796875, -0.1974639892578125, -0.178924560546875, -0.1603851318359375, -0.141845703125, -0.1233062744140625, -0.104766845703125, -0.0862274169921875, -0.06768798828125, -0.0491485595703125, -0.030609130859375, -0.0120697021484375, 0.0064697265625, 0.0250091552734375, 0.043548583984375, 0.0620880126953125, 0.08062744140625, 0.0991668701171875, 0.117706298828125, 0.1362457275390625, 0.15478515625, 0.1733245849609375, 0.191864013671875, 0.2104034423828125, 0.22894287109375, 0.2474822998046875, 0.266021728515625, 0.2845611572265625, 0.3031005859375, 0.3216400146484375, 0.340179443359375, 0.3587188720703125, 0.37725830078125, 0.3957977294921875, 0.414337158203125, 0.4328765869140625, 0.451416015625, 0.4699554443359375, 0.488494873046875, 0.5070343017578125, 0.52557373046875, 0.5441131591796875, 0.562652587890625, 0.5811920166015625, 0.5997314453125, 0.6182708740234375, 0.636810302734375, 0.6553497314453125, 0.67388916015625, 0.6924285888671875, 0.710968017578125, 0.7295074462890625, 0.748046875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 9.0, 16.0, 26.0, 25.0, 49.0, 92.0, 141.0, 207.0, 341.0, 610.0, 1080.0, 2227.0, 5161.0, 13900.0, 53551.0, 297227.0, 527514.0, 108588.0, 23421.0, 7601.0, 3193.0, 1520.0, 823.0, 483.0, 258.0, 170.0, 103.0, 59.0, 44.0, 25.0, 26.0, 16.0, 8.0, 15.0, 6.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-3.28125, -3.18536376953125, -3.0894775390625, -2.99359130859375, -2.897705078125, -2.80181884765625, -2.7059326171875, -2.61004638671875, -2.51416015625, -2.41827392578125, -2.3223876953125, -2.22650146484375, -2.130615234375, -2.03472900390625, -1.9388427734375, -1.84295654296875, -1.7470703125, -1.65118408203125, -1.5552978515625, -1.45941162109375, -1.363525390625, -1.26763916015625, -1.1717529296875, -1.07586669921875, -0.97998046875, -0.88409423828125, -0.7882080078125, -0.69232177734375, -0.596435546875, -0.50054931640625, -0.4046630859375, -0.30877685546875, -0.212890625, -0.11700439453125, -0.0211181640625, 0.07476806640625, 0.170654296875, 0.26654052734375, 0.3624267578125, 0.45831298828125, 0.55419921875, 0.65008544921875, 0.7459716796875, 0.84185791015625, 0.937744140625, 1.03363037109375, 1.1295166015625, 1.22540283203125, 1.3212890625, 1.41717529296875, 1.5130615234375, 1.60894775390625, 1.704833984375, 1.80072021484375, 1.8966064453125, 1.99249267578125, 2.08837890625, 2.18426513671875, 2.2801513671875, 2.37603759765625, 2.471923828125, 2.56781005859375, 2.6636962890625, 2.75958251953125, 2.85546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 6.0, 12.0, 23.0, 24.0, 31.0, 35.0, 27.0, 42.0, 56.0, 53.0, 43.0, 64.0, 69.0, 48.0, 58.0, 60.0, 45.0, 41.0, 59.0, 33.0, 39.0, 26.0, 24.0, 12.0, 22.0, 16.0, 10.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5546875, -1.499908447265625, -1.44512939453125, -1.390350341796875, -1.3355712890625, -1.280792236328125, -1.22601318359375, -1.171234130859375, -1.116455078125, -1.061676025390625, -1.00689697265625, -0.952117919921875, -0.8973388671875, -0.842559814453125, -0.78778076171875, -0.733001708984375, -0.67822265625, -0.623443603515625, -0.56866455078125, -0.513885498046875, -0.4591064453125, -0.404327392578125, -0.34954833984375, -0.294769287109375, -0.239990234375, -0.185211181640625, -0.13043212890625, -0.075653076171875, -0.0208740234375, 0.033905029296875, 0.08868408203125, 0.143463134765625, 0.1982421875, 0.253021240234375, 0.30780029296875, 0.362579345703125, 0.4173583984375, 0.472137451171875, 0.52691650390625, 0.581695556640625, 0.636474609375, 0.691253662109375, 0.74603271484375, 0.800811767578125, 0.8555908203125, 0.910369873046875, 0.96514892578125, 1.019927978515625, 1.07470703125, 1.129486083984375, 1.18426513671875, 1.239044189453125, 1.2938232421875, 1.348602294921875, 1.40338134765625, 1.458160400390625, 1.512939453125, 1.567718505859375, 1.62249755859375, 1.677276611328125, 1.7320556640625, 1.786834716796875, 1.84161376953125, 1.896392822265625, 1.951171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 12.0, 6.0, 16.0, 30.0, 24.0, 48.0, 72.0, 119.0, 159.0, 283.0, 462.0, 833.0, 1585.0, 3571.0, 8352.0, 25008.0, 110622.0, 498026.0, 313374.0, 58627.0, 15745.0, 6033.0, 2623.0, 1263.0, 622.0, 381.0, 228.0, 127.0, 89.0, 59.0, 48.0, 25.0, 21.0, 15.0, 8.0, 11.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0], "bins": [-4.41015625, -4.2869873046875, -4.163818359375, -4.0406494140625, -3.91748046875, -3.7943115234375, -3.671142578125, -3.5479736328125, -3.4248046875, -3.3016357421875, -3.178466796875, -3.0552978515625, -2.93212890625, -2.8089599609375, -2.685791015625, -2.5626220703125, -2.439453125, -2.3162841796875, -2.193115234375, -2.0699462890625, -1.94677734375, -1.8236083984375, -1.700439453125, -1.5772705078125, -1.4541015625, -1.3309326171875, -1.207763671875, -1.0845947265625, -0.96142578125, -0.8382568359375, -0.715087890625, -0.5919189453125, -0.46875, -0.3455810546875, -0.222412109375, -0.0992431640625, 0.02392578125, 0.1470947265625, 0.270263671875, 0.3934326171875, 0.5166015625, 0.6397705078125, 0.762939453125, 0.8861083984375, 1.00927734375, 1.1324462890625, 1.255615234375, 1.3787841796875, 1.501953125, 1.6251220703125, 1.748291015625, 1.8714599609375, 1.99462890625, 2.1177978515625, 2.240966796875, 2.3641357421875, 2.4873046875, 2.6104736328125, 2.733642578125, 2.8568115234375, 2.97998046875, 3.1031494140625, 3.226318359375, 3.3494873046875, 3.47265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 9.0, 5.0, 7.0, 17.0, 26.0, 69.0, 129.0, 262.0, 233.0, 107.0, 77.0, 24.0, 10.0, 9.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005621910095214844, -0.0005456209182739258, -0.0005290508270263672, -0.0005124807357788086, -0.00049591064453125, -0.0004793405532836914, -0.0004627704620361328, -0.0004462003707885742, -0.0004296302795410156, -0.00041306018829345703, -0.00039649009704589844, -0.00037992000579833984, -0.00036334991455078125, -0.00034677982330322266, -0.00033020973205566406, -0.00031363964080810547, -0.0002970695495605469, -0.0002804994583129883, -0.0002639293670654297, -0.0002473592758178711, -0.0002307891845703125, -0.0002142190933227539, -0.0001976490020751953, -0.00018107891082763672, -0.00016450881958007812, -0.00014793872833251953, -0.00013136863708496094, -0.00011479854583740234, -9.822845458984375e-05, -8.165836334228516e-05, -6.508827209472656e-05, -4.851818084716797e-05, -3.1948089599609375e-05, -1.537799835205078e-05, 1.1920928955078125e-06, 1.7762184143066406e-05, 3.4332275390625e-05, 5.0902366638183594e-05, 6.747245788574219e-05, 8.404254913330078e-05, 0.00010061264038085938, 0.00011718273162841797, 0.00013375282287597656, 0.00015032291412353516, 0.00016689300537109375, 0.00018346309661865234, 0.00020003318786621094, 0.00021660327911376953, 0.00023317337036132812, 0.0002497434616088867, 0.0002663135528564453, 0.0002828836441040039, 0.0002994537353515625, 0.0003160238265991211, 0.0003325939178466797, 0.0003491640090942383, 0.0003657341003417969, 0.00038230419158935547, 0.00039887428283691406, 0.00041544437408447266, 0.00043201446533203125, 0.00044858455657958984, 0.00046515464782714844, 0.00048172473907470703, 0.0004982948303222656]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 9.0, 8.0, 10.0, 11.0, 15.0, 23.0, 37.0, 77.0, 109.0, 126.0, 250.0, 448.0, 742.0, 1341.0, 2789.0, 6168.0, 15442.0, 48835.0, 200506.0, 487133.0, 205290.0, 50537.0, 16110.0, 6402.0, 2780.0, 1463.0, 754.0, 449.0, 222.0, 156.0, 101.0, 71.0, 43.0, 40.0, 11.0, 16.0, 14.0, 8.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.412109375, -3.300262451171875, -3.18841552734375, -3.076568603515625, -2.9647216796875, -2.852874755859375, -2.74102783203125, -2.629180908203125, -2.517333984375, -2.405487060546875, -2.29364013671875, -2.181793212890625, -2.0699462890625, -1.958099365234375, -1.84625244140625, -1.734405517578125, -1.62255859375, -1.510711669921875, -1.39886474609375, -1.287017822265625, -1.1751708984375, -1.063323974609375, -0.95147705078125, -0.839630126953125, -0.727783203125, -0.615936279296875, -0.50408935546875, -0.392242431640625, -0.2803955078125, -0.168548583984375, -0.05670166015625, 0.055145263671875, 0.1669921875, 0.278839111328125, 0.39068603515625, 0.502532958984375, 0.6143798828125, 0.726226806640625, 0.83807373046875, 0.949920654296875, 1.061767578125, 1.173614501953125, 1.28546142578125, 1.397308349609375, 1.5091552734375, 1.621002197265625, 1.73284912109375, 1.844696044921875, 1.95654296875, 2.068389892578125, 2.18023681640625, 2.292083740234375, 2.4039306640625, 2.515777587890625, 2.62762451171875, 2.739471435546875, 2.851318359375, 2.963165283203125, 3.07501220703125, 3.186859130859375, 3.2987060546875, 3.410552978515625, 3.52239990234375, 3.634246826171875, 3.74609375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 3.0, 3.0, 5.0, 5.0, 6.0, 16.0, 19.0, 28.0, 38.0, 61.0, 55.0, 79.0, 94.0, 93.0, 104.0, 86.0, 72.0, 51.0, 49.0, 30.0, 27.0, 22.0, 7.0, 13.0, 12.0, 4.0, 4.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.248046875, -2.1851654052734375, -2.122283935546875, -2.0594024658203125, -1.99652099609375, -1.9336395263671875, -1.870758056640625, -1.8078765869140625, -1.7449951171875, -1.6821136474609375, -1.619232177734375, -1.5563507080078125, -1.49346923828125, -1.4305877685546875, -1.367706298828125, -1.3048248291015625, -1.241943359375, -1.1790618896484375, -1.116180419921875, -1.0532989501953125, -0.99041748046875, -0.9275360107421875, -0.864654541015625, -0.8017730712890625, -0.7388916015625, -0.6760101318359375, -0.613128662109375, -0.5502471923828125, -0.48736572265625, -0.4244842529296875, -0.361602783203125, -0.2987213134765625, -0.23583984375, -0.1729583740234375, -0.110076904296875, -0.0471954345703125, 0.01568603515625, 0.0785675048828125, 0.141448974609375, 0.2043304443359375, 0.2672119140625, 0.3300933837890625, 0.392974853515625, 0.4558563232421875, 0.51873779296875, 0.5816192626953125, 0.644500732421875, 0.7073822021484375, 0.770263671875, 0.8331451416015625, 0.896026611328125, 0.9589080810546875, 1.02178955078125, 1.0846710205078125, 1.147552490234375, 1.2104339599609375, 1.2733154296875, 1.3361968994140625, 1.399078369140625, 1.4619598388671875, 1.52484130859375, 1.5877227783203125, 1.650604248046875, 1.7134857177734375, 1.7763671875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 12.0, 33.0, 90.0, 205.0, 329.0, 215.0, 80.0, 23.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.03612518310547, -59.83302307128906, -58.629920959472656, -57.426822662353516, -56.22372055053711, -55.0206184387207, -53.8175163269043, -52.614418029785156, -51.41131591796875, -50.208213806152344, -49.00511169433594, -47.8020133972168, -46.59891128540039, -45.395809173583984, -44.19270706176758, -42.98960876464844, -41.78650665283203, -40.583404541015625, -39.38030242919922, -38.17720413208008, -36.97410202026367, -35.770999908447266, -34.56789779663086, -33.36479949951172, -32.16169357299805, -30.95859146118164, -29.755491256713867, -28.55238914489746, -27.349288940429688, -26.14618682861328, -24.943084716796875, -23.7399845123291, -22.536882400512695, -21.33378028869629, -20.130680084228516, -18.92757797241211, -17.724477767944336, -16.52137565612793, -15.31827449798584, -14.11517333984375, -12.91207218170166, -11.70897102355957, -10.50586986541748, -9.30276870727539, -8.099666595458984, -6.896565914154053, -5.693464279174805, -4.490363121032715, -3.287261962890625, -2.084160804748535, -0.8810594081878662, 0.32204198837280273, 1.5251431465148926, 2.7282443046569824, 3.9313459396362305, 5.13444709777832, 6.33754825592041, 7.5406494140625, 8.74375057220459, 9.94685173034668, 11.149953842163086, 12.35305404663086, 13.556156158447266, 14.759257316589355, 15.962358474731445]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 4.0, 9.0, 14.0, 15.0, 12.0, 23.0, 33.0, 39.0, 44.0, 41.0, 57.0, 56.0, 69.0, 59.0, 66.0, 59.0, 53.0, 55.0, 48.0, 32.0, 44.0, 20.0, 38.0, 19.0, 19.0, 14.0, 9.0, 9.0, 3.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.138592720031738, -10.749749183654785, -10.360905647277832, -9.972061157226562, -9.58321762084961, -9.194374084472656, -8.805530548095703, -8.41668701171875, -8.027843475341797, -7.638999938964844, -7.250155925750732, -6.861312389373779, -6.472468376159668, -6.083624839782715, -5.694781303405762, -5.305937767028809, -4.917093276977539, -4.528249740600586, -4.139405727386475, -3.7505621910095215, -3.3617184162139893, -2.972874641418457, -2.584031105041504, -2.1951873302459717, -1.8063435554504395, -1.4174997806549072, -1.0286561250686646, -0.6398124694824219, -0.25096869468688965, 0.13787508010864258, 0.5267186164855957, 0.9155623912811279, 1.3044071197509766, 1.6932508945465088, 2.082094669342041, 2.470938205718994, 2.8597819805145264, 3.2486257553100586, 3.6374692916870117, 4.026312828063965, 4.415156841278076, 4.804000377655029, 5.192844390869141, 5.581687927246094, 5.970531463623047, 6.359375476837158, 6.748219013214111, 7.137063026428223, 7.525906562805176, 7.914750099182129, 8.303593635559082, 8.692438125610352, 9.081281661987305, 9.470125198364258, 9.858968734741211, 10.247812271118164, 10.636655807495117, 11.02549934387207, 11.414342880249023, 11.803186416625977, 12.192030906677246, 12.5808744430542, 12.969717979431152, 13.358561515808105, 13.747406005859375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 7.0, 11.0, 11.0, 20.0, 11.0, 22.0, 31.0, 67.0, 93.0, 156.0, 243.0, 350.0, 685.0, 1263.0, 2483.0, 5833.0, 17179.0, 70022.0, 640197.0, 3245156.0, 165799.0, 30336.0, 8475.0, 3129.0, 1277.0, 594.0, 300.0, 182.0, 115.0, 73.0, 41.0, 29.0, 20.0, 20.0, 11.0, 9.0, 7.0, 8.0, 6.0, 5.0, 4.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.1171875, -8.8427734375, -8.568359375, -8.2939453125, -8.01953125, -7.7451171875, -7.470703125, -7.1962890625, -6.921875, -6.6474609375, -6.373046875, -6.0986328125, -5.82421875, -5.5498046875, -5.275390625, -5.0009765625, -4.7265625, -4.4521484375, -4.177734375, -3.9033203125, -3.62890625, -3.3544921875, -3.080078125, -2.8056640625, -2.53125, -2.2568359375, -1.982421875, -1.7080078125, -1.43359375, -1.1591796875, -0.884765625, -0.6103515625, -0.3359375, -0.0615234375, 0.212890625, 0.4873046875, 0.76171875, 1.0361328125, 1.310546875, 1.5849609375, 1.859375, 2.1337890625, 2.408203125, 2.6826171875, 2.95703125, 3.2314453125, 3.505859375, 3.7802734375, 4.0546875, 4.3291015625, 4.603515625, 4.8779296875, 5.15234375, 5.4267578125, 5.701171875, 5.9755859375, 6.25, 6.5244140625, 6.798828125, 7.0732421875, 7.34765625, 7.6220703125, 7.896484375, 8.1708984375, 8.4453125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 14.0, 16.0, 28.0, 42.0, 73.0, 78.0, 108.0, 146.0, 119.0, 92.0, 86.0, 62.0, 53.0, 26.0, 12.0, 11.0, 10.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.448974609375, -0.4292869567871094, -0.40959930419921875, -0.3899116516113281, -0.3702239990234375, -0.3505363464355469, -0.33084869384765625, -0.3111610412597656, -0.291473388671875, -0.2717857360839844, -0.25209808349609375, -0.23241043090820312, -0.2127227783203125, -0.19303512573242188, -0.17334747314453125, -0.15365982055664062, -0.13397216796875, -0.11428451538085938, -0.09459686279296875, -0.07490921020507812, -0.0552215576171875, -0.035533905029296875, -0.01584625244140625, 0.003841400146484375, 0.023529052734375, 0.043216705322265625, 0.06290435791015625, 0.08259201049804688, 0.1022796630859375, 0.12196731567382812, 0.14165496826171875, 0.16134262084960938, 0.1810302734375, 0.20071792602539062, 0.22040557861328125, 0.24009323120117188, 0.2597808837890625, 0.2794685363769531, 0.29915618896484375, 0.3188438415527344, 0.338531494140625, 0.3582191467285156, 0.37790679931640625, 0.3975944519042969, 0.4172821044921875, 0.4369697570800781, 0.45665740966796875, 0.4763450622558594, 0.49603271484375, 0.5157203674316406, 0.5354080200195312, 0.5550956726074219, 0.5747833251953125, 0.5944709777832031, 0.6141586303710938, 0.6338462829589844, 0.653533935546875, 0.6732215881347656, 0.6929092407226562, 0.7125968933105469, 0.7322845458984375, 0.7519721984863281, 0.7716598510742188, 0.7913475036621094, 0.81103515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 1.0, 8.0, 16.0, 9.0, 25.0, 29.0, 56.0, 92.0, 148.0, 337.0, 733.0, 2637.0, 19327.0, 379017.0, 3656071.0, 123779.0, 9261.0, 1622.0, 536.0, 220.0, 147.0, 80.0, 40.0, 25.0, 20.0, 15.0, 9.0, 8.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.75, -15.3043212890625, -14.858642578125, -14.4129638671875, -13.96728515625, -13.5216064453125, -13.075927734375, -12.6302490234375, -12.1845703125, -11.7388916015625, -11.293212890625, -10.8475341796875, -10.40185546875, -9.9561767578125, -9.510498046875, -9.0648193359375, -8.619140625, -8.1734619140625, -7.727783203125, -7.2821044921875, -6.83642578125, -6.3907470703125, -5.945068359375, -5.4993896484375, -5.0537109375, -4.6080322265625, -4.162353515625, -3.7166748046875, -3.27099609375, -2.8253173828125, -2.379638671875, -1.9339599609375, -1.48828125, -1.0426025390625, -0.596923828125, -0.1512451171875, 0.29443359375, 0.7401123046875, 1.185791015625, 1.6314697265625, 2.0771484375, 2.5228271484375, 2.968505859375, 3.4141845703125, 3.85986328125, 4.3055419921875, 4.751220703125, 5.1968994140625, 5.642578125, 6.0882568359375, 6.533935546875, 6.9796142578125, 7.42529296875, 7.8709716796875, 8.316650390625, 8.7623291015625, 9.2080078125, 9.6536865234375, 10.099365234375, 10.5450439453125, 10.99072265625, 11.4364013671875, 11.882080078125, 12.3277587890625, 12.7734375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 13.0, 18.0, 6.0, 26.0, 18.0, 44.0, 55.0, 45.0, 94.0, 118.0, 207.0, 249.0, 394.0, 791.0, 761.0, 407.0, 227.0, 169.0, 124.0, 106.0, 53.0, 39.0, 26.0, 11.0, 21.0, 11.0, 6.0, 10.0, 5.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87255859375, -0.8413925170898438, -0.8102264404296875, -0.7790603637695312, -0.747894287109375, -0.7167282104492188, -0.6855621337890625, -0.6543960571289062, -0.62322998046875, -0.5920639038085938, -0.5608978271484375, -0.5297317504882812, -0.498565673828125, -0.46739959716796875, -0.4362335205078125, -0.40506744384765625, -0.3739013671875, -0.34273529052734375, -0.3115692138671875, -0.28040313720703125, -0.249237060546875, -0.21807098388671875, -0.1869049072265625, -0.15573883056640625, -0.12457275390625, -0.09340667724609375, -0.0622406005859375, -0.03107452392578125, 9.1552734375e-05, 0.03125762939453125, 0.0624237060546875, 0.09358978271484375, 0.124755859375, 0.15592193603515625, 0.1870880126953125, 0.21825408935546875, 0.249420166015625, 0.28058624267578125, 0.3117523193359375, 0.34291839599609375, 0.37408447265625, 0.40525054931640625, 0.4364166259765625, 0.46758270263671875, 0.498748779296875, 0.5299148559570312, 0.5610809326171875, 0.5922470092773438, 0.6234130859375, 0.6545791625976562, 0.6857452392578125, 0.7169113159179688, 0.748077392578125, 0.7792434692382812, 0.8104095458984375, 0.8415756225585938, 0.87274169921875, 0.9039077758789062, 0.9350738525390625, 0.9662399291992188, 0.997406005859375, 1.0285720825195312, 1.0597381591796875, 1.0909042358398438, 1.1220703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 4.0, 6.0, 19.0, 26.0, 46.0, 79.0, 93.0, 123.0, 154.0, 141.0, 112.0, 81.0, 47.0, 31.0, 16.0, 9.0, 5.0, 6.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.346214294433594, -8.064419746398926, -7.7826247215271, -7.500830173492432, -7.2190351486206055, -6.9372406005859375, -6.6554460525512695, -6.373651504516602, -6.091856479644775, -5.810061931610107, -5.528266906738281, -5.246472358703613, -4.964677810668945, -4.682882785797119, -4.401088237762451, -4.119293212890625, -3.837498664855957, -3.55570387840271, -3.273909091949463, -2.992114543914795, -2.710319757461548, -2.428524971008301, -2.146730422973633, -1.8649356365203857, -1.5831408500671387, -1.3013460636138916, -1.019551396369934, -0.7377566695213318, -0.4559619426727295, -0.17416715621948242, 0.1076275110244751, 0.3894221782684326, 0.6712169647216797, 0.953011691570282, 1.2348064184188843, 1.5166010856628418, 1.7983958721160889, 2.080190658569336, 2.361985206604004, 2.643779993057251, 2.925574779510498, 3.207369565963745, 3.489164352416992, 3.77095890045166, 4.052753448486328, 4.334548473358154, 4.616343021392822, 4.898138046264648, 5.179932594299316, 5.461727142333984, 5.7435221672058105, 6.0253167152404785, 6.307111740112305, 6.588906288146973, 6.870700836181641, 7.152495384216309, 7.434290409088135, 7.716084957122803, 7.997879981994629, 8.279674530029297, 8.561469078063965, 8.843263626098633, 9.125059127807617, 9.406853675842285, 9.688648223876953]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 9.0, 10.0, 9.0, 10.0, 10.0, 18.0, 18.0, 23.0, 23.0, 23.0, 32.0, 36.0, 44.0, 32.0, 63.0, 46.0, 57.0, 43.0, 55.0, 41.0, 37.0, 32.0, 40.0, 43.0, 36.0, 27.0, 26.0, 20.0, 23.0, 15.0, 23.0, 18.0, 12.0, 12.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5599160194396973, -3.427819013595581, -3.295722007751465, -3.1636250019073486, -3.0315279960632324, -2.899430990219116, -2.767333984375, -2.635236978530884, -2.5031399726867676, -2.3710429668426514, -2.238945960998535, -2.106848955154419, -1.9747519493103027, -1.8426549434661865, -1.7105579376220703, -1.578460931777954, -1.446363925933838, -1.3142669200897217, -1.1821699142456055, -1.0500729084014893, -0.917975902557373, -0.7858788967132568, -0.6537818908691406, -0.5216848850250244, -0.3895878791809082, -0.257490873336792, -0.12539386749267578, 0.00670313835144043, 0.13880014419555664, 0.27089715003967285, 0.40299415588378906, 0.5350911617279053, 0.6671881675720215, 0.7992851734161377, 0.9313821792602539, 1.0634791851043701, 1.1955761909484863, 1.3276731967926025, 1.4597702026367188, 1.591867208480835, 1.7239642143249512, 1.8560612201690674, 1.9881582260131836, 2.1202552318573, 2.252352237701416, 2.3844492435455322, 2.5165462493896484, 2.6486432552337646, 2.780740261077881, 2.912837266921997, 3.0449342727661133, 3.1770312786102295, 3.3091282844543457, 3.441225290298462, 3.573322296142578, 3.7054193019866943, 3.8375163078308105, 3.9696133136749268, 4.101710319519043, 4.233807563781738, 4.365904331207275, 4.4980010986328125, 4.630098342895508, 4.762195587158203, 4.89429235458374]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 12.0, 12.0, 14.0, 44.0, 39.0, 57.0, 78.0, 144.0, 203.0, 295.0, 513.0, 851.0, 1623.0, 3613.0, 8669.0, 22388.0, 61493.0, 183672.0, 398342.0, 238555.0, 79904.0, 28335.0, 10704.0, 4329.0, 2010.0, 1050.0, 560.0, 342.0, 205.0, 130.0, 107.0, 74.0, 49.0, 33.0, 32.0, 20.0, 11.0, 7.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.1156005859375, -3.981201171875, -3.8468017578125, -3.71240234375, -3.5780029296875, -3.443603515625, -3.3092041015625, -3.1748046875, -3.0404052734375, -2.906005859375, -2.7716064453125, -2.63720703125, -2.5028076171875, -2.368408203125, -2.2340087890625, -2.099609375, -1.9652099609375, -1.830810546875, -1.6964111328125, -1.56201171875, -1.4276123046875, -1.293212890625, -1.1588134765625, -1.0244140625, -0.8900146484375, -0.755615234375, -0.6212158203125, -0.48681640625, -0.3524169921875, -0.218017578125, -0.0836181640625, 0.05078125, 0.1851806640625, 0.319580078125, 0.4539794921875, 0.58837890625, 0.7227783203125, 0.857177734375, 0.9915771484375, 1.1259765625, 1.2603759765625, 1.394775390625, 1.5291748046875, 1.66357421875, 1.7979736328125, 1.932373046875, 2.0667724609375, 2.201171875, 2.3355712890625, 2.469970703125, 2.6043701171875, 2.73876953125, 2.8731689453125, 3.007568359375, 3.1419677734375, 3.2763671875, 3.4107666015625, 3.545166015625, 3.6795654296875, 3.81396484375, 3.9483642578125, 4.082763671875, 4.2171630859375, 4.3515625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 9.0, 7.0, 11.0, 22.0, 33.0, 46.0, 47.0, 74.0, 95.0, 111.0, 104.0, 107.0, 99.0, 82.0, 46.0, 42.0, 28.0, 14.0, 15.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4716796875, -0.4522247314453125, -0.432769775390625, -0.4133148193359375, -0.39385986328125, -0.3744049072265625, -0.354949951171875, -0.3354949951171875, -0.3160400390625, -0.2965850830078125, -0.277130126953125, -0.2576751708984375, -0.23822021484375, -0.2187652587890625, -0.199310302734375, -0.1798553466796875, -0.160400390625, -0.1409454345703125, -0.121490478515625, -0.1020355224609375, -0.08258056640625, -0.0631256103515625, -0.043670654296875, -0.0242156982421875, -0.0047607421875, 0.0146942138671875, 0.034149169921875, 0.0536041259765625, 0.07305908203125, 0.0925140380859375, 0.111968994140625, 0.1314239501953125, 0.15087890625, 0.1703338623046875, 0.189788818359375, 0.2092437744140625, 0.22869873046875, 0.2481536865234375, 0.267608642578125, 0.2870635986328125, 0.3065185546875, 0.3259735107421875, 0.345428466796875, 0.3648834228515625, 0.38433837890625, 0.4037933349609375, 0.423248291015625, 0.4427032470703125, 0.462158203125, 0.4816131591796875, 0.501068115234375, 0.5205230712890625, 0.53997802734375, 0.5594329833984375, 0.578887939453125, 0.5983428955078125, 0.6177978515625, 0.6372528076171875, 0.656707763671875, 0.6761627197265625, 0.69561767578125, 0.7150726318359375, 0.734527587890625, 0.7539825439453125, 0.7734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 8.0, 8.0, 7.0, 16.0, 22.0, 20.0, 43.0, 61.0, 82.0, 78.0, 125.0, 201.0, 294.0, 504.0, 1024.0, 2213.0, 5474.0, 15453.0, 50504.0, 175410.0, 429692.0, 256785.0, 74806.0, 22210.0, 7558.0, 2831.0, 1356.0, 657.0, 407.0, 237.0, 133.0, 114.0, 55.0, 44.0, 41.0, 23.0, 18.0, 11.0, 9.0, 8.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 3.0], "bins": [-6.015625, -5.85589599609375, -5.6961669921875, -5.53643798828125, -5.376708984375, -5.21697998046875, -5.0572509765625, -4.89752197265625, -4.73779296875, -4.57806396484375, -4.4183349609375, -4.25860595703125, -4.098876953125, -3.93914794921875, -3.7794189453125, -3.61968994140625, -3.4599609375, -3.30023193359375, -3.1405029296875, -2.98077392578125, -2.821044921875, -2.66131591796875, -2.5015869140625, -2.34185791015625, -2.18212890625, -2.02239990234375, -1.8626708984375, -1.70294189453125, -1.543212890625, -1.38348388671875, -1.2237548828125, -1.06402587890625, -0.904296875, -0.74456787109375, -0.5848388671875, -0.42510986328125, -0.265380859375, -0.10565185546875, 0.0540771484375, 0.21380615234375, 0.37353515625, 0.53326416015625, 0.6929931640625, 0.85272216796875, 1.012451171875, 1.17218017578125, 1.3319091796875, 1.49163818359375, 1.6513671875, 1.81109619140625, 1.9708251953125, 2.13055419921875, 2.290283203125, 2.45001220703125, 2.6097412109375, 2.76947021484375, 2.92919921875, 3.08892822265625, 3.2486572265625, 3.40838623046875, 3.568115234375, 3.72784423828125, 3.8875732421875, 4.04730224609375, 4.20703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 3.0, 6.0, 9.0, 5.0, 10.0, 13.0, 13.0, 9.0, 17.0, 18.0, 16.0, 20.0, 32.0, 37.0, 33.0, 39.0, 48.0, 36.0, 45.0, 39.0, 36.0, 45.0, 62.0, 38.0, 44.0, 42.0, 44.0, 29.0, 26.0, 31.0, 29.0, 20.0, 27.0, 19.0, 10.0, 12.0, 6.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.82421875, -1.756683349609375, -1.68914794921875, -1.621612548828125, -1.5540771484375, -1.486541748046875, -1.41900634765625, -1.351470947265625, -1.283935546875, -1.216400146484375, -1.14886474609375, -1.081329345703125, -1.0137939453125, -0.946258544921875, -0.87872314453125, -0.811187744140625, -0.74365234375, -0.676116943359375, -0.60858154296875, -0.541046142578125, -0.4735107421875, -0.405975341796875, -0.33843994140625, -0.270904541015625, -0.203369140625, -0.135833740234375, -0.06829833984375, -0.000762939453125, 0.0667724609375, 0.134307861328125, 0.20184326171875, 0.269378662109375, 0.3369140625, 0.404449462890625, 0.47198486328125, 0.539520263671875, 0.6070556640625, 0.674591064453125, 0.74212646484375, 0.809661865234375, 0.877197265625, 0.944732666015625, 1.01226806640625, 1.079803466796875, 1.1473388671875, 1.214874267578125, 1.28240966796875, 1.349945068359375, 1.41748046875, 1.485015869140625, 1.55255126953125, 1.620086669921875, 1.6876220703125, 1.755157470703125, 1.82269287109375, 1.890228271484375, 1.957763671875, 2.025299072265625, 2.09283447265625, 2.160369873046875, 2.2279052734375, 2.295440673828125, 2.36297607421875, 2.430511474609375, 2.498046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 12.0, 13.0, 22.0, 22.0, 53.0, 90.0, 185.0, 338.0, 750.0, 2037.0, 6521.0, 32605.0, 347285.0, 591998.0, 53094.0, 9144.0, 2609.0, 932.0, 385.0, 196.0, 113.0, 52.0, 26.0, 14.0, 16.0, 7.0, 6.0, 8.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8828125, -10.5638427734375, -10.244873046875, -9.9259033203125, -9.60693359375, -9.2879638671875, -8.968994140625, -8.6500244140625, -8.3310546875, -8.0120849609375, -7.693115234375, -7.3741455078125, -7.05517578125, -6.7362060546875, -6.417236328125, -6.0982666015625, -5.779296875, -5.4603271484375, -5.141357421875, -4.8223876953125, -4.50341796875, -4.1844482421875, -3.865478515625, -3.5465087890625, -3.2275390625, -2.9085693359375, -2.589599609375, -2.2706298828125, -1.95166015625, -1.6326904296875, -1.313720703125, -0.9947509765625, -0.67578125, -0.3568115234375, -0.037841796875, 0.2811279296875, 0.60009765625, 0.9190673828125, 1.238037109375, 1.5570068359375, 1.8759765625, 2.1949462890625, 2.513916015625, 2.8328857421875, 3.15185546875, 3.4708251953125, 3.789794921875, 4.1087646484375, 4.427734375, 4.7467041015625, 5.065673828125, 5.3846435546875, 5.70361328125, 6.0225830078125, 6.341552734375, 6.6605224609375, 6.9794921875, 7.2984619140625, 7.617431640625, 7.9364013671875, 8.25537109375, 8.5743408203125, 8.893310546875, 9.2122802734375, 9.53125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 7.0, 7.0, 5.0, 11.0, 9.0, 8.0, 8.0, 22.0, 19.0, 22.0, 41.0, 64.0, 62.0, 82.0, 96.0, 79.0, 95.0, 59.0, 51.0, 50.0, 31.0, 21.0, 18.0, 29.0, 18.0, 15.0, 11.0, 7.0, 9.0, 7.0, 5.0, 6.0, 5.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0005130767822265625, -0.000497087836265564, -0.00048109889030456543, -0.0004651099443435669, -0.00044912099838256836, -0.0004331320524215698, -0.0004171431064605713, -0.00040115416049957275, -0.0003851652145385742, -0.0003691762685775757, -0.00035318732261657715, -0.0003371983766555786, -0.0003212094306945801, -0.00030522048473358154, -0.000289231538772583, -0.00027324259281158447, -0.00025725364685058594, -0.0002412647008895874, -0.00022527575492858887, -0.00020928680896759033, -0.0001932978630065918, -0.00017730891704559326, -0.00016131997108459473, -0.0001453310251235962, -0.00012934207916259766, -0.00011335313320159912, -9.736418724060059e-05, -8.137524127960205e-05, -6.538629531860352e-05, -4.939734935760498e-05, -3.3408403396606445e-05, -1.741945743560791e-05, -1.430511474609375e-06, 1.455843448638916e-05, 3.0547380447387695e-05, 4.653632640838623e-05, 6.252527236938477e-05, 7.85142183303833e-05, 9.450316429138184e-05, 0.00011049211025238037, 0.0001264810562133789, 0.00014247000217437744, 0.00015845894813537598, 0.0001744478940963745, 0.00019043684005737305, 0.00020642578601837158, 0.00022241473197937012, 0.00023840367794036865, 0.0002543926239013672, 0.0002703815698623657, 0.00028637051582336426, 0.0003023594617843628, 0.00031834840774536133, 0.00033433735370635986, 0.0003503262996673584, 0.00036631524562835693, 0.00038230419158935547, 0.000398293137550354, 0.00041428208351135254, 0.0004302710294723511, 0.0004462599754333496, 0.00046224892139434814, 0.0004782378673553467, 0.0004942268133163452, 0.0005102157592773438]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 2.0, 9.0, 5.0, 5.0, 12.0, 17.0, 25.0, 46.0, 69.0, 117.0, 229.0, 438.0, 986.0, 2254.0, 6707.0, 28089.0, 202709.0, 688045.0, 94895.0, 16253.0, 4400.0, 1631.0, 762.0, 357.0, 187.0, 97.0, 69.0, 45.0, 37.0, 15.0, 13.0, 7.0, 5.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.3984375, -8.112060546875, -7.82568359375, -7.539306640625, -7.2529296875, -6.966552734375, -6.68017578125, -6.393798828125, -6.107421875, -5.821044921875, -5.53466796875, -5.248291015625, -4.9619140625, -4.675537109375, -4.38916015625, -4.102783203125, -3.81640625, -3.530029296875, -3.24365234375, -2.957275390625, -2.6708984375, -2.384521484375, -2.09814453125, -1.811767578125, -1.525390625, -1.239013671875, -0.95263671875, -0.666259765625, -0.3798828125, -0.093505859375, 0.19287109375, 0.479248046875, 0.765625, 1.052001953125, 1.33837890625, 1.624755859375, 1.9111328125, 2.197509765625, 2.48388671875, 2.770263671875, 3.056640625, 3.343017578125, 3.62939453125, 3.915771484375, 4.2021484375, 4.488525390625, 4.77490234375, 5.061279296875, 5.34765625, 5.634033203125, 5.92041015625, 6.206787109375, 6.4931640625, 6.779541015625, 7.06591796875, 7.352294921875, 7.638671875, 7.925048828125, 8.21142578125, 8.497802734375, 8.7841796875, 9.070556640625, 9.35693359375, 9.643310546875, 9.9296875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 1.0, 3.0, 6.0, 8.0, 5.0, 8.0, 12.0, 14.0, 18.0, 30.0, 30.0, 58.0, 65.0, 95.0, 134.0, 120.0, 103.0, 78.0, 51.0, 38.0, 25.0, 27.0, 15.0, 17.0, 12.0, 11.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.90625, -2.79473876953125, -2.6832275390625, -2.57171630859375, -2.460205078125, -2.34869384765625, -2.2371826171875, -2.12567138671875, -2.01416015625, -1.90264892578125, -1.7911376953125, -1.67962646484375, -1.568115234375, -1.45660400390625, -1.3450927734375, -1.23358154296875, -1.1220703125, -1.01055908203125, -0.8990478515625, -0.78753662109375, -0.676025390625, -0.56451416015625, -0.4530029296875, -0.34149169921875, -0.22998046875, -0.11846923828125, -0.0069580078125, 0.10455322265625, 0.216064453125, 0.32757568359375, 0.4390869140625, 0.55059814453125, 0.662109375, 0.77362060546875, 0.8851318359375, 0.99664306640625, 1.108154296875, 1.21966552734375, 1.3311767578125, 1.44268798828125, 1.55419921875, 1.66571044921875, 1.7772216796875, 1.88873291015625, 2.000244140625, 2.11175537109375, 2.2232666015625, 2.33477783203125, 2.4462890625, 2.55780029296875, 2.6693115234375, 2.78082275390625, 2.892333984375, 3.00384521484375, 3.1153564453125, 3.22686767578125, 3.33837890625, 3.44989013671875, 3.5614013671875, 3.67291259765625, 3.784423828125, 3.89593505859375, 4.0074462890625, 4.11895751953125, 4.23046875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 11.0, 19.0, 46.0, 72.0, 123.0, 165.0, 178.0, 164.0, 96.0, 50.0, 32.0, 13.0, 8.0, 5.0, 7.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.87000274658203, -43.43575668334961, -42.00151062011719, -40.567264556884766, -39.133018493652344, -37.69877624511719, -36.264530181884766, -34.830284118652344, -33.39603805541992, -31.9617919921875, -30.527545928955078, -29.09330177307129, -27.659055709838867, -26.224809646606445, -24.790565490722656, -23.356319427490234, -21.922073364257812, -20.48782730102539, -19.05358123779297, -17.61933708190918, -16.185091018676758, -14.750844955444336, -13.31659984588623, -11.882354736328125, -10.448108673095703, -9.013862609863281, -7.579617500305176, -6.145371913909912, -4.711126327514648, -3.2768807411193848, -1.842635154724121, -0.4083900451660156, 1.0258560180664062, 2.46010160446167, 3.8943471908569336, 5.328592777252197, 6.762838363647461, 8.197084426879883, 9.631329536437988, 11.065574645996094, 12.499820709228516, 13.934066772460938, 15.368311882019043, 16.80255699157715, 18.23680305480957, 19.671049118041992, 21.10529327392578, 22.539539337158203, 23.973785400390625, 25.408031463623047, 26.84227752685547, 28.276521682739258, 29.71076774597168, 31.1450138092041, 32.57925796508789, 34.01350402832031, 35.447750091552734, 36.881996154785156, 38.31624221801758, 39.75048828125, 41.184730529785156, 42.61897659301758, 44.05322265625, 45.48746871948242, 46.921714782714844]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 8.0, 9.0, 6.0, 9.0, 9.0, 14.0, 13.0, 14.0, 16.0, 33.0, 25.0, 30.0, 37.0, 28.0, 45.0, 43.0, 53.0, 42.0, 58.0, 45.0, 50.0, 46.0, 46.0, 42.0, 31.0, 39.0, 57.0, 26.0, 18.0, 22.0, 27.0, 19.0, 14.0, 6.0, 12.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.106409072875977, -22.493146896362305, -21.879884719848633, -21.26662254333496, -20.65336036682129, -20.040098190307617, -19.426836013793945, -18.813573837280273, -18.2003116607666, -17.58704948425293, -16.973787307739258, -16.360525131225586, -15.747262954711914, -15.134000778198242, -14.52073860168457, -13.907476425170898, -13.294214248657227, -12.680952072143555, -12.067689895629883, -11.454427719116211, -10.841165542602539, -10.227903366088867, -9.614641189575195, -9.001379013061523, -8.388116836547852, -7.77485466003418, -7.161592483520508, -6.548330307006836, -5.935068130493164, -5.321805953979492, -4.70854377746582, -4.095281600952148, -3.4820213317871094, -2.8687591552734375, -2.2554969787597656, -1.6422348022460938, -1.0289726257324219, -0.41571044921875, 0.19755172729492188, 0.8108139038085938, 1.4240760803222656, 2.0373382568359375, 2.6506004333496094, 3.2638626098632812, 3.877124786376953, 4.490386962890625, 5.103649139404297, 5.716911315917969, 6.330173492431641, 6.9434356689453125, 7.556697845458984, 8.169960021972656, 8.783222198486328, 9.396484375, 10.009746551513672, 10.623008728027344, 11.236270904541016, 11.849533081054688, 12.46279525756836, 13.076057434082031, 13.689319610595703, 14.302581787109375, 14.915843963623047, 15.529106140136719, 16.14236831665039]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 2.0, 10.0, 6.0, 6.0, 12.0, 8.0, 20.0, 26.0, 30.0, 43.0, 86.0, 111.0, 193.0, 315.0, 464.0, 862.0, 1566.0, 2900.0, 6531.0, 18674.0, 70629.0, 517086.0, 3309333.0, 207096.0, 39012.0, 11179.0, 4042.0, 1879.0, 884.0, 510.0, 287.0, 170.0, 97.0, 67.0, 46.0, 26.0, 16.0, 19.0, 9.0, 9.0, 4.0, 8.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.015625, -8.7364501953125, -8.457275390625, -8.1781005859375, -7.89892578125, -7.6197509765625, -7.340576171875, -7.0614013671875, -6.7822265625, -6.5030517578125, -6.223876953125, -5.9447021484375, -5.66552734375, -5.3863525390625, -5.107177734375, -4.8280029296875, -4.548828125, -4.2696533203125, -3.990478515625, -3.7113037109375, -3.43212890625, -3.1529541015625, -2.873779296875, -2.5946044921875, -2.3154296875, -2.0362548828125, -1.757080078125, -1.4779052734375, -1.19873046875, -0.9195556640625, -0.640380859375, -0.3612060546875, -0.08203125, 0.1971435546875, 0.476318359375, 0.7554931640625, 1.03466796875, 1.3138427734375, 1.593017578125, 1.8721923828125, 2.1513671875, 2.4305419921875, 2.709716796875, 2.9888916015625, 3.26806640625, 3.5472412109375, 3.826416015625, 4.1055908203125, 4.384765625, 4.6639404296875, 4.943115234375, 5.2222900390625, 5.50146484375, 5.7806396484375, 6.059814453125, 6.3389892578125, 6.6181640625, 6.8973388671875, 7.176513671875, 7.4556884765625, 7.73486328125, 8.0140380859375, 8.293212890625, 8.5723876953125, 8.8515625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 10.0, 17.0, 13.0, 34.0, 38.0, 44.0, 74.0, 79.0, 97.0, 93.0, 95.0, 103.0, 62.0, 78.0, 52.0, 36.0, 22.0, 23.0, 5.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6826171875, -0.6588211059570312, -0.6350250244140625, -0.6112289428710938, -0.587432861328125, -0.5636367797851562, -0.5398406982421875, -0.5160446166992188, -0.49224853515625, -0.46845245361328125, -0.4446563720703125, -0.42086029052734375, -0.397064208984375, -0.37326812744140625, -0.3494720458984375, -0.32567596435546875, -0.3018798828125, -0.27808380126953125, -0.2542877197265625, -0.23049163818359375, -0.206695556640625, -0.18289947509765625, -0.1591033935546875, -0.13530731201171875, -0.11151123046875, -0.08771514892578125, -0.0639190673828125, -0.04012298583984375, -0.016326904296875, 0.00746917724609375, 0.0312652587890625, 0.05506134033203125, 0.078857421875, 0.10265350341796875, 0.1264495849609375, 0.15024566650390625, 0.174041748046875, 0.19783782958984375, 0.2216339111328125, 0.24542999267578125, 0.26922607421875, 0.29302215576171875, 0.3168182373046875, 0.34061431884765625, 0.364410400390625, 0.38820648193359375, 0.4120025634765625, 0.43579864501953125, 0.4595947265625, 0.48339080810546875, 0.5071868896484375, 0.5309829711914062, 0.554779052734375, 0.5785751342773438, 0.6023712158203125, 0.6261672973632812, 0.64996337890625, 0.6737594604492188, 0.6975555419921875, 0.7213516235351562, 0.745147705078125, 0.7689437866210938, 0.7927398681640625, 0.8165359497070312, 0.84033203125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 2.0, 5.0, 10.0, 13.0, 22.0, 32.0, 51.0, 93.0, 159.0, 270.0, 560.0, 1054.0, 2289.0, 5440.0, 15856.0, 58963.0, 306659.0, 2967962.0, 688198.0, 106934.0, 25552.0, 8142.0, 3159.0, 1359.0, 645.0, 369.0, 204.0, 105.0, 68.0, 37.0, 28.0, 17.0, 10.0, 6.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8828125, -8.62677001953125, -8.3707275390625, -8.11468505859375, -7.858642578125, -7.60260009765625, -7.3465576171875, -7.09051513671875, -6.83447265625, -6.57843017578125, -6.3223876953125, -6.06634521484375, -5.810302734375, -5.55426025390625, -5.2982177734375, -5.04217529296875, -4.7861328125, -4.53009033203125, -4.2740478515625, -4.01800537109375, -3.761962890625, -3.50592041015625, -3.2498779296875, -2.99383544921875, -2.73779296875, -2.48175048828125, -2.2257080078125, -1.96966552734375, -1.713623046875, -1.45758056640625, -1.2015380859375, -0.94549560546875, -0.689453125, -0.43341064453125, -0.1773681640625, 0.07867431640625, 0.334716796875, 0.59075927734375, 0.8468017578125, 1.10284423828125, 1.35888671875, 1.61492919921875, 1.8709716796875, 2.12701416015625, 2.383056640625, 2.63909912109375, 2.8951416015625, 3.15118408203125, 3.4072265625, 3.66326904296875, 3.9193115234375, 4.17535400390625, 4.431396484375, 4.68743896484375, 4.9434814453125, 5.19952392578125, 5.45556640625, 5.71160888671875, 5.9676513671875, 6.22369384765625, 6.479736328125, 6.73577880859375, 6.9918212890625, 7.24786376953125, 7.50390625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 20.0, 18.0, 22.0, 28.0, 43.0, 63.0, 82.0, 121.0, 196.0, 297.0, 615.0, 1235.0, 472.0, 280.0, 165.0, 126.0, 79.0, 52.0, 36.0, 28.0, 21.0, 17.0, 14.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6689453125, -1.6156768798828125, -1.562408447265625, -1.5091400146484375, -1.45587158203125, -1.4026031494140625, -1.349334716796875, -1.2960662841796875, -1.2427978515625, -1.1895294189453125, -1.136260986328125, -1.0829925537109375, -1.02972412109375, -0.9764556884765625, -0.923187255859375, -0.8699188232421875, -0.816650390625, -0.7633819580078125, -0.710113525390625, -0.6568450927734375, -0.60357666015625, -0.5503082275390625, -0.497039794921875, -0.4437713623046875, -0.3905029296875, -0.3372344970703125, -0.283966064453125, -0.2306976318359375, -0.17742919921875, -0.1241607666015625, -0.070892333984375, -0.0176239013671875, 0.03564453125, 0.0889129638671875, 0.142181396484375, 0.1954498291015625, 0.24871826171875, 0.3019866943359375, 0.355255126953125, 0.4085235595703125, 0.4617919921875, 0.5150604248046875, 0.568328857421875, 0.6215972900390625, 0.67486572265625, 0.7281341552734375, 0.781402587890625, 0.8346710205078125, 0.887939453125, 0.9412078857421875, 0.994476318359375, 1.0477447509765625, 1.10101318359375, 1.1542816162109375, 1.207550048828125, 1.2608184814453125, 1.3140869140625, 1.3673553466796875, 1.420623779296875, 1.4738922119140625, 1.52716064453125, 1.5804290771484375, 1.633697509765625, 1.6869659423828125, 1.740234375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 9.0, 24.0, 80.0, 146.0, 262.0, 245.0, 134.0, 72.0, 21.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.82246208190918, -7.0359930992126465, -6.249524116516113, -5.463055610656738, -4.676586627960205, -3.890117645263672, -3.103649139404297, -2.3171801567077637, -1.5307111740112305, -0.7442423105239868, 0.042226552963256836, 0.8286952972412109, 1.6151642799377441, 2.4016332626342773, 3.1881017684936523, 3.9745707511901855, 4.761039733886719, 5.547508716583252, 6.333977699279785, 7.12044620513916, 7.906915187835693, 8.693384170532227, 9.479852676391602, 10.266321182250977, 11.052790641784668, 11.839259147644043, 12.625728607177734, 13.41219711303711, 14.198665618896484, 14.985135078430176, 15.77160358428955, 16.558073043823242, 17.344539642333984, 18.13100814819336, 18.917476654052734, 19.70394515991211, 20.490415573120117, 21.276884078979492, 22.063352584838867, 22.849821090698242, 23.63629150390625, 24.422760009765625, 25.209228515625, 25.995697021484375, 26.782167434692383, 27.568635940551758, 28.355104446411133, 29.141572952270508, 29.928041458129883, 30.714509963989258, 31.500978469848633, 32.28744888305664, 33.073917388916016, 33.86038589477539, 34.646854400634766, 35.43332290649414, 36.219791412353516, 37.00625991821289, 37.792728424072266, 38.57919692993164, 39.365665435791016, 40.152137756347656, 40.93860626220703, 41.725074768066406, 42.51154327392578]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 4.0, 5.0, 5.0, 3.0, 10.0, 7.0, 10.0, 6.0, 14.0, 14.0, 25.0, 13.0, 20.0, 30.0, 26.0, 22.0, 33.0, 39.0, 29.0, 29.0, 44.0, 39.0, 36.0, 44.0, 42.0, 49.0, 34.0, 26.0, 34.0, 28.0, 32.0, 33.0, 30.0, 28.0, 23.0, 17.0, 12.0, 15.0, 20.0, 10.0, 10.0, 9.0, 4.0, 8.0, 8.0, 3.0, 4.0, 2.0, 3.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.300272464752197, -5.127559185028076, -4.954845905303955, -4.782133102416992, -4.609419822692871, -4.43670654296875, -4.263993263244629, -4.091279983520508, -3.918566942214966, -3.7458536624908447, -3.5731406211853027, -3.4004273414611816, -3.2277140617370605, -3.0550010204315186, -2.8822877407073975, -2.7095746994018555, -2.5368614196777344, -2.3641481399536133, -2.1914350986480713, -2.01872181892395, -1.8460086584091187, -1.673295497894287, -1.500582218170166, -1.3278690576553345, -1.155155897140503, -0.9824427366256714, -0.8097295165061951, -0.6370162963867188, -0.4643031358718872, -0.29158997535705566, -0.11887669563293457, 0.05383646488189697, 0.22655010223388672, 0.39926329255104065, 0.5719764828681946, 0.7446897029876709, 0.9174028635025024, 1.090116024017334, 1.262829303741455, 1.4355424642562866, 1.6082556247711182, 1.7809687852859497, 1.9536819458007812, 2.1263952255249023, 2.2991085052490234, 2.4718215465545654, 2.6445348262786865, 2.8172478675842285, 2.9899611473083496, 3.1626744270324707, 3.3353874683380127, 3.508100748062134, 3.680813789367676, 3.853527069091797, 4.026240348815918, 4.198953628540039, 4.37166690826416, 4.544380187988281, 4.717093467712402, 4.889806747436523, 5.062519550323486, 5.235232830047607, 5.4079461097717285, 5.58065938949585, 5.7533721923828125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 6.0, 4.0, 10.0, 30.0, 14.0, 29.0, 44.0, 79.0, 85.0, 147.0, 179.0, 307.0, 457.0, 687.0, 1236.0, 2436.0, 5128.0, 11746.0, 27741.0, 66950.0, 152545.0, 283770.0, 262583.0, 131772.0, 57337.0, 23806.0, 9934.0, 4481.0, 2140.0, 1119.0, 591.0, 403.0, 253.0, 138.0, 111.0, 72.0, 37.0, 42.0, 31.0, 27.0, 11.0, 12.0, 12.0, 5.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.529296875, -3.411285400390625, -3.29327392578125, -3.175262451171875, -3.0572509765625, -2.939239501953125, -2.82122802734375, -2.703216552734375, -2.585205078125, -2.467193603515625, -2.34918212890625, -2.231170654296875, -2.1131591796875, -1.995147705078125, -1.87713623046875, -1.759124755859375, -1.64111328125, -1.523101806640625, -1.40509033203125, -1.287078857421875, -1.1690673828125, -1.051055908203125, -0.93304443359375, -0.815032958984375, -0.697021484375, -0.579010009765625, -0.46099853515625, -0.342987060546875, -0.2249755859375, -0.106964111328125, 0.01104736328125, 0.129058837890625, 0.2470703125, 0.365081787109375, 0.48309326171875, 0.601104736328125, 0.7191162109375, 0.837127685546875, 0.95513916015625, 1.073150634765625, 1.191162109375, 1.309173583984375, 1.42718505859375, 1.545196533203125, 1.6632080078125, 1.781219482421875, 1.89923095703125, 2.017242431640625, 2.13525390625, 2.253265380859375, 2.37127685546875, 2.489288330078125, 2.6072998046875, 2.725311279296875, 2.84332275390625, 2.961334228515625, 3.079345703125, 3.197357177734375, 3.31536865234375, 3.433380126953125, 3.5513916015625, 3.669403076171875, 3.78741455078125, 3.905426025390625, 4.0234375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 4.0, 13.0, 15.0, 21.0, 28.0, 47.0, 53.0, 48.0, 75.0, 81.0, 98.0, 88.0, 61.0, 75.0, 72.0, 67.0, 46.0, 31.0, 25.0, 18.0, 13.0, 5.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70263671875, -0.6776351928710938, -0.6526336669921875, -0.6276321411132812, -0.602630615234375, -0.5776290893554688, -0.5526275634765625, -0.5276260375976562, -0.50262451171875, -0.47762298583984375, -0.4526214599609375, -0.42761993408203125, -0.402618408203125, -0.37761688232421875, -0.3526153564453125, -0.32761383056640625, -0.3026123046875, -0.27761077880859375, -0.2526092529296875, -0.22760772705078125, -0.202606201171875, -0.17760467529296875, -0.1526031494140625, -0.12760162353515625, -0.10260009765625, -0.07759857177734375, -0.0525970458984375, -0.02759552001953125, -0.002593994140625, 0.02240753173828125, 0.0474090576171875, 0.07241058349609375, 0.097412109375, 0.12241363525390625, 0.1474151611328125, 0.17241668701171875, 0.197418212890625, 0.22241973876953125, 0.2474212646484375, 0.27242279052734375, 0.29742431640625, 0.32242584228515625, 0.3474273681640625, 0.37242889404296875, 0.397430419921875, 0.42243194580078125, 0.4474334716796875, 0.47243499755859375, 0.4974365234375, 0.5224380493164062, 0.5474395751953125, 0.5724411010742188, 0.597442626953125, 0.6224441528320312, 0.6474456787109375, 0.6724472045898438, 0.69744873046875, 0.7224502563476562, 0.7474517822265625, 0.7724533081054688, 0.797454833984375, 0.8224563598632812, 0.8474578857421875, 0.8724594116210938, 0.8974609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 10.0, 8.0, 16.0, 13.0, 31.0, 25.0, 41.0, 45.0, 67.0, 92.0, 115.0, 196.0, 238.0, 415.0, 660.0, 1092.0, 2220.0, 4881.0, 12960.0, 35309.0, 103167.0, 315049.0, 374857.0, 126483.0, 43323.0, 15454.0, 5864.0, 2554.0, 1279.0, 681.0, 424.0, 275.0, 192.0, 151.0, 107.0, 72.0, 47.0, 40.0, 24.0, 20.0, 11.0, 23.0, 9.0, 5.0, 4.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.16796875, -5.987060546875, -5.80615234375, -5.625244140625, -5.4443359375, -5.263427734375, -5.08251953125, -4.901611328125, -4.720703125, -4.539794921875, -4.35888671875, -4.177978515625, -3.9970703125, -3.816162109375, -3.63525390625, -3.454345703125, -3.2734375, -3.092529296875, -2.91162109375, -2.730712890625, -2.5498046875, -2.368896484375, -2.18798828125, -2.007080078125, -1.826171875, -1.645263671875, -1.46435546875, -1.283447265625, -1.1025390625, -0.921630859375, -0.74072265625, -0.559814453125, -0.37890625, -0.197998046875, -0.01708984375, 0.163818359375, 0.3447265625, 0.525634765625, 0.70654296875, 0.887451171875, 1.068359375, 1.249267578125, 1.43017578125, 1.611083984375, 1.7919921875, 1.972900390625, 2.15380859375, 2.334716796875, 2.515625, 2.696533203125, 2.87744140625, 3.058349609375, 3.2392578125, 3.420166015625, 3.60107421875, 3.781982421875, 3.962890625, 4.143798828125, 4.32470703125, 4.505615234375, 4.6865234375, 4.867431640625, 5.04833984375, 5.229248046875, 5.41015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 5.0, 8.0, 6.0, 15.0, 10.0, 13.0, 26.0, 16.0, 18.0, 30.0, 34.0, 40.0, 40.0, 35.0, 42.0, 60.0, 55.0, 53.0, 41.0, 44.0, 56.0, 65.0, 43.0, 32.0, 35.0, 20.0, 26.0, 31.0, 14.0, 23.0, 22.0, 14.0, 13.0, 4.0, 7.0, 5.0, 0.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.466796875, -3.351409912109375, -3.23602294921875, -3.120635986328125, -3.0052490234375, -2.889862060546875, -2.77447509765625, -2.659088134765625, -2.543701171875, -2.428314208984375, -2.31292724609375, -2.197540283203125, -2.0821533203125, -1.966766357421875, -1.85137939453125, -1.735992431640625, -1.62060546875, -1.505218505859375, -1.38983154296875, -1.274444580078125, -1.1590576171875, -1.043670654296875, -0.92828369140625, -0.812896728515625, -0.697509765625, -0.582122802734375, -0.46673583984375, -0.351348876953125, -0.2359619140625, -0.120574951171875, -0.00518798828125, 0.110198974609375, 0.2255859375, 0.340972900390625, 0.45635986328125, 0.571746826171875, 0.6871337890625, 0.802520751953125, 0.91790771484375, 1.033294677734375, 1.148681640625, 1.264068603515625, 1.37945556640625, 1.494842529296875, 1.6102294921875, 1.725616455078125, 1.84100341796875, 1.956390380859375, 2.07177734375, 2.187164306640625, 2.30255126953125, 2.417938232421875, 2.5333251953125, 2.648712158203125, 2.76409912109375, 2.879486083984375, 2.994873046875, 3.110260009765625, 3.22564697265625, 3.341033935546875, 3.4564208984375, 3.571807861328125, 3.68719482421875, 3.802581787109375, 3.91796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 4.0, 9.0, 11.0, 17.0, 20.0, 31.0, 34.0, 60.0, 100.0, 112.0, 172.0, 279.0, 465.0, 765.0, 1144.0, 2068.0, 3851.0, 7218.0, 14944.0, 34870.0, 94773.0, 332971.0, 373677.0, 108273.0, 38696.0, 16441.0, 7899.0, 4017.0, 2215.0, 1255.0, 785.0, 459.0, 327.0, 199.0, 134.0, 67.0, 57.0, 37.0, 28.0, 28.0, 12.0, 10.0, 11.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.634765625, -3.524810791015625, -3.41485595703125, -3.304901123046875, -3.1949462890625, -3.084991455078125, -2.97503662109375, -2.865081787109375, -2.755126953125, -2.645172119140625, -2.53521728515625, -2.425262451171875, -2.3153076171875, -2.205352783203125, -2.09539794921875, -1.985443115234375, -1.87548828125, -1.765533447265625, -1.65557861328125, -1.545623779296875, -1.4356689453125, -1.325714111328125, -1.21575927734375, -1.105804443359375, -0.995849609375, -0.885894775390625, -0.77593994140625, -0.665985107421875, -0.5560302734375, -0.446075439453125, -0.33612060546875, -0.226165771484375, -0.1162109375, -0.006256103515625, 0.10369873046875, 0.213653564453125, 0.3236083984375, 0.433563232421875, 0.54351806640625, 0.653472900390625, 0.763427734375, 0.873382568359375, 0.98333740234375, 1.093292236328125, 1.2032470703125, 1.313201904296875, 1.42315673828125, 1.533111572265625, 1.64306640625, 1.753021240234375, 1.86297607421875, 1.972930908203125, 2.0828857421875, 2.192840576171875, 2.30279541015625, 2.412750244140625, 2.522705078125, 2.632659912109375, 2.74261474609375, 2.852569580078125, 2.9625244140625, 3.072479248046875, 3.18243408203125, 3.292388916015625, 3.40234375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 7.0, 8.0, 11.0, 14.0, 23.0, 35.0, 46.0, 43.0, 70.0, 140.0, 219.0, 128.0, 78.0, 45.0, 41.0, 28.0, 15.0, 14.0, 8.0, 7.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008697509765625, -0.0008422061800956726, -0.0008146613836288452, -0.0007871165871620178, -0.0007595717906951904, -0.000732026994228363, -0.0007044821977615356, -0.0006769374012947083, -0.0006493926048278809, -0.0006218478083610535, -0.0005943030118942261, -0.0005667582154273987, -0.0005392134189605713, -0.0005116686224937439, -0.0004841238260269165, -0.0004565790295600891, -0.0004290342330932617, -0.0004014894366264343, -0.00037394464015960693, -0.00034639984369277954, -0.00031885504722595215, -0.00029131025075912476, -0.00026376545429229736, -0.00023622065782546997, -0.00020867586135864258, -0.00018113106489181519, -0.0001535862684249878, -0.0001260414719581604, -9.849667549133301e-05, -7.095187902450562e-05, -4.340708255767822e-05, -1.586228609085083e-05, 1.1682510375976562e-05, 3.9227306842803955e-05, 6.677210330963135e-05, 9.431689977645874e-05, 0.00012186169624328613, 0.00014940649271011353, 0.00017695128917694092, 0.0002044960856437683, 0.0002320408821105957, 0.0002595856785774231, 0.0002871304750442505, 0.0003146752715110779, 0.0003422200679779053, 0.00036976486444473267, 0.00039730966091156006, 0.00042485445737838745, 0.00045239925384521484, 0.00047994405031204224, 0.0005074888467788696, 0.000535033643245697, 0.0005625784397125244, 0.0005901232361793518, 0.0006176680326461792, 0.0006452128291130066, 0.000672757625579834, 0.0007003024220466614, 0.0007278472185134888, 0.0007553920149803162, 0.0007829368114471436, 0.000810481607913971, 0.0008380264043807983, 0.0008655712008476257, 0.0008931159973144531]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 12.0, 16.0, 17.0, 19.0, 26.0, 34.0, 51.0, 86.0, 137.0, 217.0, 383.0, 697.0, 1600.0, 3977.0, 11606.0, 39504.0, 203129.0, 646230.0, 103090.0, 24700.0, 7626.0, 2756.0, 1205.0, 581.0, 308.0, 189.0, 107.0, 60.0, 49.0, 32.0, 20.0, 20.0, 11.0, 14.0, 5.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.05078125, -6.8326416015625, -6.614501953125, -6.3963623046875, -6.17822265625, -5.9600830078125, -5.741943359375, -5.5238037109375, -5.3056640625, -5.0875244140625, -4.869384765625, -4.6512451171875, -4.43310546875, -4.2149658203125, -3.996826171875, -3.7786865234375, -3.560546875, -3.3424072265625, -3.124267578125, -2.9061279296875, -2.68798828125, -2.4698486328125, -2.251708984375, -2.0335693359375, -1.8154296875, -1.5972900390625, -1.379150390625, -1.1610107421875, -0.94287109375, -0.7247314453125, -0.506591796875, -0.2884521484375, -0.0703125, 0.1478271484375, 0.365966796875, 0.5841064453125, 0.80224609375, 1.0203857421875, 1.238525390625, 1.4566650390625, 1.6748046875, 1.8929443359375, 2.111083984375, 2.3292236328125, 2.54736328125, 2.7655029296875, 2.983642578125, 3.2017822265625, 3.419921875, 3.6380615234375, 3.856201171875, 4.0743408203125, 4.29248046875, 4.5106201171875, 4.728759765625, 4.9468994140625, 5.1650390625, 5.3831787109375, 5.601318359375, 5.8194580078125, 6.03759765625, 6.2557373046875, 6.473876953125, 6.6920166015625, 6.91015625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 8.0, 7.0, 9.0, 8.0, 11.0, 12.0, 17.0, 17.0, 20.0, 27.0, 22.0, 48.0, 60.0, 73.0, 92.0, 118.0, 104.0, 69.0, 56.0, 30.0, 29.0, 30.0, 28.0, 18.0, 12.0, 12.0, 11.0, 6.0, 7.0, 5.0, 4.0, 1.0, 4.0, 6.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.873046875, -2.781707763671875, -2.69036865234375, -2.599029541015625, -2.5076904296875, -2.416351318359375, -2.32501220703125, -2.233673095703125, -2.142333984375, -2.050994873046875, -1.95965576171875, -1.868316650390625, -1.7769775390625, -1.685638427734375, -1.59429931640625, -1.502960205078125, -1.41162109375, -1.320281982421875, -1.22894287109375, -1.137603759765625, -1.0462646484375, -0.954925537109375, -0.86358642578125, -0.772247314453125, -0.680908203125, -0.589569091796875, -0.49822998046875, -0.406890869140625, -0.3155517578125, -0.224212646484375, -0.13287353515625, -0.041534423828125, 0.0498046875, 0.141143798828125, 0.23248291015625, 0.323822021484375, 0.4151611328125, 0.506500244140625, 0.59783935546875, 0.689178466796875, 0.780517578125, 0.871856689453125, 0.96319580078125, 1.054534912109375, 1.1458740234375, 1.237213134765625, 1.32855224609375, 1.419891357421875, 1.51123046875, 1.602569580078125, 1.69390869140625, 1.785247802734375, 1.8765869140625, 1.967926025390625, 2.05926513671875, 2.150604248046875, 2.241943359375, 2.333282470703125, 2.42462158203125, 2.515960693359375, 2.6072998046875, 2.698638916015625, 2.78997802734375, 2.881317138671875, 2.97265625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 7.0, 6.0, 12.0, 25.0, 65.0, 105.0, 136.0, 189.0, 165.0, 122.0, 88.0, 34.0, 19.0, 8.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.42875671386719, -53.49612045288086, -51.56348419189453, -49.6308479309082, -47.698211669921875, -45.76557540893555, -43.83293914794922, -41.90030288696289, -39.96766662597656, -38.035030364990234, -36.102394104003906, -34.16975784301758, -32.23712158203125, -30.304485321044922, -28.371849060058594, -26.439212799072266, -24.506576538085938, -22.57394027709961, -20.64130401611328, -18.708667755126953, -16.776031494140625, -14.843395233154297, -12.910758972167969, -10.97812271118164, -9.045486450195312, -7.112850189208984, -5.180213928222656, -3.247577667236328, -1.31494140625, 0.6176948547363281, 2.5503311157226562, 4.482967376708984, 6.4156036376953125, 8.34823989868164, 10.280876159667969, 12.213512420654297, 14.146148681640625, 16.078784942626953, 18.01142120361328, 19.94405746459961, 21.876693725585938, 23.809329986572266, 25.741966247558594, 27.674602508544922, 29.60723876953125, 31.539875030517578, 33.472511291503906, 35.405147552490234, 37.33778381347656, 39.27042007446289, 41.20305633544922, 43.13569259643555, 45.068328857421875, 47.0009651184082, 48.93360137939453, 50.86623764038086, 52.79887390136719, 54.731510162353516, 56.664146423339844, 58.59678268432617, 60.5294189453125, 62.46205520629883, 64.39469146728516, 66.32733154296875, 68.25996398925781]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 3.0, 3.0, 5.0, 6.0, 6.0, 18.0, 11.0, 10.0, 10.0, 17.0, 22.0, 20.0, 25.0, 32.0, 37.0, 22.0, 25.0, 41.0, 28.0, 37.0, 39.0, 49.0, 41.0, 35.0, 47.0, 38.0, 35.0, 31.0, 32.0, 38.0, 25.0, 33.0, 16.0, 23.0, 20.0, 16.0, 23.0, 14.0, 17.0, 9.0, 11.0, 9.0, 4.0, 4.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-23.590604782104492, -22.92235565185547, -22.254106521606445, -21.585857391357422, -20.917606353759766, -20.249357223510742, -19.58110809326172, -18.912858963012695, -18.244609832763672, -17.57636070251465, -16.908111572265625, -16.2398624420166, -15.571612358093262, -14.903363227844238, -14.235113143920898, -13.566864013671875, -12.898614883422852, -12.230365753173828, -11.562116622924805, -10.893866539001465, -10.225617408752441, -9.557368278503418, -8.889118194580078, -8.220869064331055, -7.552619934082031, -6.884370803833008, -6.216121196746826, -5.5478715896606445, -4.879622459411621, -4.211373329162598, -3.543123722076416, -2.8748741149902344, -2.206623077392578, -1.5383737087249756, -0.870124340057373, -0.2018749713897705, 0.46637439727783203, 1.1346237659454346, 1.802873134613037, 2.4711227416992188, 3.139371871948242, 3.8076212406158447, 4.475870609283447, 5.144120216369629, 5.812369346618652, 6.480618476867676, 7.148868083953857, 7.817117691040039, 8.485366821289062, 9.153615951538086, 9.82186508178711, 10.49011516571045, 11.158364295959473, 11.826613426208496, 12.494863510131836, 13.16311264038086, 13.831361770629883, 14.499610900878906, 15.16786003112793, 15.83611011505127, 16.50436019897461, 17.172609329223633, 17.840858459472656, 18.50910758972168, 19.177356719970703]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 7.0, 10.0, 8.0, 19.0, 25.0, 51.0, 59.0, 119.0, 202.0, 377.0, 604.0, 1326.0, 2949.0, 7939.0, 24670.0, 103605.0, 1681283.0, 2224774.0, 107515.0, 25596.0, 7802.0, 2868.0, 1191.0, 565.0, 302.0, 160.0, 105.0, 42.0, 46.0, 14.0, 25.0, 7.0, 5.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.05859375, -6.81524658203125, -6.5718994140625, -6.32855224609375, -6.085205078125, -5.84185791015625, -5.5985107421875, -5.35516357421875, -5.11181640625, -4.86846923828125, -4.6251220703125, -4.38177490234375, -4.138427734375, -3.89508056640625, -3.6517333984375, -3.40838623046875, -3.1650390625, -2.92169189453125, -2.6783447265625, -2.43499755859375, -2.191650390625, -1.94830322265625, -1.7049560546875, -1.46160888671875, -1.21826171875, -0.97491455078125, -0.7315673828125, -0.48822021484375, -0.244873046875, -0.00152587890625, 0.2418212890625, 0.48516845703125, 0.728515625, 0.97186279296875, 1.2152099609375, 1.45855712890625, 1.701904296875, 1.94525146484375, 2.1885986328125, 2.43194580078125, 2.67529296875, 2.91864013671875, 3.1619873046875, 3.40533447265625, 3.648681640625, 3.89202880859375, 4.1353759765625, 4.37872314453125, 4.6220703125, 4.86541748046875, 5.1087646484375, 5.35211181640625, 5.595458984375, 5.83880615234375, 6.0821533203125, 6.32550048828125, 6.56884765625, 6.81219482421875, 7.0555419921875, 7.29888916015625, 7.542236328125, 7.78558349609375, 8.0289306640625, 8.27227783203125, 8.515625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 5.0, 6.0, 7.0, 11.0, 21.0, 25.0, 33.0, 37.0, 50.0, 59.0, 57.0, 76.0, 78.0, 78.0, 81.0, 76.0, 55.0, 52.0, 49.0, 38.0, 30.0, 20.0, 21.0, 12.0, 10.0, 8.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88623046875, -0.8570480346679688, -0.8278656005859375, -0.7986831665039062, -0.769500732421875, -0.7403182983398438, -0.7111358642578125, -0.6819534301757812, -0.65277099609375, -0.6235885620117188, -0.5944061279296875, -0.5652236938476562, -0.536041259765625, -0.5068588256835938, -0.4776763916015625, -0.44849395751953125, -0.4193115234375, -0.39012908935546875, -0.3609466552734375, -0.33176422119140625, -0.302581787109375, -0.27339935302734375, -0.2442169189453125, -0.21503448486328125, -0.18585205078125, -0.15666961669921875, -0.1274871826171875, -0.09830474853515625, -0.069122314453125, -0.03993988037109375, -0.0107574462890625, 0.01842498779296875, 0.047607421875, 0.07678985595703125, 0.1059722900390625, 0.13515472412109375, 0.164337158203125, 0.19351959228515625, 0.2227020263671875, 0.25188446044921875, 0.28106689453125, 0.31024932861328125, 0.3394317626953125, 0.36861419677734375, 0.397796630859375, 0.42697906494140625, 0.4561614990234375, 0.48534393310546875, 0.5145263671875, 0.5437088012695312, 0.5728912353515625, 0.6020736694335938, 0.631256103515625, 0.6604385375976562, 0.6896209716796875, 0.7188034057617188, 0.74798583984375, 0.7771682739257812, 0.8063507080078125, 0.8355331420898438, 0.864715576171875, 0.8938980102539062, 0.9230804443359375, 0.9522628784179688, 0.9814453125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 16.0, 19.0, 36.0, 56.0, 74.0, 137.0, 240.0, 421.0, 1155.0, 4059.0, 20540.0, 194805.0, 3687624.0, 252060.0, 25288.0, 5012.0, 1453.0, 575.0, 277.0, 154.0, 111.0, 61.0, 46.0, 26.0, 11.0, 9.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0546875, -12.653564453125, -12.25244140625, -11.851318359375, -11.4501953125, -11.049072265625, -10.64794921875, -10.246826171875, -9.845703125, -9.444580078125, -9.04345703125, -8.642333984375, -8.2412109375, -7.840087890625, -7.43896484375, -7.037841796875, -6.63671875, -6.235595703125, -5.83447265625, -5.433349609375, -5.0322265625, -4.631103515625, -4.22998046875, -3.828857421875, -3.427734375, -3.026611328125, -2.62548828125, -2.224365234375, -1.8232421875, -1.422119140625, -1.02099609375, -0.619873046875, -0.21875, 0.182373046875, 0.58349609375, 0.984619140625, 1.3857421875, 1.786865234375, 2.18798828125, 2.589111328125, 2.990234375, 3.391357421875, 3.79248046875, 4.193603515625, 4.5947265625, 4.995849609375, 5.39697265625, 5.798095703125, 6.19921875, 6.600341796875, 7.00146484375, 7.402587890625, 7.8037109375, 8.204833984375, 8.60595703125, 9.007080078125, 9.408203125, 9.809326171875, 10.21044921875, 10.611572265625, 11.0126953125, 11.413818359375, 11.81494140625, 12.216064453125, 12.6171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 6.0, 7.0, 17.0, 16.0, 37.0, 71.0, 99.0, 202.0, 488.0, 1974.0, 617.0, 228.0, 124.0, 71.0, 40.0, 27.0, 17.0, 11.0, 9.0, 8.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6328125, -2.54083251953125, -2.4488525390625, -2.35687255859375, -2.264892578125, -2.17291259765625, -2.0809326171875, -1.98895263671875, -1.89697265625, -1.80499267578125, -1.7130126953125, -1.62103271484375, -1.529052734375, -1.43707275390625, -1.3450927734375, -1.25311279296875, -1.1611328125, -1.06915283203125, -0.9771728515625, -0.88519287109375, -0.793212890625, -0.70123291015625, -0.6092529296875, -0.51727294921875, -0.42529296875, -0.33331298828125, -0.2413330078125, -0.14935302734375, -0.057373046875, 0.03460693359375, 0.1265869140625, 0.21856689453125, 0.310546875, 0.40252685546875, 0.4945068359375, 0.58648681640625, 0.678466796875, 0.77044677734375, 0.8624267578125, 0.95440673828125, 1.04638671875, 1.13836669921875, 1.2303466796875, 1.32232666015625, 1.414306640625, 1.50628662109375, 1.5982666015625, 1.69024658203125, 1.7822265625, 1.87420654296875, 1.9661865234375, 2.05816650390625, 2.150146484375, 2.24212646484375, 2.3341064453125, 2.42608642578125, 2.51806640625, 2.61004638671875, 2.7020263671875, 2.79400634765625, 2.885986328125, 2.97796630859375, 3.0699462890625, 3.16192626953125, 3.25390625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 5.0, 11.0, 33.0, 146.0, 269.0, 298.0, 145.0, 71.0, 22.0, 7.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.972281455993652, -6.981586456298828, -5.990891456604004, -5.00019645690918, -4.0095014572143555, -3.0188069343566895, -2.0281119346618652, -1.037416934967041, -0.0467219352722168, 0.9439730048179626, 1.934667944908142, 2.9253628253936768, 3.916057825088501, 4.906752586364746, 5.89744758605957, 6.8881425857543945, 7.878837585449219, 8.869532585144043, 9.860227584838867, 10.850922584533691, 11.841617584228516, 12.832311630249023, 13.823007583618164, 14.813701629638672, 15.804397583007812, 16.79509162902832, 17.78578758239746, 18.77648162841797, 19.76717758178711, 20.757871627807617, 21.748567581176758, 22.739261627197266, 23.729955673217773, 24.72064971923828, 25.711345672607422, 26.70203971862793, 27.69273567199707, 28.683429718017578, 29.67412567138672, 30.664819717407227, 31.655515670776367, 32.646209716796875, 33.636905670166016, 34.627601623535156, 35.61829376220703, 36.60898971557617, 37.59968566894531, 38.59038162231445, 39.58107376098633, 40.57176971435547, 41.562461853027344, 42.553157806396484, 43.543853759765625, 44.534549713134766, 45.52524185180664, 46.51593780517578, 47.50663375854492, 48.49732971191406, 49.48802185058594, 50.47871780395508, 51.46941375732422, 52.46010971069336, 53.450801849365234, 54.441497802734375, 55.432193756103516]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 4.0, 3.0, 6.0, 3.0, 6.0, 9.0, 11.0, 6.0, 10.0, 16.0, 24.0, 18.0, 23.0, 23.0, 33.0, 29.0, 40.0, 45.0, 29.0, 39.0, 41.0, 45.0, 42.0, 43.0, 30.0, 45.0, 54.0, 28.0, 39.0, 38.0, 30.0, 31.0, 21.0, 15.0, 18.0, 16.0, 16.0, 11.0, 15.0, 8.0, 11.0, 5.0, 12.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.144221305847168, -5.9327192306518555, -5.721217155456543, -5.509714603424072, -5.29821252822876, -5.086710453033447, -4.875207901000977, -4.663705825805664, -4.452203750610352, -4.240701675415039, -4.029199600219727, -3.817697048187256, -3.6061949729919434, -3.394692897796631, -3.1831905841827393, -2.9716882705688477, -2.760186195373535, -2.5486841201782227, -2.337181806564331, -2.1256794929504395, -1.914177417755127, -1.702675223350525, -1.4911730289459229, -1.2796708345413208, -1.0681686401367188, -0.8566664457321167, -0.6451642513275146, -0.4336620569229126, -0.22215986251831055, -0.010657668113708496, 0.20084452629089355, 0.4123467206954956, 0.6238493919372559, 0.8353515863418579, 1.04685378074646, 1.258355975151062, 1.469858169555664, 1.6813603639602661, 1.8928625583648682, 2.1043648719787598, 2.3158669471740723, 2.5273690223693848, 2.7388713359832764, 2.950373649597168, 3.1618757247924805, 3.373377799987793, 3.5848801136016846, 3.796382427215576, 4.007884502410889, 4.219386577606201, 4.430889129638672, 4.642391204833984, 4.853893280029297, 5.065395355224609, 5.276897430419922, 5.488399982452393, 5.699902057647705, 5.911404132843018, 6.122906684875488, 6.334408760070801, 6.545910835266113, 6.757412910461426, 6.968914985656738, 7.180417537689209, 7.3919196128845215]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 7.0, 14.0, 15.0, 21.0, 25.0, 35.0, 61.0, 95.0, 141.0, 244.0, 343.0, 520.0, 1023.0, 1796.0, 3196.0, 6220.0, 12269.0, 25175.0, 51038.0, 105361.0, 204627.0, 278725.0, 178677.0, 90376.0, 44216.0, 21679.0, 10505.0, 5449.0, 2844.0, 1543.0, 885.0, 537.0, 330.0, 181.0, 115.0, 90.0, 60.0, 40.0, 28.0, 22.0, 8.0, 11.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.21484375, -3.1156005859375, -3.016357421875, -2.9171142578125, -2.81787109375, -2.7186279296875, -2.619384765625, -2.5201416015625, -2.4208984375, -2.3216552734375, -2.222412109375, -2.1231689453125, -2.02392578125, -1.9246826171875, -1.825439453125, -1.7261962890625, -1.626953125, -1.5277099609375, -1.428466796875, -1.3292236328125, -1.22998046875, -1.1307373046875, -1.031494140625, -0.9322509765625, -0.8330078125, -0.7337646484375, -0.634521484375, -0.5352783203125, -0.43603515625, -0.3367919921875, -0.237548828125, -0.1383056640625, -0.0390625, 0.0601806640625, 0.159423828125, 0.2586669921875, 0.35791015625, 0.4571533203125, 0.556396484375, 0.6556396484375, 0.7548828125, 0.8541259765625, 0.953369140625, 1.0526123046875, 1.15185546875, 1.2510986328125, 1.350341796875, 1.4495849609375, 1.548828125, 1.6480712890625, 1.747314453125, 1.8465576171875, 1.94580078125, 2.0450439453125, 2.144287109375, 2.2435302734375, 2.3427734375, 2.4420166015625, 2.541259765625, 2.6405029296875, 2.73974609375, 2.8389892578125, 2.938232421875, 3.0374755859375, 3.13671875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 4.0, 6.0, 10.0, 11.0, 13.0, 22.0, 27.0, 30.0, 31.0, 48.0, 47.0, 67.0, 73.0, 84.0, 61.0, 70.0, 75.0, 61.0, 40.0, 51.0, 39.0, 36.0, 20.0, 20.0, 14.0, 18.0, 3.0, 6.0, 7.0, 9.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9013671875, -0.8718338012695312, -0.8423004150390625, -0.8127670288085938, -0.783233642578125, -0.7537002563476562, -0.7241668701171875, -0.6946334838867188, -0.66510009765625, -0.6355667114257812, -0.6060333251953125, -0.5764999389648438, -0.546966552734375, -0.5174331665039062, -0.4878997802734375, -0.45836639404296875, -0.4288330078125, -0.39929962158203125, -0.3697662353515625, -0.34023284912109375, -0.310699462890625, -0.28116607666015625, -0.2516326904296875, -0.22209930419921875, -0.19256591796875, -0.16303253173828125, -0.1334991455078125, -0.10396575927734375, -0.074432373046875, -0.04489898681640625, -0.0153656005859375, 0.01416778564453125, 0.043701171875, 0.07323455810546875, 0.1027679443359375, 0.13230133056640625, 0.161834716796875, 0.19136810302734375, 0.2209014892578125, 0.25043487548828125, 0.27996826171875, 0.30950164794921875, 0.3390350341796875, 0.36856842041015625, 0.398101806640625, 0.42763519287109375, 0.4571685791015625, 0.48670196533203125, 0.5162353515625, 0.5457687377929688, 0.5753021240234375, 0.6048355102539062, 0.634368896484375, 0.6639022827148438, 0.6934356689453125, 0.7229690551757812, 0.75250244140625, 0.7820358276367188, 0.8115692138671875, 0.8411026000976562, 0.870635986328125, 0.9001693725585938, 0.9297027587890625, 0.9592361450195312, 0.98876953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 6.0, 8.0, 9.0, 8.0, 11.0, 17.0, 27.0, 35.0, 55.0, 59.0, 124.0, 177.0, 242.0, 396.0, 672.0, 1187.0, 2332.0, 5266.0, 12758.0, 36200.0, 108809.0, 307979.0, 363193.0, 136025.0, 44726.0, 15707.0, 6290.0, 2735.0, 1333.0, 764.0, 467.0, 301.0, 203.0, 131.0, 77.0, 57.0, 53.0, 31.0, 18.0, 19.0, 9.0, 9.0, 4.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.87890625, -5.716064453125, -5.55322265625, -5.390380859375, -5.2275390625, -5.064697265625, -4.90185546875, -4.739013671875, -4.576171875, -4.413330078125, -4.25048828125, -4.087646484375, -3.9248046875, -3.761962890625, -3.59912109375, -3.436279296875, -3.2734375, -3.110595703125, -2.94775390625, -2.784912109375, -2.6220703125, -2.459228515625, -2.29638671875, -2.133544921875, -1.970703125, -1.807861328125, -1.64501953125, -1.482177734375, -1.3193359375, -1.156494140625, -0.99365234375, -0.830810546875, -0.66796875, -0.505126953125, -0.34228515625, -0.179443359375, -0.0166015625, 0.146240234375, 0.30908203125, 0.471923828125, 0.634765625, 0.797607421875, 0.96044921875, 1.123291015625, 1.2861328125, 1.448974609375, 1.61181640625, 1.774658203125, 1.9375, 2.100341796875, 2.26318359375, 2.426025390625, 2.5888671875, 2.751708984375, 2.91455078125, 3.077392578125, 3.240234375, 3.403076171875, 3.56591796875, 3.728759765625, 3.8916015625, 4.054443359375, 4.21728515625, 4.380126953125, 4.54296875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 9.0, 7.0, 4.0, 16.0, 18.0, 10.0, 23.0, 25.0, 46.0, 32.0, 35.0, 50.0, 58.0, 58.0, 55.0, 48.0, 58.0, 72.0, 57.0, 51.0, 46.0, 44.0, 30.0, 24.0, 29.0, 21.0, 13.0, 16.0, 8.0, 6.0, 4.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.20703125, -5.05120849609375, -4.8953857421875, -4.73956298828125, -4.583740234375, -4.42791748046875, -4.2720947265625, -4.11627197265625, -3.96044921875, -3.80462646484375, -3.6488037109375, -3.49298095703125, -3.337158203125, -3.18133544921875, -3.0255126953125, -2.86968994140625, -2.7138671875, -2.55804443359375, -2.4022216796875, -2.24639892578125, -2.090576171875, -1.93475341796875, -1.7789306640625, -1.62310791015625, -1.46728515625, -1.31146240234375, -1.1556396484375, -0.99981689453125, -0.843994140625, -0.68817138671875, -0.5323486328125, -0.37652587890625, -0.220703125, -0.06488037109375, 0.0909423828125, 0.24676513671875, 0.402587890625, 0.55841064453125, 0.7142333984375, 0.87005615234375, 1.02587890625, 1.18170166015625, 1.3375244140625, 1.49334716796875, 1.649169921875, 1.80499267578125, 1.9608154296875, 2.11663818359375, 2.2724609375, 2.42828369140625, 2.5841064453125, 2.73992919921875, 2.895751953125, 3.05157470703125, 3.2073974609375, 3.36322021484375, 3.51904296875, 3.67486572265625, 3.8306884765625, 3.98651123046875, 4.142333984375, 4.29815673828125, 4.4539794921875, 4.60980224609375, 4.765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 0.0, 4.0, 12.0, 12.0, 11.0, 17.0, 29.0, 35.0, 58.0, 80.0, 148.0, 215.0, 336.0, 608.0, 1192.0, 2251.0, 5011.0, 12079.0, 35059.0, 122933.0, 419672.0, 320874.0, 85208.0, 25320.0, 9343.0, 3864.0, 1811.0, 939.0, 529.0, 353.0, 182.0, 119.0, 71.0, 61.0, 29.0, 24.0, 22.0, 14.0, 12.0, 4.0, 4.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.72265625, -2.634429931640625, -2.54620361328125, -2.457977294921875, -2.3697509765625, -2.281524658203125, -2.19329833984375, -2.105072021484375, -2.016845703125, -1.928619384765625, -1.84039306640625, -1.752166748046875, -1.6639404296875, -1.575714111328125, -1.48748779296875, -1.399261474609375, -1.31103515625, -1.222808837890625, -1.13458251953125, -1.046356201171875, -0.9581298828125, -0.869903564453125, -0.78167724609375, -0.693450927734375, -0.605224609375, -0.516998291015625, -0.42877197265625, -0.340545654296875, -0.2523193359375, -0.164093017578125, -0.07586669921875, 0.012359619140625, 0.1005859375, 0.188812255859375, 0.27703857421875, 0.365264892578125, 0.4534912109375, 0.541717529296875, 0.62994384765625, 0.718170166015625, 0.806396484375, 0.894622802734375, 0.98284912109375, 1.071075439453125, 1.1593017578125, 1.247528076171875, 1.33575439453125, 1.423980712890625, 1.51220703125, 1.600433349609375, 1.68865966796875, 1.776885986328125, 1.8651123046875, 1.953338623046875, 2.04156494140625, 2.129791259765625, 2.218017578125, 2.306243896484375, 2.39447021484375, 2.482696533203125, 2.5709228515625, 2.659149169921875, 2.74737548828125, 2.835601806640625, 2.923828125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 3.0, 2.0, 3.0, 5.0, 8.0, 9.0, 12.0, 12.0, 17.0, 7.0, 25.0, 23.0, 32.0, 42.0, 48.0, 61.0, 90.0, 93.0, 108.0, 86.0, 71.0, 45.0, 37.0, 32.0, 27.0, 21.0, 24.0, 9.0, 11.0, 7.0, 13.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0005168914794921875, -0.0005032531917095184, -0.0004896149039268494, -0.0004759766161441803, -0.00046233832836151123, -0.00044870004057884216, -0.0004350617527961731, -0.00042142346501350403, -0.00040778517723083496, -0.0003941468894481659, -0.0003805086016654968, -0.00036687031388282776, -0.0003532320261001587, -0.0003395937383174896, -0.00032595545053482056, -0.0003123171627521515, -0.0002986788749694824, -0.00028504058718681335, -0.0002714022994041443, -0.0002577640116214752, -0.00024412572383880615, -0.00023048743605613708, -0.00021684914827346802, -0.00020321086049079895, -0.00018957257270812988, -0.00017593428492546082, -0.00016229599714279175, -0.00014865770936012268, -0.0001350194215774536, -0.00012138113379478455, -0.00010774284601211548, -9.410455822944641e-05, -8.046627044677734e-05, -6.682798266410828e-05, -5.318969488143921e-05, -3.955140709877014e-05, -2.5913119316101074e-05, -1.2274831533432007e-05, 1.3634562492370605e-06, 1.5001744031906128e-05, 2.8640031814575195e-05, 4.227831959724426e-05, 5.591660737991333e-05, 6.95548951625824e-05, 8.319318294525146e-05, 9.683147072792053e-05, 0.0001104697585105896, 0.00012410804629325867, 0.00013774633407592773, 0.0001513846218585968, 0.00016502290964126587, 0.00017866119742393494, 0.000192299485206604, 0.00020593777298927307, 0.00021957606077194214, 0.0002332143485546112, 0.0002468526363372803, 0.00026049092411994934, 0.0002741292119026184, 0.0002877674996852875, 0.00030140578746795654, 0.0003150440752506256, 0.0003286823630332947, 0.00034232065081596375, 0.0003559589385986328]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 11.0, 14.0, 18.0, 32.0, 44.0, 49.0, 100.0, 178.0, 327.0, 588.0, 1255.0, 2924.0, 7791.0, 27493.0, 144223.0, 637760.0, 178929.0, 31812.0, 9081.0, 3166.0, 1307.0, 614.0, 313.0, 195.0, 118.0, 68.0, 47.0, 31.0, 20.0, 6.0, 9.0, 4.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.22265625, -4.07977294921875, -3.9368896484375, -3.79400634765625, -3.651123046875, -3.50823974609375, -3.3653564453125, -3.22247314453125, -3.07958984375, -2.93670654296875, -2.7938232421875, -2.65093994140625, -2.508056640625, -2.36517333984375, -2.2222900390625, -2.07940673828125, -1.9365234375, -1.79364013671875, -1.6507568359375, -1.50787353515625, -1.364990234375, -1.22210693359375, -1.0792236328125, -0.93634033203125, -0.79345703125, -0.65057373046875, -0.5076904296875, -0.36480712890625, -0.221923828125, -0.07904052734375, 0.0638427734375, 0.20672607421875, 0.349609375, 0.49249267578125, 0.6353759765625, 0.77825927734375, 0.921142578125, 1.06402587890625, 1.2069091796875, 1.34979248046875, 1.49267578125, 1.63555908203125, 1.7784423828125, 1.92132568359375, 2.064208984375, 2.20709228515625, 2.3499755859375, 2.49285888671875, 2.6357421875, 2.77862548828125, 2.9215087890625, 3.06439208984375, 3.207275390625, 3.35015869140625, 3.4930419921875, 3.63592529296875, 3.77880859375, 3.92169189453125, 4.0645751953125, 4.20745849609375, 4.350341796875, 4.49322509765625, 4.6361083984375, 4.77899169921875, 4.921875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 9.0, 2.0, 8.0, 5.0, 8.0, 8.0, 12.0, 16.0, 17.0, 28.0, 38.0, 39.0, 66.0, 70.0, 97.0, 102.0, 95.0, 80.0, 72.0, 43.0, 34.0, 43.0, 24.0, 14.0, 16.0, 8.0, 9.0, 9.0, 9.0, 4.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.51171875, -2.4326171875, -2.353515625, -2.2744140625, -2.1953125, -2.1162109375, -2.037109375, -1.9580078125, -1.87890625, -1.7998046875, -1.720703125, -1.6416015625, -1.5625, -1.4833984375, -1.404296875, -1.3251953125, -1.24609375, -1.1669921875, -1.087890625, -1.0087890625, -0.9296875, -0.8505859375, -0.771484375, -0.6923828125, -0.61328125, -0.5341796875, -0.455078125, -0.3759765625, -0.296875, -0.2177734375, -0.138671875, -0.0595703125, 0.01953125, 0.0986328125, 0.177734375, 0.2568359375, 0.3359375, 0.4150390625, 0.494140625, 0.5732421875, 0.65234375, 0.7314453125, 0.810546875, 0.8896484375, 0.96875, 1.0478515625, 1.126953125, 1.2060546875, 1.28515625, 1.3642578125, 1.443359375, 1.5224609375, 1.6015625, 1.6806640625, 1.759765625, 1.8388671875, 1.91796875, 1.9970703125, 2.076171875, 2.1552734375, 2.234375, 2.3134765625, 2.392578125, 2.4716796875, 2.55078125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 9.0, 13.0, 29.0, 44.0, 80.0, 121.0, 154.0, 174.0, 142.0, 100.0, 64.0, 30.0, 16.0, 7.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.46819305419922, -37.9037971496582, -36.33939743041992, -34.775001525878906, -33.21060562133789, -31.64620590209961, -30.081809997558594, -28.517412185668945, -26.953014373779297, -25.38861656188965, -23.824220657348633, -22.259822845458984, -20.695425033569336, -19.131027221679688, -17.566631317138672, -16.002233505249023, -14.437837600708008, -12.873440742492676, -11.309042930603027, -9.744646072387695, -8.180248260498047, -6.615851402282715, -5.051454544067383, -3.4870567321777344, -1.9226598739624023, -0.35826265811920166, 1.206134557723999, 2.77053165435791, 4.3349289894104, 5.899326324462891, 7.463723182678223, 9.028120994567871, 10.592517852783203, 12.156914710998535, 13.721312522888184, 15.285709381103516, 16.850107192993164, 18.414505004882812, 19.978900909423828, 21.543298721313477, 23.107696533203125, 24.672094345092773, 26.23649024963379, 27.800888061523438, 29.365285873413086, 30.929683685302734, 32.49407958984375, 34.05847930908203, 35.62287139892578, 37.1872673034668, 38.75166702270508, 40.316062927246094, 41.88045883178711, 43.44485855102539, 45.009254455566406, 46.57365417480469, 48.1380500793457, 49.70244598388672, 51.266845703125, 52.831241607666016, 54.39563751220703, 55.96003723144531, 57.52443313598633, 59.088829040527344, 60.653228759765625]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 7.0, 18.0, 12.0, 7.0, 20.0, 30.0, 24.0, 31.0, 49.0, 44.0, 64.0, 69.0, 61.0, 64.0, 59.0, 68.0, 62.0, 53.0, 47.0, 51.0, 30.0, 27.0, 29.0, 20.0, 17.0, 13.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.771833419799805, -26.622455596923828, -25.473079681396484, -24.323701858520508, -23.17432403564453, -22.024948120117188, -20.87557029724121, -19.726192474365234, -18.57681655883789, -17.427438735961914, -16.27806282043457, -15.128684997558594, -13.979308128356934, -12.829931259155273, -11.680553436279297, -10.531176567077637, -9.381799697875977, -8.232422828674316, -7.083045482635498, -5.93366813659668, -4.7842912673950195, -3.6349143981933594, -2.485537052154541, -1.3361597061157227, -0.1867828369140625, 0.9625942707061768, 2.111971378326416, 3.2613484859466553, 4.4107255935668945, 5.560102462768555, 6.709479808807373, 7.858857154846191, 9.008232116699219, 10.157608985900879, 11.306985855102539, 12.456363677978516, 13.605740547180176, 14.755117416381836, 15.904495239257812, 17.053871154785156, 18.203248977661133, 19.35262680053711, 20.502002716064453, 21.65138053894043, 22.800758361816406, 23.95013427734375, 25.099512100219727, 26.248889923095703, 27.398265838623047, 28.547643661499023, 29.697019577026367, 30.846397399902344, 31.995773315429688, 33.14514923095703, 34.29452896118164, 35.443904876708984, 36.593284606933594, 37.74266052246094, 38.89204025268555, 40.04141616821289, 41.190792083740234, 42.340171813964844, 43.48954772949219, 44.63892364501953, 45.788299560546875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 10.0, 20.0, 34.0, 48.0, 77.0, 114.0, 219.0, 323.0, 691.0, 1302.0, 2810.0, 6623.0, 17270.0, 58354.0, 409739.0, 3519601.0, 128209.0, 30280.0, 10318.0, 4221.0, 1939.0, 903.0, 475.0, 282.0, 159.0, 87.0, 56.0, 27.0, 32.0, 8.0, 16.0, 11.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.74945068359375, -4.5535888671875, -4.35772705078125, -4.161865234375, -3.96600341796875, -3.7701416015625, -3.57427978515625, -3.37841796875, -3.18255615234375, -2.9866943359375, -2.79083251953125, -2.594970703125, -2.39910888671875, -2.2032470703125, -2.00738525390625, -1.8115234375, -1.61566162109375, -1.4197998046875, -1.22393798828125, -1.028076171875, -0.83221435546875, -0.6363525390625, -0.44049072265625, -0.24462890625, -0.04876708984375, 0.1470947265625, 0.34295654296875, 0.538818359375, 0.73468017578125, 0.9305419921875, 1.12640380859375, 1.322265625, 1.51812744140625, 1.7139892578125, 1.90985107421875, 2.105712890625, 2.30157470703125, 2.4974365234375, 2.69329833984375, 2.88916015625, 3.08502197265625, 3.2808837890625, 3.47674560546875, 3.672607421875, 3.86846923828125, 4.0643310546875, 4.26019287109375, 4.4560546875, 4.65191650390625, 4.8477783203125, 5.04364013671875, 5.239501953125, 5.43536376953125, 5.6312255859375, 5.82708740234375, 6.02294921875, 6.21881103515625, 6.4146728515625, 6.61053466796875, 6.806396484375, 7.00225830078125, 7.1981201171875, 7.39398193359375, 7.58984375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 5.0, 12.0, 22.0, 16.0, 26.0, 34.0, 51.0, 65.0, 75.0, 79.0, 82.0, 87.0, 67.0, 78.0, 70.0, 54.0, 45.0, 36.0, 26.0, 25.0, 17.0, 11.0, 4.0, 5.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8486328125, -0.810791015625, -0.77294921875, -0.735107421875, -0.697265625, -0.659423828125, -0.62158203125, -0.583740234375, -0.5458984375, -0.508056640625, -0.47021484375, -0.432373046875, -0.39453125, -0.356689453125, -0.31884765625, -0.281005859375, -0.2431640625, -0.205322265625, -0.16748046875, -0.129638671875, -0.091796875, -0.053955078125, -0.01611328125, 0.021728515625, 0.0595703125, 0.097412109375, 0.13525390625, 0.173095703125, 0.2109375, 0.248779296875, 0.28662109375, 0.324462890625, 0.3623046875, 0.400146484375, 0.43798828125, 0.475830078125, 0.513671875, 0.551513671875, 0.58935546875, 0.627197265625, 0.6650390625, 0.702880859375, 0.74072265625, 0.778564453125, 0.81640625, 0.854248046875, 0.89208984375, 0.929931640625, 0.9677734375, 1.005615234375, 1.04345703125, 1.081298828125, 1.119140625, 1.156982421875, 1.19482421875, 1.232666015625, 1.2705078125, 1.308349609375, 1.34619140625, 1.384033203125, 1.421875, 1.459716796875, 1.49755859375, 1.535400390625, 1.5732421875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 17.0, 16.0, 17.0, 28.0, 86.0, 140.0, 238.0, 491.0, 890.0, 2167.0, 5132.0, 14728.0, 59091.0, 472153.0, 3436982.0, 157739.0, 29561.0, 8811.0, 3201.0, 1415.0, 683.0, 342.0, 174.0, 68.0, 41.0, 26.0, 15.0, 13.0, 2.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.3359375, -8.08544921875, -7.8349609375, -7.58447265625, -7.333984375, -7.08349609375, -6.8330078125, -6.58251953125, -6.33203125, -6.08154296875, -5.8310546875, -5.58056640625, -5.330078125, -5.07958984375, -4.8291015625, -4.57861328125, -4.328125, -4.07763671875, -3.8271484375, -3.57666015625, -3.326171875, -3.07568359375, -2.8251953125, -2.57470703125, -2.32421875, -2.07373046875, -1.8232421875, -1.57275390625, -1.322265625, -1.07177734375, -0.8212890625, -0.57080078125, -0.3203125, -0.06982421875, 0.1806640625, 0.43115234375, 0.681640625, 0.93212890625, 1.1826171875, 1.43310546875, 1.68359375, 1.93408203125, 2.1845703125, 2.43505859375, 2.685546875, 2.93603515625, 3.1865234375, 3.43701171875, 3.6875, 3.93798828125, 4.1884765625, 4.43896484375, 4.689453125, 4.93994140625, 5.1904296875, 5.44091796875, 5.69140625, 5.94189453125, 6.1923828125, 6.44287109375, 6.693359375, 6.94384765625, 7.1943359375, 7.44482421875, 7.6953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 8.0, 7.0, 15.0, 20.0, 24.0, 49.0, 35.0, 59.0, 106.0, 160.0, 381.0, 1519.0, 1006.0, 243.0, 139.0, 82.0, 56.0, 45.0, 24.0, 20.0, 16.0, 12.0, 7.0, 5.0, 7.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.212890625, -2.1512451171875, -2.089599609375, -2.0279541015625, -1.96630859375, -1.9046630859375, -1.843017578125, -1.7813720703125, -1.7197265625, -1.6580810546875, -1.596435546875, -1.5347900390625, -1.47314453125, -1.4114990234375, -1.349853515625, -1.2882080078125, -1.2265625, -1.1649169921875, -1.103271484375, -1.0416259765625, -0.97998046875, -0.9183349609375, -0.856689453125, -0.7950439453125, -0.7333984375, -0.6717529296875, -0.610107421875, -0.5484619140625, -0.48681640625, -0.4251708984375, -0.363525390625, -0.3018798828125, -0.240234375, -0.1785888671875, -0.116943359375, -0.0552978515625, 0.00634765625, 0.0679931640625, 0.129638671875, 0.1912841796875, 0.2529296875, 0.3145751953125, 0.376220703125, 0.4378662109375, 0.49951171875, 0.5611572265625, 0.622802734375, 0.6844482421875, 0.74609375, 0.8077392578125, 0.869384765625, 0.9310302734375, 0.99267578125, 1.0543212890625, 1.115966796875, 1.1776123046875, 1.2392578125, 1.3009033203125, 1.362548828125, 1.4241943359375, 1.48583984375, 1.5474853515625, 1.609130859375, 1.6707763671875, 1.732421875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 11.0, 26.0, 96.0, 252.0, 334.0, 189.0, 72.0, 21.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.54802322387695, -51.565025329589844, -50.582027435302734, -49.599029541015625, -48.61602783203125, -47.63302993774414, -46.65003204345703, -45.66703414916992, -44.68403625488281, -43.7010383605957, -42.718040466308594, -41.73503875732422, -40.75204086303711, -39.76904296875, -38.78604507446289, -37.80304718017578, -36.820045471191406, -35.8370475769043, -34.85404968261719, -33.87104797363281, -32.8880500793457, -31.905052185058594, -30.922054290771484, -29.939056396484375, -28.956058502197266, -27.973060607910156, -26.990060806274414, -26.007062911987305, -25.024065017700195, -24.041065216064453, -23.058067321777344, -22.075069427490234, -21.092071533203125, -20.109073638916016, -19.126073837280273, -18.143075942993164, -17.160078048706055, -16.177078247070312, -15.194080352783203, -14.211082458496094, -13.228083610534668, -12.245084762573242, -11.262086868286133, -10.279088020324707, -9.296089172363281, -8.313091278076172, -7.330092430114746, -6.3470940589904785, -5.364095687866211, -4.381097316741943, -3.3980987071990967, -2.41510009765625, -1.4321017265319824, -0.44910335540771484, 0.5338954925537109, 1.5168938636779785, 2.499892234802246, 3.4828906059265137, 4.465888977050781, 5.448887825012207, 6.431886196136475, 7.414884567260742, 8.397883415222168, 9.380882263183594, 10.363880157470703]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 6.0, 5.0, 14.0, 11.0, 15.0, 14.0, 24.0, 32.0, 39.0, 40.0, 51.0, 55.0, 60.0, 71.0, 56.0, 54.0, 59.0, 53.0, 59.0, 49.0, 35.0, 40.0, 36.0, 31.0, 25.0, 18.0, 18.0, 8.0, 7.0, 4.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.801284790039062, -9.525372505187988, -9.249460220336914, -8.97354793548584, -8.697635650634766, -8.421724319458008, -8.145811080932617, -7.869899272918701, -7.593987464904785, -7.318075180053711, -7.042162895202637, -6.7662506103515625, -6.4903388023376465, -6.214426517486572, -5.938514232635498, -5.662601947784424, -5.38668966293335, -5.110777378082275, -4.834865093231201, -4.558953285217285, -4.283041000366211, -4.007128715515137, -3.7312164306640625, -3.4553041458129883, -3.179392099380493, -2.903479814529419, -2.627567768096924, -2.3516554832458496, -2.0757431983947754, -1.7998311519622803, -1.523918867111206, -1.2480067014694214, -0.9720945358276367, -0.696182370185852, -0.4202701449394226, -0.14435791969299316, 0.1315542459487915, 0.40746641159057617, 0.6833786964416504, 0.9592908620834351, 1.2352030277252197, 1.5111151933670044, 1.787027359008789, 2.0629396438598633, 2.3388519287109375, 2.6147639751434326, 2.890676259994507, 3.166588306427002, 3.442500591278076, 3.7184128761291504, 3.9943249225616455, 4.270236968994141, 4.546149253845215, 4.822061538696289, 5.097973823547363, 5.3738861083984375, 5.649798393249512, 5.925710678100586, 6.20162296295166, 6.477535247802734, 6.75344705581665, 7.029359340667725, 7.305271625518799, 7.581183910369873, 7.857095718383789]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 3.0, 8.0, 7.0, 11.0, 21.0, 14.0, 23.0, 44.0, 64.0, 98.0, 152.0, 200.0, 309.0, 477.0, 804.0, 1375.0, 2456.0, 4414.0, 8327.0, 15926.0, 31648.0, 62170.0, 120536.0, 216798.0, 252514.0, 158550.0, 83411.0, 42273.0, 21273.0, 11083.0, 5907.0, 3103.0, 1817.0, 1008.0, 623.0, 386.0, 226.0, 154.0, 111.0, 67.0, 57.0, 27.0, 27.0, 18.0, 9.0, 4.0, 7.0, 5.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.90234375, -2.812255859375, -2.72216796875, -2.632080078125, -2.5419921875, -2.451904296875, -2.36181640625, -2.271728515625, -2.181640625, -2.091552734375, -2.00146484375, -1.911376953125, -1.8212890625, -1.731201171875, -1.64111328125, -1.551025390625, -1.4609375, -1.370849609375, -1.28076171875, -1.190673828125, -1.1005859375, -1.010498046875, -0.92041015625, -0.830322265625, -0.740234375, -0.650146484375, -0.56005859375, -0.469970703125, -0.3798828125, -0.289794921875, -0.19970703125, -0.109619140625, -0.01953125, 0.070556640625, 0.16064453125, 0.250732421875, 0.3408203125, 0.430908203125, 0.52099609375, 0.611083984375, 0.701171875, 0.791259765625, 0.88134765625, 0.971435546875, 1.0615234375, 1.151611328125, 1.24169921875, 1.331787109375, 1.421875, 1.511962890625, 1.60205078125, 1.692138671875, 1.7822265625, 1.872314453125, 1.96240234375, 2.052490234375, 2.142578125, 2.232666015625, 2.32275390625, 2.412841796875, 2.5029296875, 2.593017578125, 2.68310546875, 2.773193359375, 2.86328125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 13.0, 6.0, 14.0, 19.0, 19.0, 11.0, 25.0, 26.0, 44.0, 44.0, 64.0, 45.0, 63.0, 63.0, 61.0, 70.0, 70.0, 57.0, 51.0, 41.0, 39.0, 32.0, 27.0, 20.0, 14.0, 20.0, 14.0, 16.0, 2.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.98388671875, -0.9535598754882812, -0.9232330322265625, -0.8929061889648438, -0.862579345703125, -0.8322525024414062, -0.8019256591796875, -0.7715988159179688, -0.74127197265625, -0.7109451293945312, -0.6806182861328125, -0.6502914428710938, -0.619964599609375, -0.5896377563476562, -0.5593109130859375, -0.5289840698242188, -0.4986572265625, -0.46833038330078125, -0.4380035400390625, -0.40767669677734375, -0.377349853515625, -0.34702301025390625, -0.3166961669921875, -0.28636932373046875, -0.25604248046875, -0.22571563720703125, -0.1953887939453125, -0.16506195068359375, -0.134735107421875, -0.10440826416015625, -0.0740814208984375, -0.04375457763671875, -0.013427734375, 0.01689910888671875, 0.0472259521484375, 0.07755279541015625, 0.107879638671875, 0.13820648193359375, 0.1685333251953125, 0.19886016845703125, 0.22918701171875, 0.25951385498046875, 0.2898406982421875, 0.32016754150390625, 0.350494384765625, 0.38082122802734375, 0.4111480712890625, 0.44147491455078125, 0.4718017578125, 0.5021286010742188, 0.5324554443359375, 0.5627822875976562, 0.593109130859375, 0.6234359741210938, 0.6537628173828125, 0.6840896606445312, 0.71441650390625, 0.7447433471679688, 0.7750701904296875, 0.8053970336914062, 0.835723876953125, 0.8660507202148438, 0.8963775634765625, 0.9267044067382812, 0.95703125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 9.0, 7.0, 10.0, 13.0, 18.0, 27.0, 47.0, 43.0, 55.0, 89.0, 109.0, 183.0, 265.0, 425.0, 762.0, 1508.0, 3535.0, 9429.0, 28657.0, 100806.0, 343636.0, 387697.0, 118982.0, 33810.0, 10661.0, 3805.0, 1717.0, 838.0, 452.0, 285.0, 209.0, 130.0, 82.0, 68.0, 55.0, 30.0, 20.0, 25.0, 10.0, 9.0, 4.0, 3.0, 8.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0], "bins": [-6.13671875, -5.966552734375, -5.79638671875, -5.626220703125, -5.4560546875, -5.285888671875, -5.11572265625, -4.945556640625, -4.775390625, -4.605224609375, -4.43505859375, -4.264892578125, -4.0947265625, -3.924560546875, -3.75439453125, -3.584228515625, -3.4140625, -3.243896484375, -3.07373046875, -2.903564453125, -2.7333984375, -2.563232421875, -2.39306640625, -2.222900390625, -2.052734375, -1.882568359375, -1.71240234375, -1.542236328125, -1.3720703125, -1.201904296875, -1.03173828125, -0.861572265625, -0.69140625, -0.521240234375, -0.35107421875, -0.180908203125, -0.0107421875, 0.159423828125, 0.32958984375, 0.499755859375, 0.669921875, 0.840087890625, 1.01025390625, 1.180419921875, 1.3505859375, 1.520751953125, 1.69091796875, 1.861083984375, 2.03125, 2.201416015625, 2.37158203125, 2.541748046875, 2.7119140625, 2.882080078125, 3.05224609375, 3.222412109375, 3.392578125, 3.562744140625, 3.73291015625, 3.903076171875, 4.0732421875, 4.243408203125, 4.41357421875, 4.583740234375, 4.75390625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 3.0, 7.0, 9.0, 10.0, 7.0, 14.0, 15.0, 19.0, 19.0, 24.0, 25.0, 29.0, 25.0, 32.0, 27.0, 41.0, 32.0, 44.0, 49.0, 45.0, 52.0, 55.0, 43.0, 47.0, 42.0, 37.0, 35.0, 33.0, 20.0, 29.0, 22.0, 25.0, 14.0, 15.0, 15.0, 11.0, 5.0, 6.0, 6.0, 2.0, 1.0, 3.0, 6.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5859375, -3.470367431640625, -3.35479736328125, -3.239227294921875, -3.1236572265625, -3.008087158203125, -2.89251708984375, -2.776947021484375, -2.661376953125, -2.545806884765625, -2.43023681640625, -2.314666748046875, -2.1990966796875, -2.083526611328125, -1.96795654296875, -1.852386474609375, -1.73681640625, -1.621246337890625, -1.50567626953125, -1.390106201171875, -1.2745361328125, -1.158966064453125, -1.04339599609375, -0.927825927734375, -0.812255859375, -0.696685791015625, -0.58111572265625, -0.465545654296875, -0.3499755859375, -0.234405517578125, -0.11883544921875, -0.003265380859375, 0.1123046875, 0.227874755859375, 0.34344482421875, 0.459014892578125, 0.5745849609375, 0.690155029296875, 0.80572509765625, 0.921295166015625, 1.036865234375, 1.152435302734375, 1.26800537109375, 1.383575439453125, 1.4991455078125, 1.614715576171875, 1.73028564453125, 1.845855712890625, 1.96142578125, 2.076995849609375, 2.19256591796875, 2.308135986328125, 2.4237060546875, 2.539276123046875, 2.65484619140625, 2.770416259765625, 2.885986328125, 3.001556396484375, 3.11712646484375, 3.232696533203125, 3.3482666015625, 3.463836669921875, 3.57940673828125, 3.694976806640625, 3.810546875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 13.0, 13.0, 32.0, 56.0, 103.0, 310.0, 853.0, 3460.0, 21421.0, 400318.0, 586187.0, 29796.0, 4289.0, 1090.0, 315.0, 137.0, 51.0, 39.0, 17.0, 16.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87890625, -6.6708984375, -6.462890625, -6.2548828125, -6.046875, -5.8388671875, -5.630859375, -5.4228515625, -5.21484375, -5.0068359375, -4.798828125, -4.5908203125, -4.3828125, -4.1748046875, -3.966796875, -3.7587890625, -3.55078125, -3.3427734375, -3.134765625, -2.9267578125, -2.71875, -2.5107421875, -2.302734375, -2.0947265625, -1.88671875, -1.6787109375, -1.470703125, -1.2626953125, -1.0546875, -0.8466796875, -0.638671875, -0.4306640625, -0.22265625, -0.0146484375, 0.193359375, 0.4013671875, 0.609375, 0.8173828125, 1.025390625, 1.2333984375, 1.44140625, 1.6494140625, 1.857421875, 2.0654296875, 2.2734375, 2.4814453125, 2.689453125, 2.8974609375, 3.10546875, 3.3134765625, 3.521484375, 3.7294921875, 3.9375, 4.1455078125, 4.353515625, 4.5615234375, 4.76953125, 4.9775390625, 5.185546875, 5.3935546875, 5.6015625, 5.8095703125, 6.017578125, 6.2255859375, 6.43359375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 6.0, 6.0, 8.0, 5.0, 7.0, 21.0, 27.0, 27.0, 34.0, 50.0, 67.0, 102.0, 140.0, 153.0, 89.0, 54.0, 49.0, 43.0, 28.0, 23.0, 22.0, 13.0, 9.0, 5.0, 3.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000614166259765625, -0.0005955100059509277, -0.0005768537521362305, -0.0005581974983215332, -0.0005395412445068359, -0.0005208849906921387, -0.0005022287368774414, -0.00048357248306274414, -0.0004649162292480469, -0.0004462599754333496, -0.00042760372161865234, -0.0004089474678039551, -0.0003902912139892578, -0.00037163496017456055, -0.0003529787063598633, -0.000334322452545166, -0.00031566619873046875, -0.0002970099449157715, -0.0002783536911010742, -0.00025969743728637695, -0.0002410411834716797, -0.00022238492965698242, -0.00020372867584228516, -0.0001850724220275879, -0.00016641616821289062, -0.00014775991439819336, -0.0001291036605834961, -0.00011044740676879883, -9.179115295410156e-05, -7.31348991394043e-05, -5.447864532470703e-05, -3.5822391510009766e-05, -1.71661376953125e-05, 1.4901161193847656e-06, 2.014636993408203e-05, 3.88026237487793e-05, 5.745887756347656e-05, 7.611513137817383e-05, 9.47713851928711e-05, 0.00011342763900756836, 0.00013208389282226562, 0.0001507401466369629, 0.00016939640045166016, 0.00018805265426635742, 0.0002067089080810547, 0.00022536516189575195, 0.00024402141571044922, 0.0002626776695251465, 0.00028133392333984375, 0.000299990177154541, 0.0003186464309692383, 0.00033730268478393555, 0.0003559589385986328, 0.0003746151924133301, 0.00039327144622802734, 0.0004119277000427246, 0.0004305839538574219, 0.00044924020767211914, 0.0004678964614868164, 0.00048655271530151367, 0.0005052089691162109, 0.0005238652229309082, 0.0005425214767456055, 0.0005611777305603027, 0.000579833984375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 11.0, 5.0, 22.0, 18.0, 30.0, 50.0, 92.0, 166.0, 319.0, 874.0, 2382.0, 9421.0, 75327.0, 807401.0, 134386.0, 13092.0, 3081.0, 998.0, 419.0, 216.0, 104.0, 41.0, 26.0, 20.0, 19.0, 13.0, 10.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96875, -5.75250244140625, -5.5362548828125, -5.32000732421875, -5.103759765625, -4.88751220703125, -4.6712646484375, -4.45501708984375, -4.23876953125, -4.02252197265625, -3.8062744140625, -3.59002685546875, -3.373779296875, -3.15753173828125, -2.9412841796875, -2.72503662109375, -2.5087890625, -2.29254150390625, -2.0762939453125, -1.86004638671875, -1.643798828125, -1.42755126953125, -1.2113037109375, -0.99505615234375, -0.77880859375, -0.56256103515625, -0.3463134765625, -0.13006591796875, 0.086181640625, 0.30242919921875, 0.5186767578125, 0.73492431640625, 0.951171875, 1.16741943359375, 1.3836669921875, 1.59991455078125, 1.816162109375, 2.03240966796875, 2.2486572265625, 2.46490478515625, 2.68115234375, 2.89739990234375, 3.1136474609375, 3.32989501953125, 3.546142578125, 3.76239013671875, 3.9786376953125, 4.19488525390625, 4.4111328125, 4.62738037109375, 4.8436279296875, 5.05987548828125, 5.276123046875, 5.49237060546875, 5.7086181640625, 5.92486572265625, 6.14111328125, 6.35736083984375, 6.5736083984375, 6.78985595703125, 7.006103515625, 7.22235107421875, 7.4385986328125, 7.65484619140625, 7.87109375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 12.0, 9.0, 13.0, 20.0, 28.0, 39.0, 64.0, 76.0, 89.0, 107.0, 137.0, 120.0, 70.0, 61.0, 38.0, 35.0, 20.0, 12.0, 9.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.484375, -3.385040283203125, -3.28570556640625, -3.186370849609375, -3.0870361328125, -2.987701416015625, -2.88836669921875, -2.789031982421875, -2.689697265625, -2.590362548828125, -2.49102783203125, -2.391693115234375, -2.2923583984375, -2.193023681640625, -2.09368896484375, -1.994354248046875, -1.89501953125, -1.795684814453125, -1.69635009765625, -1.597015380859375, -1.4976806640625, -1.398345947265625, -1.29901123046875, -1.199676513671875, -1.100341796875, -1.001007080078125, -0.90167236328125, -0.802337646484375, -0.7030029296875, -0.603668212890625, -0.50433349609375, -0.404998779296875, -0.3056640625, -0.206329345703125, -0.10699462890625, -0.007659912109375, 0.0916748046875, 0.191009521484375, 0.29034423828125, 0.389678955078125, 0.489013671875, 0.588348388671875, 0.68768310546875, 0.787017822265625, 0.8863525390625, 0.985687255859375, 1.08502197265625, 1.184356689453125, 1.28369140625, 1.383026123046875, 1.48236083984375, 1.581695556640625, 1.6810302734375, 1.780364990234375, 1.87969970703125, 1.979034423828125, 2.078369140625, 2.177703857421875, 2.27703857421875, 2.376373291015625, 2.4757080078125, 2.575042724609375, 2.67437744140625, 2.773712158203125, 2.873046875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 19.0, 75.0, 163.0, 266.0, 276.0, 125.0, 46.0, 17.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.460166931152344, -47.91260528564453, -45.36503982543945, -42.817474365234375, -40.26991271972656, -37.72235107421875, -35.17478561401367, -32.627220153808594, -30.07965850830078, -27.532094955444336, -24.98453140258789, -22.436967849731445, -19.889404296875, -17.341840744018555, -14.79427719116211, -12.246713638305664, -9.699150085449219, -7.151586532592773, -4.604022979736328, -2.056459426879883, 0.4911041259765625, 3.038667678833008, 5.586231231689453, 8.133794784545898, 10.681358337402344, 13.228921890258789, 15.776485443115234, 18.32404899597168, 20.871612548828125, 23.41917610168457, 25.966739654541016, 28.51430320739746, 31.061874389648438, 33.60943603515625, 36.15700149536133, 38.704566955566406, 41.25212860107422, 43.79969024658203, 46.34725570678711, 48.89482116699219, 51.4423828125, 53.98994445800781, 56.53750991821289, 59.08507537841797, 61.63263702392578, 64.1801986694336, 66.72776794433594, 69.27532958984375, 71.82289123535156, 74.37045288085938, 76.91801452636719, 79.46558380126953, 82.01314544677734, 84.56070709228516, 87.1082763671875, 89.65583801269531, 92.20339965820312, 94.75096130371094, 97.29852294921875, 99.8460922241211, 102.3936538696289, 104.94121551513672, 107.48878479003906, 110.03634643554688, 112.58390808105469]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 0.0, 7.0, 7.0, 9.0, 8.0, 16.0, 16.0, 16.0, 24.0, 12.0, 23.0, 21.0, 20.0, 26.0, 25.0, 36.0, 42.0, 39.0, 40.0, 44.0, 39.0, 44.0, 45.0, 45.0, 37.0, 37.0, 33.0, 36.0, 37.0, 37.0, 20.0, 24.0, 19.0, 13.0, 21.0, 12.0, 17.0, 13.0, 10.0, 8.0, 9.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.275630950927734, -16.694604873657227, -16.113576889038086, -15.532549858093262, -14.951522827148438, -14.37049674987793, -13.789469718933105, -13.208442687988281, -12.627415657043457, -12.046388626098633, -11.465361595153809, -10.884334564208984, -10.303308486938477, -9.722280502319336, -9.141254425048828, -8.560227394104004, -7.97920036315918, -7.3981733322143555, -6.817146301269531, -6.236119747161865, -5.655092716217041, -5.074065685272217, -4.493039131164551, -3.9120121002197266, -3.3309850692749023, -2.749958038330078, -2.168931245803833, -1.5879043340682983, -1.0068774223327637, -0.42585039138793945, 0.15517640113830566, 0.7362031936645508, 1.3172321319580078, 1.8982590436935425, 2.479285955429077, 3.0603127479553223, 3.6413397789001465, 4.222366809844971, 4.803393363952637, 5.384420394897461, 5.965447425842285, 6.546474456787109, 7.127501487731934, 7.7085280418396, 8.289554595947266, 8.870582580566406, 9.451608657836914, 10.032635688781738, 10.613662719726562, 11.194689750671387, 11.775716781616211, 12.356743812561035, 12.93777084350586, 13.518796920776367, 14.099823951721191, 14.680850982666016, 15.26187801361084, 15.842905044555664, 16.423931121826172, 17.004959106445312, 17.58598518371582, 18.16701316833496, 18.74803924560547, 19.32906723022461, 19.910093307495117]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 6.0, 9.0, 9.0, 8.0, 15.0, 11.0, 32.0, 36.0, 40.0, 58.0, 77.0, 77.0, 130.0, 209.0, 317.0, 488.0, 841.0, 1296.0, 2344.0, 4173.0, 8411.0, 17907.0, 44169.0, 129179.0, 672952.0, 2945895.0, 243381.0, 70944.0, 26796.0, 11907.0, 5686.0, 2850.0, 1589.0, 878.0, 599.0, 363.0, 206.0, 127.0, 85.0, 58.0, 37.0, 30.0, 21.0, 14.0, 7.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-4.640625, -4.512542724609375, -4.38446044921875, -4.256378173828125, -4.1282958984375, -4.000213623046875, -3.87213134765625, -3.744049072265625, -3.615966796875, -3.487884521484375, -3.35980224609375, -3.231719970703125, -3.1036376953125, -2.975555419921875, -2.84747314453125, -2.719390869140625, -2.59130859375, -2.463226318359375, -2.33514404296875, -2.207061767578125, -2.0789794921875, -1.950897216796875, -1.82281494140625, -1.694732666015625, -1.566650390625, -1.438568115234375, -1.31048583984375, -1.182403564453125, -1.0543212890625, -0.926239013671875, -0.79815673828125, -0.670074462890625, -0.5419921875, -0.413909912109375, -0.28582763671875, -0.157745361328125, -0.0296630859375, 0.098419189453125, 0.22650146484375, 0.354583740234375, 0.482666015625, 0.610748291015625, 0.73883056640625, 0.866912841796875, 0.9949951171875, 1.123077392578125, 1.25115966796875, 1.379241943359375, 1.50732421875, 1.635406494140625, 1.76348876953125, 1.891571044921875, 2.0196533203125, 2.147735595703125, 2.27581787109375, 2.403900146484375, 2.531982421875, 2.660064697265625, 2.78814697265625, 2.916229248046875, 3.0443115234375, 3.172393798828125, 3.30047607421875, 3.428558349609375, 3.556640625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 3.0, 4.0, 7.0, 10.0, 11.0, 21.0, 30.0, 19.0, 36.0, 45.0, 47.0, 49.0, 50.0, 72.0, 69.0, 64.0, 77.0, 75.0, 49.0, 49.0, 44.0, 35.0, 25.0, 30.0, 28.0, 18.0, 11.0, 10.0, 5.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0732421875, -1.0409698486328125, -1.008697509765625, -0.9764251708984375, -0.94415283203125, -0.9118804931640625, -0.879608154296875, -0.8473358154296875, -0.8150634765625, -0.7827911376953125, -0.750518798828125, -0.7182464599609375, -0.68597412109375, -0.6537017822265625, -0.621429443359375, -0.5891571044921875, -0.556884765625, -0.5246124267578125, -0.492340087890625, -0.4600677490234375, -0.42779541015625, -0.3955230712890625, -0.363250732421875, -0.3309783935546875, -0.2987060546875, -0.2664337158203125, -0.234161376953125, -0.2018890380859375, -0.16961669921875, -0.1373443603515625, -0.105072021484375, -0.0727996826171875, -0.04052734375, -0.0082550048828125, 0.024017333984375, 0.0562896728515625, 0.08856201171875, 0.1208343505859375, 0.153106689453125, 0.1853790283203125, 0.2176513671875, 0.2499237060546875, 0.282196044921875, 0.3144683837890625, 0.34674072265625, 0.3790130615234375, 0.411285400390625, 0.4435577392578125, 0.475830078125, 0.5081024169921875, 0.540374755859375, 0.5726470947265625, 0.60491943359375, 0.6371917724609375, 0.669464111328125, 0.7017364501953125, 0.7340087890625, 0.7662811279296875, 0.798553466796875, 0.8308258056640625, 0.86309814453125, 0.8953704833984375, 0.927642822265625, 0.9599151611328125, 0.9921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 9.0, 15.0, 18.0, 33.0, 45.0, 82.0, 147.0, 421.0, 1751.0, 15356.0, 664980.0, 3471957.0, 35377.0, 3074.0, 619.0, 191.0, 83.0, 56.0, 24.0, 26.0, 6.0, 12.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.828125, -18.3590087890625, -17.889892578125, -17.4207763671875, -16.95166015625, -16.4825439453125, -16.013427734375, -15.5443115234375, -15.0751953125, -14.6060791015625, -14.136962890625, -13.6678466796875, -13.19873046875, -12.7296142578125, -12.260498046875, -11.7913818359375, -11.322265625, -10.8531494140625, -10.384033203125, -9.9149169921875, -9.44580078125, -8.9766845703125, -8.507568359375, -8.0384521484375, -7.5693359375, -7.1002197265625, -6.631103515625, -6.1619873046875, -5.69287109375, -5.2237548828125, -4.754638671875, -4.2855224609375, -3.81640625, -3.3472900390625, -2.878173828125, -2.4090576171875, -1.93994140625, -1.4708251953125, -1.001708984375, -0.5325927734375, -0.0634765625, 0.4056396484375, 0.874755859375, 1.3438720703125, 1.81298828125, 2.2821044921875, 2.751220703125, 3.2203369140625, 3.689453125, 4.1585693359375, 4.627685546875, 5.0968017578125, 5.56591796875, 6.0350341796875, 6.504150390625, 6.9732666015625, 7.4423828125, 7.9114990234375, 8.380615234375, 8.8497314453125, 9.31884765625, 9.7879638671875, 10.257080078125, 10.7261962890625, 11.1953125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 4.0, 14.0, 30.0, 40.0, 59.0, 96.0, 188.0, 369.0, 1215.0, 1192.0, 379.0, 198.0, 107.0, 64.0, 34.0, 34.0, 15.0, 14.0, 10.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.375, -4.273223876953125, -4.17144775390625, -4.069671630859375, -3.9678955078125, -3.866119384765625, -3.76434326171875, -3.662567138671875, -3.560791015625, -3.459014892578125, -3.35723876953125, -3.255462646484375, -3.1536865234375, -3.051910400390625, -2.95013427734375, -2.848358154296875, -2.74658203125, -2.644805908203125, -2.54302978515625, -2.441253662109375, -2.3394775390625, -2.237701416015625, -2.13592529296875, -2.034149169921875, -1.932373046875, -1.830596923828125, -1.72882080078125, -1.627044677734375, -1.5252685546875, -1.423492431640625, -1.32171630859375, -1.219940185546875, -1.1181640625, -1.016387939453125, -0.91461181640625, -0.812835693359375, -0.7110595703125, -0.609283447265625, -0.50750732421875, -0.405731201171875, -0.303955078125, -0.202178955078125, -0.10040283203125, 0.001373291015625, 0.1031494140625, 0.204925537109375, 0.30670166015625, 0.408477783203125, 0.51025390625, 0.612030029296875, 0.71380615234375, 0.815582275390625, 0.9173583984375, 1.019134521484375, 1.12091064453125, 1.222686767578125, 1.324462890625, 1.426239013671875, 1.52801513671875, 1.629791259765625, 1.7315673828125, 1.833343505859375, 1.93511962890625, 2.036895751953125, 2.138671875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 4.0, 2.0, 8.0, 8.0, 12.0, 31.0, 39.0, 44.0, 77.0, 122.0, 145.0, 137.0, 108.0, 85.0, 58.0, 44.0, 30.0, 18.0, 12.0, 8.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.884719848632812, -16.358734130859375, -15.83275032043457, -15.306764602661133, -14.780779838562012, -14.25479507446289, -13.72881031036377, -13.202825546264648, -12.676839828491211, -12.15085506439209, -11.624870300292969, -11.098884582519531, -10.57289981842041, -10.046915054321289, -9.520930290222168, -8.994945526123047, -8.468960762023926, -7.942975997924805, -7.416990756988525, -6.891005992889404, -6.365020751953125, -5.839035987854004, -5.313051223754883, -4.787066459655762, -4.261081218719482, -3.7350962162017822, -3.209111213684082, -2.683126449584961, -2.1571414470672607, -1.6311564445495605, -1.1051716804504395, -0.5791866779327393, -0.05320167541503906, 0.47278326749801636, 0.9987682104110718, 1.5247530937194824, 2.0507380962371826, 2.576723098754883, 3.102707862854004, 3.628692865371704, 4.154677867889404, 4.680662631988525, 5.206647872924805, 5.732632637023926, 6.258617401123047, 6.784602642059326, 7.310587406158447, 7.836572647094727, 8.362557411193848, 8.888542175292969, 9.41452693939209, 9.940511703491211, 10.466497421264648, 10.99248218536377, 11.51846694946289, 12.044451713562012, 12.570436477661133, 13.096421241760254, 13.622406005859375, 14.148391723632812, 14.674376487731934, 15.200361251831055, 15.726346015930176, 16.252330780029297, 16.778316497802734]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 6.0, 13.0, 14.0, 11.0, 19.0, 11.0, 24.0, 22.0, 30.0, 23.0, 30.0, 27.0, 31.0, 33.0, 40.0, 44.0, 44.0, 46.0, 32.0, 41.0, 44.0, 40.0, 39.0, 39.0, 26.0, 32.0, 26.0, 29.0, 28.0, 12.0, 17.0, 9.0, 20.0, 13.0, 14.0, 14.0, 5.0, 9.0, 10.0, 10.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.747694969177246, -7.513235092163086, -7.278774738311768, -7.044314384460449, -6.809854507446289, -6.575394630432129, -6.3409342765808105, -6.106473922729492, -5.872014045715332, -5.637554168701172, -5.4030938148498535, -5.168633460998535, -4.934173583984375, -4.699713706970215, -4.4652533531188965, -4.230792999267578, -3.996333122253418, -3.7618730068206787, -3.5274128913879395, -3.2929527759552, -3.058492660522461, -2.8240325450897217, -2.5895724296569824, -2.355112314224243, -2.120652198791504, -1.8861920833587646, -1.6517319679260254, -1.4172718524932861, -1.1828117370605469, -0.9483516216278076, -0.7138915061950684, -0.4794313907623291, -0.24497127532958984, -0.010511159896850586, 0.22394895553588867, 0.45840907096862793, 0.6928691864013672, 0.9273293018341064, 1.1617894172668457, 1.396249532699585, 1.6307096481323242, 1.8651697635650635, 2.0996298789978027, 2.334089994430542, 2.5685501098632812, 2.8030102252960205, 3.0374703407287598, 3.271930456161499, 3.5063905715942383, 3.7408506870269775, 3.975310802459717, 4.209771156311035, 4.444231033325195, 4.6786909103393555, 4.913151264190674, 5.147611618041992, 5.382071495056152, 5.6165313720703125, 5.850991725921631, 6.085452079772949, 6.319911956787109, 6.5543718338012695, 6.788832187652588, 7.023292541503906, 7.257752418518066]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 7.0, 11.0, 18.0, 20.0, 32.0, 43.0, 69.0, 114.0, 146.0, 207.0, 391.0, 751.0, 1303.0, 2831.0, 6292.0, 14483.0, 34826.0, 82047.0, 193761.0, 370832.0, 195199.0, 83445.0, 34991.0, 14572.0, 6101.0, 2840.0, 1341.0, 719.0, 446.0, 232.0, 168.0, 98.0, 62.0, 49.0, 22.0, 24.0, 19.0, 2.0, 7.0, 10.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-4.8984375, -4.7564697265625, -4.614501953125, -4.4725341796875, -4.33056640625, -4.1885986328125, -4.046630859375, -3.9046630859375, -3.7626953125, -3.6207275390625, -3.478759765625, -3.3367919921875, -3.19482421875, -3.0528564453125, -2.910888671875, -2.7689208984375, -2.626953125, -2.4849853515625, -2.343017578125, -2.2010498046875, -2.05908203125, -1.9171142578125, -1.775146484375, -1.6331787109375, -1.4912109375, -1.3492431640625, -1.207275390625, -1.0653076171875, -0.92333984375, -0.7813720703125, -0.639404296875, -0.4974365234375, -0.35546875, -0.2135009765625, -0.071533203125, 0.0704345703125, 0.21240234375, 0.3543701171875, 0.496337890625, 0.6383056640625, 0.7802734375, 0.9222412109375, 1.064208984375, 1.2061767578125, 1.34814453125, 1.4901123046875, 1.632080078125, 1.7740478515625, 1.916015625, 2.0579833984375, 2.199951171875, 2.3419189453125, 2.48388671875, 2.6258544921875, 2.767822265625, 2.9097900390625, 3.0517578125, 3.1937255859375, 3.335693359375, 3.4776611328125, 3.61962890625, 3.7615966796875, 3.903564453125, 4.0455322265625, 4.1875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 3.0, 4.0, 9.0, 8.0, 18.0, 19.0, 24.0, 28.0, 35.0, 37.0, 48.0, 42.0, 48.0, 66.0, 62.0, 71.0, 57.0, 60.0, 53.0, 50.0, 38.0, 47.0, 36.0, 21.0, 33.0, 22.0, 18.0, 10.0, 8.0, 9.0, 8.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0791015625, -1.0488662719726562, -1.0186309814453125, -0.9883956909179688, -0.958160400390625, -0.9279251098632812, -0.8976898193359375, -0.8674545288085938, -0.83721923828125, -0.8069839477539062, -0.7767486572265625, -0.7465133666992188, -0.716278076171875, -0.6860427856445312, -0.6558074951171875, -0.6255722045898438, -0.5953369140625, -0.5651016235351562, -0.5348663330078125, -0.5046310424804688, -0.474395751953125, -0.44416046142578125, -0.4139251708984375, -0.38368988037109375, -0.35345458984375, -0.32321929931640625, -0.2929840087890625, -0.26274871826171875, -0.232513427734375, -0.20227813720703125, -0.1720428466796875, -0.14180755615234375, -0.111572265625, -0.08133697509765625, -0.0511016845703125, -0.02086639404296875, 0.009368896484375, 0.03960418701171875, 0.0698394775390625, 0.10007476806640625, 0.13031005859375, 0.16054534912109375, 0.1907806396484375, 0.22101593017578125, 0.251251220703125, 0.28148651123046875, 0.3117218017578125, 0.34195709228515625, 0.3721923828125, 0.40242767333984375, 0.4326629638671875, 0.46289825439453125, 0.493133544921875, 0.5233688354492188, 0.5536041259765625, 0.5838394165039062, 0.61407470703125, 0.6443099975585938, 0.6745452880859375, 0.7047805786132812, 0.735015869140625, 0.7652511596679688, 0.7954864501953125, 0.8257217407226562, 0.85595703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 14.0, 12.0, 17.0, 21.0, 29.0, 38.0, 46.0, 86.0, 103.0, 165.0, 263.0, 503.0, 963.0, 1951.0, 4230.0, 10366.0, 28966.0, 86173.0, 266251.0, 423239.0, 146741.0, 48747.0, 17105.0, 6589.0, 2857.0, 1363.0, 653.0, 354.0, 214.0, 160.0, 81.0, 83.0, 46.0, 30.0, 21.0, 13.0, 18.0, 7.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-4.66796875, -4.5185546875, -4.369140625, -4.2197265625, -4.0703125, -3.9208984375, -3.771484375, -3.6220703125, -3.47265625, -3.3232421875, -3.173828125, -3.0244140625, -2.875, -2.7255859375, -2.576171875, -2.4267578125, -2.27734375, -2.1279296875, -1.978515625, -1.8291015625, -1.6796875, -1.5302734375, -1.380859375, -1.2314453125, -1.08203125, -0.9326171875, -0.783203125, -0.6337890625, -0.484375, -0.3349609375, -0.185546875, -0.0361328125, 0.11328125, 0.2626953125, 0.412109375, 0.5615234375, 0.7109375, 0.8603515625, 1.009765625, 1.1591796875, 1.30859375, 1.4580078125, 1.607421875, 1.7568359375, 1.90625, 2.0556640625, 2.205078125, 2.3544921875, 2.50390625, 2.6533203125, 2.802734375, 2.9521484375, 3.1015625, 3.2509765625, 3.400390625, 3.5498046875, 3.69921875, 3.8486328125, 3.998046875, 4.1474609375, 4.296875, 4.4462890625, 4.595703125, 4.7451171875, 4.89453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 10.0, 13.0, 5.0, 8.0, 13.0, 9.0, 17.0, 18.0, 11.0, 33.0, 19.0, 27.0, 36.0, 30.0, 46.0, 35.0, 40.0, 41.0, 45.0, 44.0, 38.0, 55.0, 42.0, 30.0, 31.0, 28.0, 36.0, 33.0, 35.0, 32.0, 21.0, 23.0, 18.0, 17.0, 13.0, 8.0, 8.0, 4.0, 5.0, 5.0, 0.0, 3.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.19921875, -3.08917236328125, -2.9791259765625, -2.86907958984375, -2.759033203125, -2.64898681640625, -2.5389404296875, -2.42889404296875, -2.31884765625, -2.20880126953125, -2.0987548828125, -1.98870849609375, -1.878662109375, -1.76861572265625, -1.6585693359375, -1.54852294921875, -1.4384765625, -1.32843017578125, -1.2183837890625, -1.10833740234375, -0.998291015625, -0.88824462890625, -0.7781982421875, -0.66815185546875, -0.55810546875, -0.44805908203125, -0.3380126953125, -0.22796630859375, -0.117919921875, -0.00787353515625, 0.1021728515625, 0.21221923828125, 0.322265625, 0.43231201171875, 0.5423583984375, 0.65240478515625, 0.762451171875, 0.87249755859375, 0.9825439453125, 1.09259033203125, 1.20263671875, 1.31268310546875, 1.4227294921875, 1.53277587890625, 1.642822265625, 1.75286865234375, 1.8629150390625, 1.97296142578125, 2.0830078125, 2.19305419921875, 2.3031005859375, 2.41314697265625, 2.523193359375, 2.63323974609375, 2.7432861328125, 2.85333251953125, 2.96337890625, 3.07342529296875, 3.1834716796875, 3.29351806640625, 3.403564453125, 3.51361083984375, 3.6236572265625, 3.73370361328125, 3.84375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 14.0, 15.0, 29.0, 44.0, 53.0, 106.0, 210.0, 400.0, 1003.0, 2939.0, 10772.0, 59893.0, 619788.0, 308896.0, 33794.0, 7201.0, 1938.0, 754.0, 287.0, 173.0, 91.0, 63.0, 31.0, 14.0, 15.0, 13.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.359375, -5.173583984375, -4.98779296875, -4.802001953125, -4.6162109375, -4.430419921875, -4.24462890625, -4.058837890625, -3.873046875, -3.687255859375, -3.50146484375, -3.315673828125, -3.1298828125, -2.944091796875, -2.75830078125, -2.572509765625, -2.38671875, -2.200927734375, -2.01513671875, -1.829345703125, -1.6435546875, -1.457763671875, -1.27197265625, -1.086181640625, -0.900390625, -0.714599609375, -0.52880859375, -0.343017578125, -0.1572265625, 0.028564453125, 0.21435546875, 0.400146484375, 0.5859375, 0.771728515625, 0.95751953125, 1.143310546875, 1.3291015625, 1.514892578125, 1.70068359375, 1.886474609375, 2.072265625, 2.258056640625, 2.44384765625, 2.629638671875, 2.8154296875, 3.001220703125, 3.18701171875, 3.372802734375, 3.55859375, 3.744384765625, 3.93017578125, 4.115966796875, 4.3017578125, 4.487548828125, 4.67333984375, 4.859130859375, 5.044921875, 5.230712890625, 5.41650390625, 5.602294921875, 5.7880859375, 5.973876953125, 6.15966796875, 6.345458984375, 6.53125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 9.0, 5.0, 14.0, 18.0, 23.0, 32.0, 46.0, 52.0, 124.0, 214.0, 161.0, 75.0, 50.0, 44.0, 19.0, 23.0, 17.0, 12.0, 14.0, 10.0, 5.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0008869171142578125, -0.0008633807301521301, -0.0008398443460464478, -0.0008163079619407654, -0.000792771577835083, -0.0007692351937294006, -0.0007456988096237183, -0.0007221624255180359, -0.0006986260414123535, -0.0006750896573066711, -0.0006515532732009888, -0.0006280168890953064, -0.000604480504989624, -0.0005809441208839417, -0.0005574077367782593, -0.0005338713526725769, -0.0005103349685668945, -0.00048679858446121216, -0.0004632622003555298, -0.0004397258162498474, -0.00041618943214416504, -0.00039265304803848267, -0.0003691166639328003, -0.0003455802798271179, -0.00032204389572143555, -0.0002985075116157532, -0.0002749711275100708, -0.00025143474340438843, -0.00022789835929870605, -0.00020436197519302368, -0.0001808255910873413, -0.00015728920698165894, -0.00013375282287597656, -0.00011021643877029419, -8.668005466461182e-05, -6.314367055892944e-05, -3.960728645324707e-05, -1.6070902347564697e-05, 7.465481758117676e-06, 3.100186586380005e-05, 5.453824996948242e-05, 7.80746340751648e-05, 0.00010161101818084717, 0.00012514740228652954, 0.00014868378639221191, 0.0001722201704978943, 0.00019575655460357666, 0.00021929293870925903, 0.0002428293228149414, 0.0002663657069206238, 0.00028990209102630615, 0.0003134384751319885, 0.0003369748592376709, 0.00036051124334335327, 0.00038404762744903564, 0.000407584011554718, 0.0004311203956604004, 0.00045465677976608276, 0.00047819316387176514, 0.0005017295479774475, 0.0005252659320831299, 0.0005488023161888123, 0.0005723387002944946, 0.000595875084400177, 0.0006194114685058594]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 4.0, 7.0, 4.0, 6.0, 8.0, 22.0, 13.0, 23.0, 34.0, 37.0, 59.0, 93.0, 160.0, 273.0, 463.0, 827.0, 1681.0, 3623.0, 8608.0, 26907.0, 110726.0, 619493.0, 211347.0, 41800.0, 12889.0, 4791.0, 2110.0, 1023.0, 580.0, 328.0, 202.0, 130.0, 73.0, 59.0, 59.0, 25.0, 16.0, 13.0, 9.0, 6.0, 3.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.37890625, -4.244873046875, -4.11083984375, -3.976806640625, -3.8427734375, -3.708740234375, -3.57470703125, -3.440673828125, -3.306640625, -3.172607421875, -3.03857421875, -2.904541015625, -2.7705078125, -2.636474609375, -2.50244140625, -2.368408203125, -2.234375, -2.100341796875, -1.96630859375, -1.832275390625, -1.6982421875, -1.564208984375, -1.43017578125, -1.296142578125, -1.162109375, -1.028076171875, -0.89404296875, -0.760009765625, -0.6259765625, -0.491943359375, -0.35791015625, -0.223876953125, -0.08984375, 0.044189453125, 0.17822265625, 0.312255859375, 0.4462890625, 0.580322265625, 0.71435546875, 0.848388671875, 0.982421875, 1.116455078125, 1.25048828125, 1.384521484375, 1.5185546875, 1.652587890625, 1.78662109375, 1.920654296875, 2.0546875, 2.188720703125, 2.32275390625, 2.456787109375, 2.5908203125, 2.724853515625, 2.85888671875, 2.992919921875, 3.126953125, 3.260986328125, 3.39501953125, 3.529052734375, 3.6630859375, 3.797119140625, 3.93115234375, 4.065185546875, 4.19921875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 9.0, 9.0, 16.0, 15.0, 8.0, 19.0, 27.0, 32.0, 56.0, 91.0, 122.0, 170.0, 123.0, 94.0, 57.0, 37.0, 35.0, 19.0, 14.0, 9.0, 8.0, 3.0, 9.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1640625, -4.04998779296875, -3.9359130859375, -3.82183837890625, -3.707763671875, -3.59368896484375, -3.4796142578125, -3.36553955078125, -3.25146484375, -3.13739013671875, -3.0233154296875, -2.90924072265625, -2.795166015625, -2.68109130859375, -2.5670166015625, -2.45294189453125, -2.3388671875, -2.22479248046875, -2.1107177734375, -1.99664306640625, -1.882568359375, -1.76849365234375, -1.6544189453125, -1.54034423828125, -1.42626953125, -1.31219482421875, -1.1981201171875, -1.08404541015625, -0.969970703125, -0.85589599609375, -0.7418212890625, -0.62774658203125, -0.513671875, -0.39959716796875, -0.2855224609375, -0.17144775390625, -0.057373046875, 0.05670166015625, 0.1707763671875, 0.28485107421875, 0.39892578125, 0.51300048828125, 0.6270751953125, 0.74114990234375, 0.855224609375, 0.96929931640625, 1.0833740234375, 1.19744873046875, 1.3115234375, 1.42559814453125, 1.5396728515625, 1.65374755859375, 1.767822265625, 1.88189697265625, 1.9959716796875, 2.11004638671875, 2.22412109375, 2.33819580078125, 2.4522705078125, 2.56634521484375, 2.680419921875, 2.79449462890625, 2.9085693359375, 3.02264404296875, 3.13671875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 8.0, 12.0, 26.0, 28.0, 52.0, 90.0, 93.0, 123.0, 136.0, 133.0, 98.0, 72.0, 43.0, 32.0, 20.0, 10.0, 10.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.650753021240234, -36.4671630859375, -35.2835693359375, -34.0999755859375, -32.916385650634766, -31.7327938079834, -30.54920196533203, -29.365610122680664, -28.182018280029297, -26.99842643737793, -25.814834594726562, -24.631242752075195, -23.447650909423828, -22.26405906677246, -21.080467224121094, -19.896875381469727, -18.71328353881836, -17.529691696166992, -16.346099853515625, -15.162508010864258, -13.97891616821289, -12.795324325561523, -11.611732482910156, -10.428140640258789, -9.244548797607422, -8.060956954956055, -6.8773651123046875, -5.69377326965332, -4.510181427001953, -3.326589584350586, -2.1429977416992188, -0.9594058990478516, 0.22418975830078125, 1.4077816009521484, 2.5913734436035156, 3.774965286254883, 4.95855712890625, 6.142148971557617, 7.325740814208984, 8.509332656860352, 9.692924499511719, 10.876516342163086, 12.060108184814453, 13.24370002746582, 14.427291870117188, 15.610883712768555, 16.794475555419922, 17.97806739807129, 19.161659240722656, 20.345251083374023, 21.52884292602539, 22.712434768676758, 23.896026611328125, 25.079618453979492, 26.26321029663086, 27.446802139282227, 28.630393981933594, 29.81398582458496, 30.997577667236328, 32.18116760253906, 33.36476135253906, 34.54835510253906, 35.7319450378418, 36.91553497314453, 38.09912872314453]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 6.0, 7.0, 9.0, 9.0, 12.0, 11.0, 15.0, 27.0, 23.0, 23.0, 26.0, 36.0, 41.0, 31.0, 42.0, 33.0, 50.0, 44.0, 36.0, 47.0, 33.0, 37.0, 39.0, 45.0, 37.0, 33.0, 24.0, 31.0, 27.0, 26.0, 15.0, 19.0, 22.0, 12.0, 14.0, 12.0, 12.0, 14.0, 6.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-21.571372985839844, -20.91573143005371, -20.26009178161621, -19.604450225830078, -18.948808670043945, -18.293167114257812, -17.637527465820312, -16.98188591003418, -16.326244354248047, -15.67060375213623, -15.014962196350098, -14.359321594238281, -13.703680038452148, -13.048039436340332, -12.392398834228516, -11.736757278442383, -11.081116676330566, -10.42547607421875, -9.769834518432617, -9.1141939163208, -8.458552360534668, -7.802911758422852, -7.147270679473877, -6.491629600524902, -5.835988521575928, -5.180347442626953, -4.5247063636779785, -3.869065523147583, -3.2134244441986084, -2.557783365249634, -1.9021425247192383, -1.2465014457702637, -0.5908603668212891, 0.06478065252304077, 0.7204216718673706, 1.3760626316070557, 2.0317037105560303, 2.687344789505005, 3.3429856300354004, 3.998626708984375, 4.65426778793335, 5.309908866882324, 5.965549945831299, 6.621191024780273, 7.27683162689209, 7.932473182678223, 8.588113784790039, 9.243755340576172, 9.899395942687988, 10.555036544799805, 11.210678100585938, 11.866318702697754, 12.521960258483887, 13.177600860595703, 13.833242416381836, 14.488883018493652, 15.144523620605469, 15.800164222717285, 16.4558048248291, 17.111446380615234, 17.767087936401367, 18.4227294921875, 19.078369140625, 19.734010696411133, 20.389652252197266]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 1.0, 3.0, 9.0, 10.0, 4.0, 17.0, 20.0, 42.0, 61.0, 90.0, 155.0, 308.0, 553.0, 1038.0, 2202.0, 5190.0, 13493.0, 42100.0, 209974.0, 3542419.0, 298403.0, 51572.0, 15776.0, 5940.0, 2462.0, 1165.0, 605.0, 297.0, 154.0, 85.0, 52.0, 27.0, 20.0, 12.0, 8.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.3515625, -7.17474365234375, -6.9979248046875, -6.82110595703125, -6.644287109375, -6.46746826171875, -6.2906494140625, -6.11383056640625, -5.93701171875, -5.76019287109375, -5.5833740234375, -5.40655517578125, -5.229736328125, -5.05291748046875, -4.8760986328125, -4.69927978515625, -4.5224609375, -4.34564208984375, -4.1688232421875, -3.99200439453125, -3.815185546875, -3.63836669921875, -3.4615478515625, -3.28472900390625, -3.10791015625, -2.93109130859375, -2.7542724609375, -2.57745361328125, -2.400634765625, -2.22381591796875, -2.0469970703125, -1.87017822265625, -1.693359375, -1.51654052734375, -1.3397216796875, -1.16290283203125, -0.986083984375, -0.80926513671875, -0.6324462890625, -0.45562744140625, -0.27880859375, -0.10198974609375, 0.0748291015625, 0.25164794921875, 0.428466796875, 0.60528564453125, 0.7821044921875, 0.95892333984375, 1.1357421875, 1.31256103515625, 1.4893798828125, 1.66619873046875, 1.843017578125, 2.01983642578125, 2.1966552734375, 2.37347412109375, 2.55029296875, 2.72711181640625, 2.9039306640625, 3.08074951171875, 3.257568359375, 3.43438720703125, 3.6112060546875, 3.78802490234375, 3.96484375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 6.0, 12.0, 17.0, 12.0, 20.0, 25.0, 19.0, 38.0, 33.0, 43.0, 51.0, 54.0, 57.0, 54.0, 55.0, 59.0, 52.0, 51.0, 47.0, 35.0, 53.0, 33.0, 36.0, 32.0, 16.0, 15.0, 15.0, 8.0, 13.0, 8.0, 5.0, 5.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8828125, -0.853363037109375, -0.82391357421875, -0.794464111328125, -0.7650146484375, -0.735565185546875, -0.70611572265625, -0.676666259765625, -0.647216796875, -0.617767333984375, -0.58831787109375, -0.558868408203125, -0.5294189453125, -0.499969482421875, -0.47052001953125, -0.441070556640625, -0.41162109375, -0.382171630859375, -0.35272216796875, -0.323272705078125, -0.2938232421875, -0.264373779296875, -0.23492431640625, -0.205474853515625, -0.176025390625, -0.146575927734375, -0.11712646484375, -0.087677001953125, -0.0582275390625, -0.028778076171875, 0.00067138671875, 0.030120849609375, 0.0595703125, 0.089019775390625, 0.11846923828125, 0.147918701171875, 0.1773681640625, 0.206817626953125, 0.23626708984375, 0.265716552734375, 0.295166015625, 0.324615478515625, 0.35406494140625, 0.383514404296875, 0.4129638671875, 0.442413330078125, 0.47186279296875, 0.501312255859375, 0.53076171875, 0.560211181640625, 0.58966064453125, 0.619110107421875, 0.6485595703125, 0.678009033203125, 0.70745849609375, 0.736907958984375, 0.766357421875, 0.795806884765625, 0.82525634765625, 0.854705810546875, 0.8841552734375, 0.913604736328125, 0.94305419921875, 0.972503662109375, 1.001953125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 9.0, 8.0, 26.0, 25.0, 55.0, 109.0, 185.0, 501.0, 1586.0, 6442.0, 34648.0, 461396.0, 3563438.0, 106154.0, 14934.0, 3257.0, 920.0, 301.0, 145.0, 50.0, 45.0, 21.0, 11.0, 8.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.40625, -12.10552978515625, -11.8048095703125, -11.50408935546875, -11.203369140625, -10.90264892578125, -10.6019287109375, -10.30120849609375, -10.00048828125, -9.69976806640625, -9.3990478515625, -9.09832763671875, -8.797607421875, -8.49688720703125, -8.1961669921875, -7.89544677734375, -7.5947265625, -7.29400634765625, -6.9932861328125, -6.69256591796875, -6.391845703125, -6.09112548828125, -5.7904052734375, -5.48968505859375, -5.18896484375, -4.88824462890625, -4.5875244140625, -4.28680419921875, -3.986083984375, -3.68536376953125, -3.3846435546875, -3.08392333984375, -2.783203125, -2.48248291015625, -2.1817626953125, -1.88104248046875, -1.580322265625, -1.27960205078125, -0.9788818359375, -0.67816162109375, -0.37744140625, -0.07672119140625, 0.2239990234375, 0.52471923828125, 0.825439453125, 1.12615966796875, 1.4268798828125, 1.72760009765625, 2.0283203125, 2.32904052734375, 2.6297607421875, 2.93048095703125, 3.231201171875, 3.53192138671875, 3.8326416015625, 4.13336181640625, 4.43408203125, 4.73480224609375, 5.0355224609375, 5.33624267578125, 5.636962890625, 5.93768310546875, 6.2384033203125, 6.53912353515625, 6.83984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 5.0, 9.0, 9.0, 10.0, 20.0, 24.0, 35.0, 50.0, 84.0, 127.0, 255.0, 638.0, 1659.0, 522.0, 243.0, 126.0, 87.0, 38.0, 31.0, 23.0, 15.0, 20.0, 8.0, 6.0, 6.0, 8.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.642578125, -2.567901611328125, -2.49322509765625, -2.418548583984375, -2.3438720703125, -2.269195556640625, -2.19451904296875, -2.119842529296875, -2.045166015625, -1.970489501953125, -1.89581298828125, -1.821136474609375, -1.7464599609375, -1.671783447265625, -1.59710693359375, -1.522430419921875, -1.44775390625, -1.373077392578125, -1.29840087890625, -1.223724365234375, -1.1490478515625, -1.074371337890625, -0.99969482421875, -0.925018310546875, -0.850341796875, -0.775665283203125, -0.70098876953125, -0.626312255859375, -0.5516357421875, -0.476959228515625, -0.40228271484375, -0.327606201171875, -0.2529296875, -0.178253173828125, -0.10357666015625, -0.028900146484375, 0.0457763671875, 0.120452880859375, 0.19512939453125, 0.269805908203125, 0.344482421875, 0.419158935546875, 0.49383544921875, 0.568511962890625, 0.6431884765625, 0.717864990234375, 0.79254150390625, 0.867218017578125, 0.94189453125, 1.016571044921875, 1.09124755859375, 1.165924072265625, 1.2406005859375, 1.315277099609375, 1.38995361328125, 1.464630126953125, 1.539306640625, 1.613983154296875, 1.68865966796875, 1.763336181640625, 1.8380126953125, 1.912689208984375, 1.98736572265625, 2.062042236328125, 2.13671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 6.0, 9.0, 9.0, 17.0, 32.0, 62.0, 90.0, 97.0, 149.0, 156.0, 125.0, 83.0, 64.0, 47.0, 28.0, 15.0, 6.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.374724388122559, -5.8787760734558105, -5.382828235626221, -4.886879920959473, -4.390932083129883, -3.8949837684631348, -3.3990354537963867, -2.9030873775482178, -2.407139301300049, -1.9111912250518799, -1.4152430295944214, -0.9192948341369629, -0.42334675788879395, 0.072601318359375, 0.568549633026123, 1.064497709274292, 1.560445785522461, 2.05639386177063, 2.552341938018799, 3.048290252685547, 3.544238328933716, 4.040186405181885, 4.536134719848633, 5.032082557678223, 5.528030872344971, 6.023979187011719, 6.519927024841309, 7.015875339508057, 7.511823654174805, 8.007771492004395, 8.503719329833984, 8.99966812133789, 9.495615005493164, 9.991562843322754, 10.48751163482666, 10.98345947265625, 11.47940731048584, 11.97535514831543, 12.471303939819336, 12.967251777648926, 13.463199615478516, 13.959147453308105, 14.455096244812012, 14.951044082641602, 15.446991920471191, 15.942939758300781, 16.438888549804688, 16.934837341308594, 17.4307861328125, 17.926734924316406, 18.42268180847168, 18.918630599975586, 19.414579391479492, 19.910526275634766, 20.406475067138672, 20.902423858642578, 21.39837074279785, 21.894319534301758, 22.39026641845703, 22.886215209960938, 23.382164001464844, 23.878110885620117, 24.374059677124023, 24.87000846862793, 25.365955352783203]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 8.0, 15.0, 7.0, 13.0, 11.0, 14.0, 19.0, 31.0, 21.0, 23.0, 35.0, 32.0, 33.0, 31.0, 43.0, 58.0, 50.0, 53.0, 46.0, 40.0, 53.0, 31.0, 40.0, 33.0, 38.0, 41.0, 34.0, 25.0, 30.0, 21.0, 13.0, 18.0, 6.0, 5.0, 9.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.534829139709473, -7.300292015075684, -7.065754413604736, -6.831217288970947, -6.5966796875, -6.362142562866211, -6.127605438232422, -5.893067836761475, -5.658530235290527, -5.423993110656738, -5.189455509185791, -4.954918384552002, -4.720380783081055, -4.485843658447266, -4.251306533813477, -4.016768932342529, -3.7822318077087402, -3.547694444656372, -3.313157081604004, -3.078619956970215, -2.8440823554992676, -2.6095452308654785, -2.3750078678131104, -2.140470504760742, -1.905933141708374, -1.6713957786560059, -1.4368584156036377, -1.202321171760559, -0.9677838087081909, -0.7332464456558228, -0.49870920181274414, -0.264171838760376, -0.029634475708007812, 0.20490285754203796, 0.43944019079208374, 0.6739774942398071, 0.9085148572921753, 1.1430522203445435, 1.377589464187622, 1.6121268272399902, 1.8466641902923584, 2.0812015533447266, 2.3157389163970947, 2.550276279449463, 2.784813404083252, 3.019351005554199, 3.2538881301879883, 3.4884254932403564, 3.7229628562927246, 3.9575002193450928, 4.192037582397461, 4.42657470703125, 4.661112308502197, 4.895649433135986, 5.130187034606934, 5.364724159240723, 5.599261283874512, 5.833798408508301, 6.068336009979248, 6.302873134613037, 6.537410736083984, 6.771947860717773, 7.0064849853515625, 7.24102258682251, 7.475560188293457]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 9.0, 12.0, 13.0, 30.0, 48.0, 77.0, 110.0, 229.0, 407.0, 841.0, 1963.0, 4694.0, 12227.0, 33005.0, 89191.0, 231321.0, 378816.0, 184155.0, 69709.0, 25404.0, 9444.0, 3737.0, 1564.0, 714.0, 355.0, 216.0, 93.0, 77.0, 40.0, 23.0, 16.0, 8.0, 9.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.62091064453125, -6.4527587890625, -6.28460693359375, -6.116455078125, -5.94830322265625, -5.7801513671875, -5.61199951171875, -5.44384765625, -5.27569580078125, -5.1075439453125, -4.93939208984375, -4.771240234375, -4.60308837890625, -4.4349365234375, -4.26678466796875, -4.0986328125, -3.93048095703125, -3.7623291015625, -3.59417724609375, -3.426025390625, -3.25787353515625, -3.0897216796875, -2.92156982421875, -2.75341796875, -2.58526611328125, -2.4171142578125, -2.24896240234375, -2.080810546875, -1.91265869140625, -1.7445068359375, -1.57635498046875, -1.408203125, -1.24005126953125, -1.0718994140625, -0.90374755859375, -0.735595703125, -0.56744384765625, -0.3992919921875, -0.23114013671875, -0.06298828125, 0.10516357421875, 0.2733154296875, 0.44146728515625, 0.609619140625, 0.77777099609375, 0.9459228515625, 1.11407470703125, 1.2822265625, 1.45037841796875, 1.6185302734375, 1.78668212890625, 1.954833984375, 2.12298583984375, 2.2911376953125, 2.45928955078125, 2.62744140625, 2.79559326171875, 2.9637451171875, 3.13189697265625, 3.300048828125, 3.46820068359375, 3.6363525390625, 3.80450439453125, 3.97265625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 8.0, 7.0, 3.0, 12.0, 15.0, 26.0, 29.0, 25.0, 25.0, 46.0, 42.0, 56.0, 56.0, 63.0, 54.0, 62.0, 61.0, 54.0, 40.0, 42.0, 45.0, 56.0, 45.0, 18.0, 29.0, 15.0, 15.0, 17.0, 13.0, 6.0, 3.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0537109375, -1.0203399658203125, -0.986968994140625, -0.9535980224609375, -0.92022705078125, -0.8868560791015625, -0.853485107421875, -0.8201141357421875, -0.7867431640625, -0.7533721923828125, -0.720001220703125, -0.6866302490234375, -0.65325927734375, -0.6198883056640625, -0.586517333984375, -0.5531463623046875, -0.519775390625, -0.4864044189453125, -0.453033447265625, -0.4196624755859375, -0.38629150390625, -0.3529205322265625, -0.319549560546875, -0.2861785888671875, -0.2528076171875, -0.2194366455078125, -0.186065673828125, -0.1526947021484375, -0.11932373046875, -0.0859527587890625, -0.052581787109375, -0.0192108154296875, 0.01416015625, 0.0475311279296875, 0.080902099609375, 0.1142730712890625, 0.14764404296875, 0.1810150146484375, 0.214385986328125, 0.2477569580078125, 0.2811279296875, 0.3144989013671875, 0.347869873046875, 0.3812408447265625, 0.41461181640625, 0.4479827880859375, 0.481353759765625, 0.5147247314453125, 0.548095703125, 0.5814666748046875, 0.614837646484375, 0.6482086181640625, 0.68157958984375, 0.7149505615234375, 0.748321533203125, 0.7816925048828125, 0.8150634765625, 0.8484344482421875, 0.881805419921875, 0.9151763916015625, 0.94854736328125, 0.9819183349609375, 1.015289306640625, 1.0486602783203125, 1.08203125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 1.0, 1.0, 9.0, 1.0, 8.0, 13.0, 17.0, 17.0, 27.0, 39.0, 62.0, 69.0, 141.0, 198.0, 281.0, 400.0, 759.0, 1578.0, 4363.0, 15968.0, 73083.0, 353202.0, 462197.0, 103917.0, 22249.0, 5758.0, 1983.0, 826.0, 482.0, 277.0, 177.0, 144.0, 100.0, 55.0, 36.0, 36.0, 20.0, 16.0, 14.0, 3.0, 8.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-7.859375, -7.6417236328125, -7.424072265625, -7.2064208984375, -6.98876953125, -6.7711181640625, -6.553466796875, -6.3358154296875, -6.1181640625, -5.9005126953125, -5.682861328125, -5.4652099609375, -5.24755859375, -5.0299072265625, -4.812255859375, -4.5946044921875, -4.376953125, -4.1593017578125, -3.941650390625, -3.7239990234375, -3.50634765625, -3.2886962890625, -3.071044921875, -2.8533935546875, -2.6357421875, -2.4180908203125, -2.200439453125, -1.9827880859375, -1.76513671875, -1.5474853515625, -1.329833984375, -1.1121826171875, -0.89453125, -0.6768798828125, -0.459228515625, -0.2415771484375, -0.02392578125, 0.1937255859375, 0.411376953125, 0.6290283203125, 0.8466796875, 1.0643310546875, 1.281982421875, 1.4996337890625, 1.71728515625, 1.9349365234375, 2.152587890625, 2.3702392578125, 2.587890625, 2.8055419921875, 3.023193359375, 3.2408447265625, 3.45849609375, 3.6761474609375, 3.893798828125, 4.1114501953125, 4.3291015625, 4.5467529296875, 4.764404296875, 4.9820556640625, 5.19970703125, 5.4173583984375, 5.635009765625, 5.8526611328125, 6.0703125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 10.0, 5.0, 10.0, 9.0, 11.0, 10.0, 14.0, 18.0, 16.0, 24.0, 18.0, 30.0, 33.0, 28.0, 28.0, 45.0, 27.0, 28.0, 32.0, 46.0, 49.0, 33.0, 41.0, 53.0, 49.0, 34.0, 37.0, 33.0, 37.0, 28.0, 28.0, 16.0, 17.0, 13.0, 10.0, 6.0, 14.0, 10.0, 5.0, 6.0, 8.0, 5.0, 2.0, 3.0, 3.0, 9.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.517578125, -3.40240478515625, -3.2872314453125, -3.17205810546875, -3.056884765625, -2.94171142578125, -2.8265380859375, -2.71136474609375, -2.59619140625, -2.48101806640625, -2.3658447265625, -2.25067138671875, -2.135498046875, -2.02032470703125, -1.9051513671875, -1.78997802734375, -1.6748046875, -1.55963134765625, -1.4444580078125, -1.32928466796875, -1.214111328125, -1.09893798828125, -0.9837646484375, -0.86859130859375, -0.75341796875, -0.63824462890625, -0.5230712890625, -0.40789794921875, -0.292724609375, -0.17755126953125, -0.0623779296875, 0.05279541015625, 0.16796875, 0.28314208984375, 0.3983154296875, 0.51348876953125, 0.628662109375, 0.74383544921875, 0.8590087890625, 0.97418212890625, 1.08935546875, 1.20452880859375, 1.3197021484375, 1.43487548828125, 1.550048828125, 1.66522216796875, 1.7803955078125, 1.89556884765625, 2.0107421875, 2.12591552734375, 2.2410888671875, 2.35626220703125, 2.471435546875, 2.58660888671875, 2.7017822265625, 2.81695556640625, 2.93212890625, 3.04730224609375, 3.1624755859375, 3.27764892578125, 3.392822265625, 3.50799560546875, 3.6231689453125, 3.73834228515625, 3.853515625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 7.0, 4.0, 5.0, 5.0, 4.0, 5.0, 13.0, 15.0, 11.0, 19.0, 27.0, 51.0, 61.0, 100.0, 147.0, 238.0, 372.0, 634.0, 1111.0, 2009.0, 3772.0, 7689.0, 17324.0, 44466.0, 137303.0, 419545.0, 278891.0, 81844.0, 28967.0, 11741.0, 5486.0, 2817.0, 1539.0, 861.0, 526.0, 322.0, 200.0, 151.0, 83.0, 55.0, 40.0, 23.0, 17.0, 20.0, 10.0, 9.0, 3.0, 6.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.3203125, -2.233673095703125, -2.14703369140625, -2.060394287109375, -1.9737548828125, -1.887115478515625, -1.80047607421875, -1.713836669921875, -1.627197265625, -1.540557861328125, -1.45391845703125, -1.367279052734375, -1.2806396484375, -1.194000244140625, -1.10736083984375, -1.020721435546875, -0.93408203125, -0.847442626953125, -0.76080322265625, -0.674163818359375, -0.5875244140625, -0.500885009765625, -0.41424560546875, -0.327606201171875, -0.240966796875, -0.154327392578125, -0.06768798828125, 0.018951416015625, 0.1055908203125, 0.192230224609375, 0.27886962890625, 0.365509033203125, 0.4521484375, 0.538787841796875, 0.62542724609375, 0.712066650390625, 0.7987060546875, 0.885345458984375, 0.97198486328125, 1.058624267578125, 1.145263671875, 1.231903076171875, 1.31854248046875, 1.405181884765625, 1.4918212890625, 1.578460693359375, 1.66510009765625, 1.751739501953125, 1.83837890625, 1.925018310546875, 2.01165771484375, 2.098297119140625, 2.1849365234375, 2.271575927734375, 2.35821533203125, 2.444854736328125, 2.531494140625, 2.618133544921875, 2.70477294921875, 2.791412353515625, 2.8780517578125, 2.964691162109375, 3.05133056640625, 3.137969970703125, 3.224609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 6.0, 7.0, 16.0, 23.0, 22.0, 18.0, 31.0, 26.0, 29.0, 65.0, 80.0, 103.0, 135.0, 94.0, 71.0, 53.0, 46.0, 29.0, 30.0, 21.0, 11.0, 12.0, 20.0, 11.0, 8.0, 6.0, 4.0, 3.0, 2.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005602836608886719, -0.0005418136715888977, -0.0005233436822891235, -0.0005048736929893494, -0.0004864037036895752, -0.000467933714389801, -0.00044946372509002686, -0.0004309937357902527, -0.0004125237464904785, -0.00039405375719070435, -0.0003755837678909302, -0.000357113778591156, -0.00033864378929138184, -0.00032017379999160767, -0.0003017038106918335, -0.0002832338213920593, -0.00026476383209228516, -0.000246293842792511, -0.00022782385349273682, -0.00020935386419296265, -0.00019088387489318848, -0.0001724138855934143, -0.00015394389629364014, -0.00013547390699386597, -0.0001170039176940918, -9.853392839431763e-05, -8.006393909454346e-05, -6.159394979476929e-05, -4.312396049499512e-05, -2.4653971195220947e-05, -6.183981895446777e-06, 1.2286007404327393e-05, 3.075599670410156e-05, 4.922598600387573e-05, 6.76959753036499e-05, 8.616596460342407e-05, 0.00010463595390319824, 0.0001231059432029724, 0.00014157593250274658, 0.00016004592180252075, 0.00017851591110229492, 0.0001969859004020691, 0.00021545588970184326, 0.00023392587900161743, 0.0002523958683013916, 0.00027086585760116577, 0.00028933584690093994, 0.0003078058362007141, 0.0003262758255004883, 0.00034474581480026245, 0.0003632158041000366, 0.0003816857933998108, 0.00040015578269958496, 0.00041862577199935913, 0.0004370957612991333, 0.00045556575059890747, 0.00047403573989868164, 0.0004925057291984558, 0.00051097571849823, 0.0005294457077980042, 0.0005479156970977783, 0.0005663856863975525, 0.0005848556756973267, 0.0006033256649971008, 0.000621795654296875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 6.0, 7.0, 21.0, 33.0, 56.0, 56.0, 89.0, 186.0, 335.0, 687.0, 1681.0, 4602.0, 16277.0, 86982.0, 677467.0, 217819.0, 30277.0, 7537.0, 2387.0, 960.0, 453.0, 227.0, 138.0, 88.0, 46.0, 37.0, 22.0, 14.0, 13.0, 11.0, 10.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.24609375, -6.075927734375, -5.90576171875, -5.735595703125, -5.5654296875, -5.395263671875, -5.22509765625, -5.054931640625, -4.884765625, -4.714599609375, -4.54443359375, -4.374267578125, -4.2041015625, -4.033935546875, -3.86376953125, -3.693603515625, -3.5234375, -3.353271484375, -3.18310546875, -3.012939453125, -2.8427734375, -2.672607421875, -2.50244140625, -2.332275390625, -2.162109375, -1.991943359375, -1.82177734375, -1.651611328125, -1.4814453125, -1.311279296875, -1.14111328125, -0.970947265625, -0.80078125, -0.630615234375, -0.46044921875, -0.290283203125, -0.1201171875, 0.050048828125, 0.22021484375, 0.390380859375, 0.560546875, 0.730712890625, 0.90087890625, 1.071044921875, 1.2412109375, 1.411376953125, 1.58154296875, 1.751708984375, 1.921875, 2.092041015625, 2.26220703125, 2.432373046875, 2.6025390625, 2.772705078125, 2.94287109375, 3.113037109375, 3.283203125, 3.453369140625, 3.62353515625, 3.793701171875, 3.9638671875, 4.134033203125, 4.30419921875, 4.474365234375, 4.64453125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 7.0, 11.0, 12.0, 7.0, 10.0, 14.0, 13.0, 23.0, 26.0, 37.0, 61.0, 86.0, 108.0, 125.0, 101.0, 73.0, 65.0, 44.0, 31.0, 31.0, 22.0, 15.0, 12.0, 8.0, 6.0, 8.0, 12.0, 10.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.8828125, -2.78515625, -2.6875, -2.58984375, -2.4921875, -2.39453125, -2.296875, -2.19921875, -2.1015625, -2.00390625, -1.90625, -1.80859375, -1.7109375, -1.61328125, -1.515625, -1.41796875, -1.3203125, -1.22265625, -1.125, -1.02734375, -0.9296875, -0.83203125, -0.734375, -0.63671875, -0.5390625, -0.44140625, -0.34375, -0.24609375, -0.1484375, -0.05078125, 0.046875, 0.14453125, 0.2421875, 0.33984375, 0.4375, 0.53515625, 0.6328125, 0.73046875, 0.828125, 0.92578125, 1.0234375, 1.12109375, 1.21875, 1.31640625, 1.4140625, 1.51171875, 1.609375, 1.70703125, 1.8046875, 1.90234375, 2.0, 2.09765625, 2.1953125, 2.29296875, 2.390625, 2.48828125, 2.5859375, 2.68359375, 2.78125, 2.87890625, 2.9765625, 3.07421875, 3.171875, 3.26953125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 12.0, 20.0, 58.0, 126.0, 168.0, 238.0, 191.0, 108.0, 47.0, 17.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.76984786987305, -58.46548080444336, -56.161109924316406, -53.85674285888672, -51.55237579345703, -49.248008728027344, -46.94363784790039, -44.6392707824707, -42.33489990234375, -40.03053283691406, -37.72616195678711, -35.42179489135742, -33.117427825927734, -30.813058853149414, -28.508689880371094, -26.204322814941406, -23.89995574951172, -21.5955867767334, -19.29121971130371, -16.98685073852539, -14.682482719421387, -12.378114700317383, -10.073745727539062, -7.769378662109375, -5.465009689331055, -3.1606414318084717, -0.8562731742858887, 1.4480953216552734, 3.7524633407592773, 6.056831359863281, 8.361200332641602, 10.665567398071289, 12.969932556152344, 15.274300575256348, 17.57866859436035, 19.883037567138672, 22.18740463256836, 24.49177360534668, 26.796142578125, 29.100509643554688, 31.404878616333008, 33.70924758911133, 36.013614654541016, 38.31798553466797, 40.622352600097656, 42.926719665527344, 45.23108673095703, 47.53545379638672, 49.83982467651367, 52.14419174194336, 54.44856262207031, 56.7529296875, 59.05729675292969, 61.361663818359375, 63.66603469848633, 65.97039794921875, 68.27477264404297, 70.57913970947266, 72.88350677490234, 75.18788146972656, 77.49224853515625, 79.79661560058594, 82.10098266601562, 84.40534973144531, 86.709716796875]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 7.0, 13.0, 7.0, 14.0, 5.0, 15.0, 18.0, 17.0, 21.0, 25.0, 33.0, 27.0, 26.0, 38.0, 36.0, 47.0, 37.0, 57.0, 42.0, 34.0, 39.0, 47.0, 40.0, 37.0, 28.0, 38.0, 28.0, 36.0, 35.0, 18.0, 25.0, 19.0, 20.0, 14.0, 6.0, 10.0, 10.0, 9.0, 5.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-24.171260833740234, -23.46770668029785, -22.764150619506836, -22.060596466064453, -21.357040405273438, -20.653486251831055, -19.949932098388672, -19.246376037597656, -18.54281997680664, -17.839265823364258, -17.135709762573242, -16.43215560913086, -15.728599548339844, -15.025045394897461, -14.321490287780762, -13.617935180664062, -12.91438102722168, -12.21082592010498, -11.507270812988281, -10.803716659545898, -10.100160598754883, -9.3966064453125, -8.6930513381958, -7.989496231079102, -7.285941123962402, -6.582386016845703, -5.878830909729004, -5.175276279449463, -4.471721172332764, -3.7681660652160645, -3.0646114349365234, -2.361056327819824, -1.657501220703125, -0.9539462327957153, -0.25039124488830566, 0.45316362380981445, 1.1567187309265137, 1.860273838043213, 2.563828468322754, 3.267383575439453, 3.9709386825561523, 4.674493789672852, 5.378048896789551, 6.081603527069092, 6.785158634185791, 7.48871374130249, 8.192268371582031, 8.89582347869873, 9.59937858581543, 10.302933692932129, 11.006488800048828, 11.710042953491211, 12.413599014282227, 13.11715316772461, 13.820708274841309, 14.524263381958008, 15.227818489074707, 15.931373596191406, 16.63492774963379, 17.338483810424805, 18.042037963867188, 18.745594024658203, 19.449148178100586, 20.15270233154297, 20.856258392333984]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 11.0, 20.0, 22.0, 23.0, 36.0, 53.0, 72.0, 87.0, 140.0, 221.0, 334.0, 575.0, 879.0, 1511.0, 2756.0, 5114.0, 10534.0, 22937.0, 57326.0, 188254.0, 2463913.0, 1192793.0, 155362.0, 50402.0, 20703.0, 9527.0, 4619.0, 2464.0, 1387.0, 833.0, 468.0, 297.0, 202.0, 125.0, 94.0, 57.0, 26.0, 30.0, 22.0, 12.0, 4.0, 10.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.3046875, -4.1739501953125, -4.043212890625, -3.9124755859375, -3.78173828125, -3.6510009765625, -3.520263671875, -3.3895263671875, -3.2587890625, -3.1280517578125, -2.997314453125, -2.8665771484375, -2.73583984375, -2.6051025390625, -2.474365234375, -2.3436279296875, -2.212890625, -2.0821533203125, -1.951416015625, -1.8206787109375, -1.68994140625, -1.5592041015625, -1.428466796875, -1.2977294921875, -1.1669921875, -1.0362548828125, -0.905517578125, -0.7747802734375, -0.64404296875, -0.5133056640625, -0.382568359375, -0.2518310546875, -0.12109375, 0.0096435546875, 0.140380859375, 0.2711181640625, 0.40185546875, 0.5325927734375, 0.663330078125, 0.7940673828125, 0.9248046875, 1.0555419921875, 1.186279296875, 1.3170166015625, 1.44775390625, 1.5784912109375, 1.709228515625, 1.8399658203125, 1.970703125, 2.1014404296875, 2.232177734375, 2.3629150390625, 2.49365234375, 2.6243896484375, 2.755126953125, 2.8858642578125, 3.0166015625, 3.1473388671875, 3.278076171875, 3.4088134765625, 3.53955078125, 3.6702880859375, 3.801025390625, 3.9317626953125, 4.0625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 9.0, 15.0, 22.0, 20.0, 25.0, 22.0, 29.0, 33.0, 38.0, 48.0, 51.0, 46.0, 54.0, 46.0, 61.0, 71.0, 64.0, 47.0, 40.0, 51.0, 31.0, 26.0, 31.0, 23.0, 21.0, 22.0, 12.0, 9.0, 4.0, 11.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0732421875, -1.0399169921875, -1.006591796875, -0.9732666015625, -0.93994140625, -0.9066162109375, -0.873291015625, -0.8399658203125, -0.806640625, -0.7733154296875, -0.739990234375, -0.7066650390625, -0.67333984375, -0.6400146484375, -0.606689453125, -0.5733642578125, -0.5400390625, -0.5067138671875, -0.473388671875, -0.4400634765625, -0.40673828125, -0.3734130859375, -0.340087890625, -0.3067626953125, -0.2734375, -0.2401123046875, -0.206787109375, -0.1734619140625, -0.14013671875, -0.1068115234375, -0.073486328125, -0.0401611328125, -0.0068359375, 0.0264892578125, 0.059814453125, 0.0931396484375, 0.12646484375, 0.1597900390625, 0.193115234375, 0.2264404296875, 0.259765625, 0.2930908203125, 0.326416015625, 0.3597412109375, 0.39306640625, 0.4263916015625, 0.459716796875, 0.4930419921875, 0.5263671875, 0.5596923828125, 0.593017578125, 0.6263427734375, 0.65966796875, 0.6929931640625, 0.726318359375, 0.7596435546875, 0.79296875, 0.8262939453125, 0.859619140625, 0.8929443359375, 0.92626953125, 0.9595947265625, 0.992919921875, 1.0262451171875, 1.0595703125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 11.0, 17.0, 26.0, 52.0, 67.0, 106.0, 253.0, 631.0, 1917.0, 8112.0, 52883.0, 1256305.0, 2787341.0, 72772.0, 10108.0, 2277.0, 766.0, 306.0, 151.0, 75.0, 43.0, 23.0, 19.0, 13.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.53125, -8.227294921875, -7.92333984375, -7.619384765625, -7.3154296875, -7.011474609375, -6.70751953125, -6.403564453125, -6.099609375, -5.795654296875, -5.49169921875, -5.187744140625, -4.8837890625, -4.579833984375, -4.27587890625, -3.971923828125, -3.66796875, -3.364013671875, -3.06005859375, -2.756103515625, -2.4521484375, -2.148193359375, -1.84423828125, -1.540283203125, -1.236328125, -0.932373046875, -0.62841796875, -0.324462890625, -0.0205078125, 0.283447265625, 0.58740234375, 0.891357421875, 1.1953125, 1.499267578125, 1.80322265625, 2.107177734375, 2.4111328125, 2.715087890625, 3.01904296875, 3.322998046875, 3.626953125, 3.930908203125, 4.23486328125, 4.538818359375, 4.8427734375, 5.146728515625, 5.45068359375, 5.754638671875, 6.05859375, 6.362548828125, 6.66650390625, 6.970458984375, 7.2744140625, 7.578369140625, 7.88232421875, 8.186279296875, 8.490234375, 8.794189453125, 9.09814453125, 9.402099609375, 9.7060546875, 10.010009765625, 10.31396484375, 10.617919921875, 10.921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 11.0, 9.0, 19.0, 28.0, 35.0, 51.0, 85.0, 144.0, 293.0, 607.0, 1395.0, 611.0, 293.0, 162.0, 98.0, 71.0, 49.0, 28.0, 24.0, 10.0, 6.0, 11.0, 2.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.61328125, -2.524810791015625, -2.43634033203125, -2.347869873046875, -2.2593994140625, -2.170928955078125, -2.08245849609375, -1.993988037109375, -1.905517578125, -1.817047119140625, -1.72857666015625, -1.640106201171875, -1.5516357421875, -1.463165283203125, -1.37469482421875, -1.286224365234375, -1.19775390625, -1.109283447265625, -1.02081298828125, -0.932342529296875, -0.8438720703125, -0.755401611328125, -0.66693115234375, -0.578460693359375, -0.489990234375, -0.401519775390625, -0.31304931640625, -0.224578857421875, -0.1361083984375, -0.047637939453125, 0.04083251953125, 0.129302978515625, 0.2177734375, 0.306243896484375, 0.39471435546875, 0.483184814453125, 0.5716552734375, 0.660125732421875, 0.74859619140625, 0.837066650390625, 0.925537109375, 1.014007568359375, 1.10247802734375, 1.190948486328125, 1.2794189453125, 1.367889404296875, 1.45635986328125, 1.544830322265625, 1.63330078125, 1.721771240234375, 1.81024169921875, 1.898712158203125, 1.9871826171875, 2.075653076171875, 2.16412353515625, 2.252593994140625, 2.341064453125, 2.429534912109375, 2.51800537109375, 2.606475830078125, 2.6949462890625, 2.783416748046875, 2.87188720703125, 2.960357666015625, 3.048828125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 19.0, 62.0, 138.0, 261.0, 238.0, 141.0, 86.0, 26.0, 16.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.851215362548828, -21.765907287597656, -20.680599212646484, -19.595291137695312, -18.50998306274414, -17.42467498779297, -16.339366912841797, -15.254059791564941, -14.16875171661377, -13.083443641662598, -11.998135566711426, -10.91282844543457, -9.827520370483398, -8.742212295532227, -7.656904220581055, -6.571596145629883, -5.486288070678711, -4.400979995727539, -3.3156721591949463, -2.2303643226623535, -1.1450562477111816, -0.059748172760009766, 1.025559425354004, 2.110867500305176, 3.1961755752563477, 4.2814836502075195, 5.366791725158691, 6.452099323272705, 7.537407398223877, 8.62271499633789, 9.708023071289062, 10.793331146240234, 11.878639221191406, 12.963947296142578, 14.04925537109375, 15.134563446044922, 16.219871520996094, 17.305179595947266, 18.390487670898438, 19.47579574584961, 20.56110382080078, 21.646411895751953, 22.731719970703125, 23.817028045654297, 24.90233612060547, 25.98764419555664, 27.072952270507812, 28.158260345458984, 29.243566513061523, 30.328874588012695, 31.414182662963867, 32.499488830566406, 33.58479690551758, 34.67010498046875, 35.75541305541992, 36.840721130371094, 37.926029205322266, 39.01133728027344, 40.09664535522461, 41.18195343017578, 42.26726150512695, 43.352569580078125, 44.4378776550293, 45.52318572998047, 46.60849380493164]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 7.0, 3.0, 7.0, 9.0, 9.0, 5.0, 11.0, 5.0, 11.0, 23.0, 19.0, 24.0, 21.0, 23.0, 24.0, 48.0, 37.0, 48.0, 37.0, 48.0, 44.0, 52.0, 44.0, 46.0, 36.0, 53.0, 39.0, 31.0, 23.0, 32.0, 32.0, 21.0, 29.0, 18.0, 18.0, 17.0, 12.0, 16.0, 7.0, 8.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.54950475692749, -7.269668102264404, -6.98983097076416, -6.709994316101074, -6.430157661437988, -6.150321006774902, -5.870484352111816, -5.590647220611572, -5.310810565948486, -5.0309739112854, -4.751136779785156, -4.47130012512207, -4.191463470458984, -3.9116268157958984, -3.6317899227142334, -3.3519530296325684, -3.0721163749694824, -2.7922797203063965, -2.5124428272247314, -2.2326059341430664, -1.9527692794799805, -1.672932505607605, -1.3930957317352295, -1.113258957862854, -0.8334221839904785, -0.553585410118103, -0.27374863624572754, 0.006088137626647949, 0.28592491149902344, 0.5657616853713989, 0.8455984592437744, 1.12543523311615, 1.4052715301513672, 1.6851083040237427, 1.9649450778961182, 2.244781970977783, 2.524618625640869, 2.804455280303955, 3.08429217338562, 3.364129066467285, 3.643965721130371, 3.923802375793457, 4.203639030456543, 4.483476161956787, 4.763312816619873, 5.043149471282959, 5.322986602783203, 5.602823257446289, 5.882659912109375, 6.162496566772461, 6.442333221435547, 6.722170352935791, 7.002007007598877, 7.281843662261963, 7.561680793762207, 7.841517448425293, 8.121354103088379, 8.401190757751465, 8.68102741241455, 8.960864067077637, 9.240701675415039, 9.520538330078125, 9.800374984741211, 10.080211639404297, 10.360048294067383]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 10.0, 11.0, 11.0, 14.0, 19.0, 34.0, 38.0, 73.0, 113.0, 168.0, 216.0, 434.0, 721.0, 1225.0, 2290.0, 4469.0, 8852.0, 18305.0, 38666.0, 86628.0, 270408.0, 401411.0, 118290.0, 49881.0, 22944.0, 11128.0, 5542.0, 2805.0, 1546.0, 862.0, 541.0, 347.0, 189.0, 103.0, 86.0, 48.0, 30.0, 29.0, 14.0, 16.0, 12.0, 8.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.42578125, -4.279052734375, -4.13232421875, -3.985595703125, -3.8388671875, -3.692138671875, -3.54541015625, -3.398681640625, -3.251953125, -3.105224609375, -2.95849609375, -2.811767578125, -2.6650390625, -2.518310546875, -2.37158203125, -2.224853515625, -2.078125, -1.931396484375, -1.78466796875, -1.637939453125, -1.4912109375, -1.344482421875, -1.19775390625, -1.051025390625, -0.904296875, -0.757568359375, -0.61083984375, -0.464111328125, -0.3173828125, -0.170654296875, -0.02392578125, 0.122802734375, 0.26953125, 0.416259765625, 0.56298828125, 0.709716796875, 0.8564453125, 1.003173828125, 1.14990234375, 1.296630859375, 1.443359375, 1.590087890625, 1.73681640625, 1.883544921875, 2.0302734375, 2.177001953125, 2.32373046875, 2.470458984375, 2.6171875, 2.763916015625, 2.91064453125, 3.057373046875, 3.2041015625, 3.350830078125, 3.49755859375, 3.644287109375, 3.791015625, 3.937744140625, 4.08447265625, 4.231201171875, 4.3779296875, 4.524658203125, 4.67138671875, 4.818115234375, 4.96484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 12.0, 12.0, 20.0, 14.0, 23.0, 22.0, 25.0, 35.0, 31.0, 36.0, 54.0, 51.0, 35.0, 55.0, 57.0, 52.0, 60.0, 60.0, 43.0, 44.0, 35.0, 34.0, 31.0, 28.0, 28.0, 19.0, 13.0, 11.0, 14.0, 8.0, 6.0, 6.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.1494140625, -1.1174163818359375, -1.085418701171875, -1.0534210205078125, -1.02142333984375, -0.9894256591796875, -0.957427978515625, -0.9254302978515625, -0.8934326171875, -0.8614349365234375, -0.829437255859375, -0.7974395751953125, -0.76544189453125, -0.7334442138671875, -0.701446533203125, -0.6694488525390625, -0.637451171875, -0.6054534912109375, -0.573455810546875, -0.5414581298828125, -0.50946044921875, -0.4774627685546875, -0.445465087890625, -0.4134674072265625, -0.3814697265625, -0.3494720458984375, -0.317474365234375, -0.2854766845703125, -0.25347900390625, -0.2214813232421875, -0.189483642578125, -0.1574859619140625, -0.12548828125, -0.0934906005859375, -0.061492919921875, -0.0294952392578125, 0.00250244140625, 0.0345001220703125, 0.066497802734375, 0.0984954833984375, 0.1304931640625, 0.1624908447265625, 0.194488525390625, 0.2264862060546875, 0.25848388671875, 0.2904815673828125, 0.322479248046875, 0.3544769287109375, 0.386474609375, 0.4184722900390625, 0.450469970703125, 0.4824676513671875, 0.51446533203125, 0.5464630126953125, 0.578460693359375, 0.6104583740234375, 0.6424560546875, 0.6744537353515625, 0.706451416015625, 0.7384490966796875, 0.77044677734375, 0.8024444580078125, 0.834442138671875, 0.8664398193359375, 0.8984375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 3.0, 8.0, 3.0, 4.0, 10.0, 13.0, 18.0, 33.0, 37.0, 46.0, 51.0, 69.0, 123.0, 160.0, 245.0, 421.0, 740.0, 1491.0, 4641.0, 18195.0, 89510.0, 691646.0, 195544.0, 33179.0, 7557.0, 2367.0, 965.0, 502.0, 321.0, 204.0, 114.0, 86.0, 71.0, 50.0, 31.0, 26.0, 18.0, 16.0, 17.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.84375, -7.5704345703125, -7.297119140625, -7.0238037109375, -6.75048828125, -6.4771728515625, -6.203857421875, -5.9305419921875, -5.6572265625, -5.3839111328125, -5.110595703125, -4.8372802734375, -4.56396484375, -4.2906494140625, -4.017333984375, -3.7440185546875, -3.470703125, -3.1973876953125, -2.924072265625, -2.6507568359375, -2.37744140625, -2.1041259765625, -1.830810546875, -1.5574951171875, -1.2841796875, -1.0108642578125, -0.737548828125, -0.4642333984375, -0.19091796875, 0.0823974609375, 0.355712890625, 0.6290283203125, 0.90234375, 1.1756591796875, 1.448974609375, 1.7222900390625, 1.99560546875, 2.2689208984375, 2.542236328125, 2.8155517578125, 3.0888671875, 3.3621826171875, 3.635498046875, 3.9088134765625, 4.18212890625, 4.4554443359375, 4.728759765625, 5.0020751953125, 5.275390625, 5.5487060546875, 5.822021484375, 6.0953369140625, 6.36865234375, 6.6419677734375, 6.915283203125, 7.1885986328125, 7.4619140625, 7.7352294921875, 8.008544921875, 8.2818603515625, 8.55517578125, 8.8284912109375, 9.101806640625, 9.3751220703125, 9.6484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 8.0, 16.0, 7.0, 14.0, 12.0, 14.0, 16.0, 16.0, 30.0, 37.0, 38.0, 35.0, 32.0, 47.0, 50.0, 47.0, 37.0, 44.0, 41.0, 47.0, 39.0, 38.0, 44.0, 34.0, 28.0, 28.0, 26.0, 29.0, 17.0, 20.0, 17.0, 4.0, 24.0, 10.0, 10.0, 7.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.98046875, -3.85498046875, -3.7294921875, -3.60400390625, -3.478515625, -3.35302734375, -3.2275390625, -3.10205078125, -2.9765625, -2.85107421875, -2.7255859375, -2.60009765625, -2.474609375, -2.34912109375, -2.2236328125, -2.09814453125, -1.97265625, -1.84716796875, -1.7216796875, -1.59619140625, -1.470703125, -1.34521484375, -1.2197265625, -1.09423828125, -0.96875, -0.84326171875, -0.7177734375, -0.59228515625, -0.466796875, -0.34130859375, -0.2158203125, -0.09033203125, 0.03515625, 0.16064453125, 0.2861328125, 0.41162109375, 0.537109375, 0.66259765625, 0.7880859375, 0.91357421875, 1.0390625, 1.16455078125, 1.2900390625, 1.41552734375, 1.541015625, 1.66650390625, 1.7919921875, 1.91748046875, 2.04296875, 2.16845703125, 2.2939453125, 2.41943359375, 2.544921875, 2.67041015625, 2.7958984375, 2.92138671875, 3.046875, 3.17236328125, 3.2978515625, 3.42333984375, 3.548828125, 3.67431640625, 3.7998046875, 3.92529296875, 4.05078125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 8.0, 4.0, 7.0, 8.0, 9.0, 16.0, 10.0, 22.0, 30.0, 35.0, 52.0, 76.0, 127.0, 177.0, 261.0, 559.0, 1400.0, 4191.0, 16103.0, 93310.0, 831941.0, 79513.0, 14163.0, 3758.0, 1411.0, 561.0, 289.0, 150.0, 112.0, 80.0, 38.0, 35.0, 22.0, 24.0, 15.0, 8.0, 8.0, 8.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30078125, -7.06109619140625, -6.8214111328125, -6.58172607421875, -6.342041015625, -6.10235595703125, -5.8626708984375, -5.62298583984375, -5.38330078125, -5.14361572265625, -4.9039306640625, -4.66424560546875, -4.424560546875, -4.18487548828125, -3.9451904296875, -3.70550537109375, -3.4658203125, -3.22613525390625, -2.9864501953125, -2.74676513671875, -2.507080078125, -2.26739501953125, -2.0277099609375, -1.78802490234375, -1.54833984375, -1.30865478515625, -1.0689697265625, -0.82928466796875, -0.589599609375, -0.34991455078125, -0.1102294921875, 0.12945556640625, 0.369140625, 0.60882568359375, 0.8485107421875, 1.08819580078125, 1.327880859375, 1.56756591796875, 1.8072509765625, 2.04693603515625, 2.28662109375, 2.52630615234375, 2.7659912109375, 3.00567626953125, 3.245361328125, 3.48504638671875, 3.7247314453125, 3.96441650390625, 4.2041015625, 4.44378662109375, 4.6834716796875, 4.92315673828125, 5.162841796875, 5.40252685546875, 5.6422119140625, 5.88189697265625, 6.12158203125, 6.36126708984375, 6.6009521484375, 6.84063720703125, 7.080322265625, 7.32000732421875, 7.5596923828125, 7.79937744140625, 8.0390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 7.0, 20.0, 22.0, 31.0, 33.0, 75.0, 256.0, 326.0, 74.0, 37.0, 28.0, 22.0, 13.0, 8.0, 12.0, 4.0, 6.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0017728805541992188, -0.0017297565937042236, -0.0016866326332092285, -0.0016435086727142334, -0.0016003847122192383, -0.0015572607517242432, -0.001514136791229248, -0.001471012830734253, -0.0014278888702392578, -0.0013847649097442627, -0.0013416409492492676, -0.0012985169887542725, -0.0012553930282592773, -0.0012122690677642822, -0.0011691451072692871, -0.001126021146774292, -0.0010828971862792969, -0.0010397732257843018, -0.0009966492652893066, -0.0009535253047943115, -0.0009104013442993164, -0.0008672773838043213, -0.0008241534233093262, -0.0007810294628143311, -0.0007379055023193359, -0.0006947815418243408, -0.0006516575813293457, -0.0006085336208343506, -0.0005654096603393555, -0.0005222856998443604, -0.00047916173934936523, -0.0004360377788543701, -0.000392913818359375, -0.0003497898578643799, -0.00030666589736938477, -0.00026354193687438965, -0.00022041797637939453, -0.00017729401588439941, -0.0001341700553894043, -9.104609489440918e-05, -4.792213439941406e-05, -4.798173904418945e-06, 3.832578659057617e-05, 8.144974708557129e-05, 0.0001245737075805664, 0.00016769766807556152, 0.00021082162857055664, 0.00025394558906555176, 0.0002970695495605469, 0.000340193510055542, 0.0003833174705505371, 0.0004264414310455322, 0.00046956539154052734, 0.0005126893520355225, 0.0005558133125305176, 0.0005989372730255127, 0.0006420612335205078, 0.0006851851940155029, 0.000728309154510498, 0.0007714331150054932, 0.0008145570755004883, 0.0008576810359954834, 0.0009008049964904785, 0.0009439289569854736, 0.0009870529174804688]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 6.0, 9.0, 11.0, 7.0, 9.0, 18.0, 31.0, 50.0, 66.0, 118.0, 234.0, 516.0, 1578.0, 6026.0, 39483.0, 919484.0, 68842.0, 8640.0, 2133.0, 636.0, 276.0, 143.0, 59.0, 47.0, 34.0, 24.0, 17.0, 15.0, 12.0, 5.0, 1.0, 4.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-12.8203125, -12.3873291015625, -11.954345703125, -11.5213623046875, -11.08837890625, -10.6553955078125, -10.222412109375, -9.7894287109375, -9.3564453125, -8.9234619140625, -8.490478515625, -8.0574951171875, -7.62451171875, -7.1915283203125, -6.758544921875, -6.3255615234375, -5.892578125, -5.4595947265625, -5.026611328125, -4.5936279296875, -4.16064453125, -3.7276611328125, -3.294677734375, -2.8616943359375, -2.4287109375, -1.9957275390625, -1.562744140625, -1.1297607421875, -0.69677734375, -0.2637939453125, 0.169189453125, 0.6021728515625, 1.03515625, 1.4681396484375, 1.901123046875, 2.3341064453125, 2.76708984375, 3.2000732421875, 3.633056640625, 4.0660400390625, 4.4990234375, 4.9320068359375, 5.364990234375, 5.7979736328125, 6.23095703125, 6.6639404296875, 7.096923828125, 7.5299072265625, 7.962890625, 8.3958740234375, 8.828857421875, 9.2618408203125, 9.69482421875, 10.1278076171875, 10.560791015625, 10.9937744140625, 11.4267578125, 11.8597412109375, 12.292724609375, 12.7257080078125, 13.15869140625, 13.5916748046875, 14.024658203125, 14.4576416015625, 14.890625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 5.0, 9.0, 10.0, 5.0, 14.0, 20.0, 13.0, 25.0, 39.0, 96.0, 287.0, 226.0, 83.0, 28.0, 28.0, 14.0, 15.0, 9.0, 12.0, 9.0, 4.0, 7.0, 6.0, 3.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.6171875, -4.46246337890625, -4.3077392578125, -4.15301513671875, -3.998291015625, -3.84356689453125, -3.6888427734375, -3.53411865234375, -3.37939453125, -3.22467041015625, -3.0699462890625, -2.91522216796875, -2.760498046875, -2.60577392578125, -2.4510498046875, -2.29632568359375, -2.1416015625, -1.98687744140625, -1.8321533203125, -1.67742919921875, -1.522705078125, -1.36798095703125, -1.2132568359375, -1.05853271484375, -0.90380859375, -0.74908447265625, -0.5943603515625, -0.43963623046875, -0.284912109375, -0.13018798828125, 0.0245361328125, 0.17926025390625, 0.333984375, 0.48870849609375, 0.6434326171875, 0.79815673828125, 0.952880859375, 1.10760498046875, 1.2623291015625, 1.41705322265625, 1.57177734375, 1.72650146484375, 1.8812255859375, 2.03594970703125, 2.190673828125, 2.34539794921875, 2.5001220703125, 2.65484619140625, 2.8095703125, 2.96429443359375, 3.1190185546875, 3.27374267578125, 3.428466796875, 3.58319091796875, 3.7379150390625, 3.89263916015625, 4.04736328125, 4.20208740234375, 4.3568115234375, 4.51153564453125, 4.666259765625, 4.82098388671875, 4.9757080078125, 5.13043212890625, 5.28515625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 19.0, 69.0, 262.0, 369.0, 201.0, 59.0, 10.0, 8.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-102.44647216796875, -98.25128936767578, -94.05610656738281, -89.86093139648438, -85.6657485961914, -81.47056579589844, -77.27538299560547, -73.0802001953125, -68.88502502441406, -64.6898422241211, -60.49466323852539, -56.29948043823242, -52.10430145263672, -47.90911865234375, -43.71393585205078, -39.51875305175781, -35.323570251464844, -31.128389358520508, -26.933208465576172, -22.738025665283203, -18.542844772338867, -14.347663879394531, -10.152481079101562, -5.957300186157227, -1.7621192932128906, 2.4330620765686035, 6.628243446350098, 10.82342529296875, 15.018606185913086, 19.213787078857422, 23.40896987915039, 27.604150772094727, 31.799331665039062, 35.99451446533203, 40.189693450927734, 44.3848762512207, 48.580055236816406, 52.775238037109375, 56.970420837402344, 61.16560363769531, 65.36077880859375, 69.55596160888672, 73.75114440917969, 77.94631958007812, 82.1415023803711, 86.33668518066406, 90.53186798095703, 94.72705078125, 98.92223358154297, 103.11741638183594, 107.3125991821289, 111.50778198242188, 115.70295715332031, 119.89813995361328, 124.09332275390625, 128.2884979248047, 132.4836883544922, 136.67886352539062, 140.87405395507812, 145.06922912597656, 149.26441955566406, 153.4595947265625, 157.65478515625, 161.84996032714844, 166.04513549804688]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 2.0, 8.0, 9.0, 4.0, 6.0, 6.0, 17.0, 15.0, 15.0, 22.0, 12.0, 21.0, 29.0, 28.0, 35.0, 33.0, 36.0, 53.0, 54.0, 48.0, 47.0, 48.0, 37.0, 46.0, 61.0, 44.0, 32.0, 45.0, 32.0, 31.0, 18.0, 17.0, 19.0, 16.0, 14.0, 2.0, 9.0, 11.0, 5.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-24.40401840209961, -23.63626480102539, -22.868513107299805, -22.100759506225586, -21.333005905151367, -20.56525421142578, -19.797500610351562, -19.029747009277344, -18.261993408203125, -17.494239807128906, -16.72648811340332, -15.958734512329102, -15.190980911254883, -14.42322826385498, -13.655475616455078, -12.88772201538086, -12.119970321655273, -11.352217674255371, -10.584464073181152, -9.81671142578125, -9.048957824707031, -8.281205177307129, -7.513452529907227, -6.745699405670166, -5.9779462814331055, -5.210193157196045, -4.442440032958984, -3.674687385559082, -2.9069342613220215, -2.139181137084961, -1.3714284896850586, -0.603675365447998, 0.1640777587890625, 0.9318307638168335, 1.6995837688446045, 2.467336654663086, 3.2350897789001465, 4.002842903137207, 4.770595550537109, 5.53834867477417, 6.3061017990112305, 7.073854923248291, 7.841608047485352, 8.609360694885254, 9.377113342285156, 10.144866943359375, 10.912619590759277, 11.68037223815918, 12.448125839233398, 13.2158784866333, 13.98363208770752, 14.751384735107422, 15.51913833618164, 16.28689193725586, 17.054643630981445, 17.822397232055664, 18.59014892578125, 19.35790252685547, 20.125654220581055, 20.893407821655273, 21.661161422729492, 22.428913116455078, 23.196666717529297, 23.964420318603516, 24.732173919677734]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 8.0, 9.0, 4.0, 10.0, 12.0, 13.0, 27.0, 32.0, 51.0, 79.0, 106.0, 205.0, 405.0, 986.0, 2660.0, 8542.0, 35243.0, 336371.0, 3671665.0, 110307.0, 18945.0, 5408.0, 1857.0, 680.0, 287.0, 137.0, 83.0, 51.0, 39.0, 18.0, 11.0, 15.0, 9.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-13.4296875, -13.096435546875, -12.76318359375, -12.429931640625, -12.0966796875, -11.763427734375, -11.43017578125, -11.096923828125, -10.763671875, -10.430419921875, -10.09716796875, -9.763916015625, -9.4306640625, -9.097412109375, -8.76416015625, -8.430908203125, -8.09765625, -7.764404296875, -7.43115234375, -7.097900390625, -6.7646484375, -6.431396484375, -6.09814453125, -5.764892578125, -5.431640625, -5.098388671875, -4.76513671875, -4.431884765625, -4.0986328125, -3.765380859375, -3.43212890625, -3.098876953125, -2.765625, -2.432373046875, -2.09912109375, -1.765869140625, -1.4326171875, -1.099365234375, -0.76611328125, -0.432861328125, -0.099609375, 0.233642578125, 0.56689453125, 0.900146484375, 1.2333984375, 1.566650390625, 1.89990234375, 2.233154296875, 2.56640625, 2.899658203125, 3.23291015625, 3.566162109375, 3.8994140625, 4.232666015625, 4.56591796875, 4.899169921875, 5.232421875, 5.565673828125, 5.89892578125, 6.232177734375, 6.5654296875, 6.898681640625, 7.23193359375, 7.565185546875, 7.8984375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 9.0, 14.0, 14.0, 21.0, 20.0, 19.0, 21.0, 32.0, 29.0, 45.0, 38.0, 45.0, 43.0, 49.0, 47.0, 60.0, 48.0, 50.0, 55.0, 53.0, 41.0, 35.0, 46.0, 29.0, 23.0, 23.0, 24.0, 15.0, 15.0, 10.0, 9.0, 6.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.34765625, -1.3109817504882812, -1.2743072509765625, -1.2376327514648438, -1.200958251953125, -1.1642837524414062, -1.1276092529296875, -1.0909347534179688, -1.05426025390625, -1.0175857543945312, -0.9809112548828125, -0.9442367553710938, -0.907562255859375, -0.8708877563476562, -0.8342132568359375, -0.7975387573242188, -0.7608642578125, -0.7241897583007812, -0.6875152587890625, -0.6508407592773438, -0.614166259765625, -0.5774917602539062, -0.5408172607421875, -0.5041427612304688, -0.46746826171875, -0.43079376220703125, -0.3941192626953125, -0.35744476318359375, -0.320770263671875, -0.28409576416015625, -0.2474212646484375, -0.21074676513671875, -0.174072265625, -0.13739776611328125, -0.1007232666015625, -0.06404876708984375, -0.027374267578125, 0.00930023193359375, 0.0459747314453125, 0.08264923095703125, 0.11932373046875, 0.15599822998046875, 0.1926727294921875, 0.22934722900390625, 0.266021728515625, 0.30269622802734375, 0.3393707275390625, 0.37604522705078125, 0.4127197265625, 0.44939422607421875, 0.4860687255859375, 0.5227432250976562, 0.559417724609375, 0.5960922241210938, 0.6327667236328125, 0.6694412231445312, 0.70611572265625, 0.7427902221679688, 0.7794647216796875, 0.8161392211914062, 0.852813720703125, 0.8894882202148438, 0.9261627197265625, 0.9628372192382812, 0.99951171875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 8.0, 11.0, 14.0, 35.0, 45.0, 93.0, 208.0, 379.0, 850.0, 1792.0, 4300.0, 11662.0, 39859.0, 248379.0, 3440795.0, 372006.0, 50913.0, 13753.0, 5036.0, 2246.0, 939.0, 439.0, 241.0, 115.0, 67.0, 37.0, 11.0, 14.0, 11.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.1171875, -7.8890380859375, -7.660888671875, -7.4327392578125, -7.20458984375, -6.9764404296875, -6.748291015625, -6.5201416015625, -6.2919921875, -6.0638427734375, -5.835693359375, -5.6075439453125, -5.37939453125, -5.1512451171875, -4.923095703125, -4.6949462890625, -4.466796875, -4.2386474609375, -4.010498046875, -3.7823486328125, -3.55419921875, -3.3260498046875, -3.097900390625, -2.8697509765625, -2.6416015625, -2.4134521484375, -2.185302734375, -1.9571533203125, -1.72900390625, -1.5008544921875, -1.272705078125, -1.0445556640625, -0.81640625, -0.5882568359375, -0.360107421875, -0.1319580078125, 0.09619140625, 0.3243408203125, 0.552490234375, 0.7806396484375, 1.0087890625, 1.2369384765625, 1.465087890625, 1.6932373046875, 1.92138671875, 2.1495361328125, 2.377685546875, 2.6058349609375, 2.833984375, 3.0621337890625, 3.290283203125, 3.5184326171875, 3.74658203125, 3.9747314453125, 4.202880859375, 4.4310302734375, 4.6591796875, 4.8873291015625, 5.115478515625, 5.3436279296875, 5.57177734375, 5.7999267578125, 6.028076171875, 6.2562255859375, 6.484375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 8.0, 6.0, 18.0, 28.0, 19.0, 43.0, 63.0, 107.0, 148.0, 281.0, 648.0, 1443.0, 546.0, 267.0, 149.0, 93.0, 47.0, 36.0, 22.0, 17.0, 15.0, 4.0, 11.0, 6.0, 4.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.3515625, -2.271514892578125, -2.19146728515625, -2.111419677734375, -2.0313720703125, -1.951324462890625, -1.87127685546875, -1.791229248046875, -1.711181640625, -1.631134033203125, -1.55108642578125, -1.471038818359375, -1.3909912109375, -1.310943603515625, -1.23089599609375, -1.150848388671875, -1.07080078125, -0.990753173828125, -0.91070556640625, -0.830657958984375, -0.7506103515625, -0.670562744140625, -0.59051513671875, -0.510467529296875, -0.430419921875, -0.350372314453125, -0.27032470703125, -0.190277099609375, -0.1102294921875, -0.030181884765625, 0.04986572265625, 0.129913330078125, 0.2099609375, 0.290008544921875, 0.37005615234375, 0.450103759765625, 0.5301513671875, 0.610198974609375, 0.69024658203125, 0.770294189453125, 0.850341796875, 0.930389404296875, 1.01043701171875, 1.090484619140625, 1.1705322265625, 1.250579833984375, 1.33062744140625, 1.410675048828125, 1.49072265625, 1.570770263671875, 1.65081787109375, 1.730865478515625, 1.8109130859375, 1.890960693359375, 1.97100830078125, 2.051055908203125, 2.131103515625, 2.211151123046875, 2.29119873046875, 2.371246337890625, 2.4512939453125, 2.531341552734375, 2.61138916015625, 2.691436767578125, 2.771484375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 7.0, 12.0, 32.0, 22.0, 68.0, 105.0, 145.0, 142.0, 166.0, 101.0, 94.0, 57.0, 32.0, 10.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.428987503051758, -12.814824104309082, -12.200661659240723, -11.586498260498047, -10.972335815429688, -10.358172416687012, -9.744009017944336, -9.129846572875977, -8.5156831741333, -7.901520252227783, -7.287357330322266, -6.67319393157959, -6.059031009674072, -5.444868087768555, -4.830704689025879, -4.216541767120361, -3.6023788452148438, -2.988215923309326, -2.3740527629852295, -1.7598897218704224, -1.1457266807556152, -0.5315637588500977, 0.08259940147399902, 0.6967625617980957, 1.3109254837036133, 1.9250885248184204, 2.5392515659332275, 3.153414726257324, 3.767577648162842, 4.381740570068359, 4.995903968811035, 5.610066890716553, 6.2242279052734375, 6.838390827178955, 7.452553749084473, 8.066717147827148, 8.680879592895508, 9.295042991638184, 9.90920639038086, 10.523368835449219, 11.137532234191895, 11.75169563293457, 12.36585807800293, 12.980021476745605, 13.594184875488281, 14.20834732055664, 14.822510719299316, 15.436674118041992, 16.05083656311035, 16.66499900817871, 17.279163360595703, 17.893325805664062, 18.507488250732422, 19.12165069580078, 19.735815048217773, 20.349977493286133, 20.964141845703125, 21.578304290771484, 22.192468643188477, 22.806631088256836, 23.420793533325195, 24.034957885742188, 24.649120330810547, 25.263282775878906, 25.877445220947266]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 7.0, 11.0, 13.0, 9.0, 24.0, 18.0, 28.0, 25.0, 38.0, 48.0, 37.0, 46.0, 61.0, 50.0, 48.0, 46.0, 58.0, 62.0, 47.0, 46.0, 34.0, 43.0, 26.0, 37.0, 22.0, 23.0, 21.0, 13.0, 16.0, 10.0, 9.0, 6.0, 2.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-12.060491561889648, -11.74626636505127, -11.43204116821289, -11.117815971374512, -10.803590774536133, -10.489365577697754, -10.175140380859375, -9.860915184020996, -9.546689987182617, -9.232464790344238, -8.91823959350586, -8.60401439666748, -8.289789199829102, -7.975564002990723, -7.661338806152344, -7.347113609313965, -7.032888412475586, -6.718663215637207, -6.404438018798828, -6.090212821960449, -5.77598762512207, -5.461762428283691, -5.1475372314453125, -4.833312034606934, -4.519086837768555, -4.204861640930176, -3.890636444091797, -3.576411247253418, -3.262186050415039, -2.94796085357666, -2.6337356567382812, -2.3195104598999023, -2.005284309387207, -1.6910591125488281, -1.3768339157104492, -1.0626087188720703, -0.7483835220336914, -0.4341583251953125, -0.1199331283569336, 0.1942920684814453, 0.5085172653198242, 0.8227424621582031, 1.136967658996582, 1.451192855834961, 1.7654180526733398, 2.0796432495117188, 2.3938684463500977, 2.7080936431884766, 3.0223188400268555, 3.3365440368652344, 3.6507692337036133, 3.964994430541992, 4.279219627380371, 4.59344482421875, 4.907670021057129, 5.221895217895508, 5.536120414733887, 5.850345611572266, 6.1645708084106445, 6.478796005249023, 6.793021202087402, 7.107246398925781, 7.42147159576416, 7.735696792602539, 8.049921989440918]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 13.0, 15.0, 17.0, 24.0, 36.0, 49.0, 75.0, 89.0, 155.0, 240.0, 460.0, 902.0, 2091.0, 5510.0, 15214.0, 42553.0, 137521.0, 532502.0, 217915.0, 59354.0, 20842.0, 7518.0, 2841.0, 1191.0, 571.0, 297.0, 171.0, 115.0, 84.0, 56.0, 36.0, 24.0, 22.0, 9.0, 9.0, 9.0, 6.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-6.828125, -6.64678955078125, -6.4654541015625, -6.28411865234375, -6.102783203125, -5.92144775390625, -5.7401123046875, -5.55877685546875, -5.37744140625, -5.19610595703125, -5.0147705078125, -4.83343505859375, -4.652099609375, -4.47076416015625, -4.2894287109375, -4.10809326171875, -3.9267578125, -3.74542236328125, -3.5640869140625, -3.38275146484375, -3.201416015625, -3.02008056640625, -2.8387451171875, -2.65740966796875, -2.47607421875, -2.29473876953125, -2.1134033203125, -1.93206787109375, -1.750732421875, -1.56939697265625, -1.3880615234375, -1.20672607421875, -1.025390625, -0.84405517578125, -0.6627197265625, -0.48138427734375, -0.300048828125, -0.11871337890625, 0.0626220703125, 0.24395751953125, 0.42529296875, 0.60662841796875, 0.7879638671875, 0.96929931640625, 1.150634765625, 1.33197021484375, 1.5133056640625, 1.69464111328125, 1.8759765625, 2.05731201171875, 2.2386474609375, 2.41998291015625, 2.601318359375, 2.78265380859375, 2.9639892578125, 3.14532470703125, 3.32666015625, 3.50799560546875, 3.6893310546875, 3.87066650390625, 4.052001953125, 4.23333740234375, 4.4146728515625, 4.59600830078125, 4.77734375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 5.0, 10.0, 9.0, 13.0, 15.0, 21.0, 20.0, 24.0, 25.0, 24.0, 33.0, 43.0, 41.0, 44.0, 55.0, 44.0, 51.0, 44.0, 52.0, 60.0, 49.0, 35.0, 46.0, 39.0, 22.0, 43.0, 25.0, 31.0, 13.0, 16.0, 15.0, 9.0, 9.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3310546875, -1.293182373046875, -1.25531005859375, -1.217437744140625, -1.1795654296875, -1.141693115234375, -1.10382080078125, -1.065948486328125, -1.028076171875, -0.990203857421875, -0.95233154296875, -0.914459228515625, -0.8765869140625, -0.838714599609375, -0.80084228515625, -0.762969970703125, -0.72509765625, -0.687225341796875, -0.64935302734375, -0.611480712890625, -0.5736083984375, -0.535736083984375, -0.49786376953125, -0.459991455078125, -0.422119140625, -0.384246826171875, -0.34637451171875, -0.308502197265625, -0.2706298828125, -0.232757568359375, -0.19488525390625, -0.157012939453125, -0.119140625, -0.081268310546875, -0.04339599609375, -0.005523681640625, 0.0323486328125, 0.070220947265625, 0.10809326171875, 0.145965576171875, 0.183837890625, 0.221710205078125, 0.25958251953125, 0.297454833984375, 0.3353271484375, 0.373199462890625, 0.41107177734375, 0.448944091796875, 0.48681640625, 0.524688720703125, 0.56256103515625, 0.600433349609375, 0.6383056640625, 0.676177978515625, 0.71405029296875, 0.751922607421875, 0.789794921875, 0.827667236328125, 0.86553955078125, 0.903411865234375, 0.9412841796875, 0.979156494140625, 1.01702880859375, 1.054901123046875, 1.0927734375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 7.0, 17.0, 18.0, 16.0, 20.0, 36.0, 46.0, 68.0, 105.0, 173.0, 310.0, 768.0, 1843.0, 6078.0, 20914.0, 88093.0, 698356.0, 183571.0, 34056.0, 9230.0, 2770.0, 1015.0, 418.0, 233.0, 130.0, 64.0, 61.0, 37.0, 31.0, 14.0, 12.0, 10.0, 8.0, 1.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.640625, -8.3914794921875, -8.142333984375, -7.8931884765625, -7.64404296875, -7.3948974609375, -7.145751953125, -6.8966064453125, -6.6474609375, -6.3983154296875, -6.149169921875, -5.9000244140625, -5.65087890625, -5.4017333984375, -5.152587890625, -4.9034423828125, -4.654296875, -4.4051513671875, -4.156005859375, -3.9068603515625, -3.65771484375, -3.4085693359375, -3.159423828125, -2.9102783203125, -2.6611328125, -2.4119873046875, -2.162841796875, -1.9136962890625, -1.66455078125, -1.4154052734375, -1.166259765625, -0.9171142578125, -0.66796875, -0.4188232421875, -0.169677734375, 0.0794677734375, 0.32861328125, 0.5777587890625, 0.826904296875, 1.0760498046875, 1.3251953125, 1.5743408203125, 1.823486328125, 2.0726318359375, 2.32177734375, 2.5709228515625, 2.820068359375, 3.0692138671875, 3.318359375, 3.5675048828125, 3.816650390625, 4.0657958984375, 4.31494140625, 4.5640869140625, 4.813232421875, 5.0623779296875, 5.3115234375, 5.5606689453125, 5.809814453125, 6.0589599609375, 6.30810546875, 6.5572509765625, 6.806396484375, 7.0555419921875, 7.3046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 5.0, 11.0, 4.0, 8.0, 15.0, 11.0, 15.0, 22.0, 23.0, 31.0, 47.0, 47.0, 51.0, 68.0, 66.0, 63.0, 69.0, 61.0, 57.0, 67.0, 32.0, 56.0, 42.0, 25.0, 17.0, 23.0, 5.0, 8.0, 14.0, 6.0, 10.0, 3.0, 4.0, 2.0, 6.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.24609375, -7.02703857421875, -6.8079833984375, -6.58892822265625, -6.369873046875, -6.15081787109375, -5.9317626953125, -5.71270751953125, -5.49365234375, -5.27459716796875, -5.0555419921875, -4.83648681640625, -4.617431640625, -4.39837646484375, -4.1793212890625, -3.96026611328125, -3.7412109375, -3.52215576171875, -3.3031005859375, -3.08404541015625, -2.864990234375, -2.64593505859375, -2.4268798828125, -2.20782470703125, -1.98876953125, -1.76971435546875, -1.5506591796875, -1.33160400390625, -1.112548828125, -0.89349365234375, -0.6744384765625, -0.45538330078125, -0.236328125, -0.01727294921875, 0.2017822265625, 0.42083740234375, 0.639892578125, 0.85894775390625, 1.0780029296875, 1.29705810546875, 1.51611328125, 1.73516845703125, 1.9542236328125, 2.17327880859375, 2.392333984375, 2.61138916015625, 2.8304443359375, 3.04949951171875, 3.2685546875, 3.48760986328125, 3.7066650390625, 3.92572021484375, 4.144775390625, 4.36383056640625, 4.5828857421875, 4.80194091796875, 5.02099609375, 5.24005126953125, 5.4591064453125, 5.67816162109375, 5.897216796875, 6.11627197265625, 6.3353271484375, 6.55438232421875, 6.7734375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 12.0, 13.0, 16.0, 22.0, 36.0, 60.0, 110.0, 217.0, 421.0, 1024.0, 3891.0, 21466.0, 154168.0, 779466.0, 72406.0, 11493.0, 2346.0, 724.0, 298.0, 145.0, 93.0, 51.0, 23.0, 24.0, 12.0, 10.0, 5.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7890625, -3.6451416015625, -3.501220703125, -3.3572998046875, -3.21337890625, -3.0694580078125, -2.925537109375, -2.7816162109375, -2.6376953125, -2.4937744140625, -2.349853515625, -2.2059326171875, -2.06201171875, -1.9180908203125, -1.774169921875, -1.6302490234375, -1.486328125, -1.3424072265625, -1.198486328125, -1.0545654296875, -0.91064453125, -0.7667236328125, -0.622802734375, -0.4788818359375, -0.3349609375, -0.1910400390625, -0.047119140625, 0.0968017578125, 0.24072265625, 0.3846435546875, 0.528564453125, 0.6724853515625, 0.81640625, 0.9603271484375, 1.104248046875, 1.2481689453125, 1.39208984375, 1.5360107421875, 1.679931640625, 1.8238525390625, 1.9677734375, 2.1116943359375, 2.255615234375, 2.3995361328125, 2.54345703125, 2.6873779296875, 2.831298828125, 2.9752197265625, 3.119140625, 3.2630615234375, 3.406982421875, 3.5509033203125, 3.69482421875, 3.8387451171875, 3.982666015625, 4.1265869140625, 4.2705078125, 4.4144287109375, 4.558349609375, 4.7022705078125, 4.84619140625, 4.9901123046875, 5.134033203125, 5.2779541015625, 5.421875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 10.0, 8.0, 3.0, 7.0, 8.0, 8.0, 17.0, 15.0, 18.0, 23.0, 53.0, 106.0, 228.0, 245.0, 91.0, 30.0, 29.0, 16.0, 10.0, 16.0, 8.0, 9.0, 8.0, 6.0, 2.0, 5.0, 6.0, 1.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005393028259277344, -0.0005184784531593323, -0.0004976540803909302, -0.0004768297076225281, -0.000456005334854126, -0.0004351809620857239, -0.0004143565893173218, -0.0003935322165489197, -0.0003727078437805176, -0.0003518834710121155, -0.0003310590982437134, -0.0003102347254753113, -0.0002894103527069092, -0.0002685859799385071, -0.000247761607170105, -0.00022693723440170288, -0.00020611286163330078, -0.00018528848886489868, -0.00016446411609649658, -0.00014363974332809448, -0.00012281537055969238, -0.00010199099779129028, -8.116662502288818e-05, -6.0342252254486084e-05, -3.9517879486083984e-05, -1.8693506717681885e-05, 2.130866050720215e-06, 2.2955238819122314e-05, 4.3779611587524414e-05, 6.460398435592651e-05, 8.542835712432861e-05, 0.00010625272989273071, 0.0001270771026611328, 0.0001479014754295349, 0.000168725848197937, 0.0001895502209663391, 0.0002103745937347412, 0.0002311989665031433, 0.0002520233392715454, 0.0002728477120399475, 0.0002936720848083496, 0.0003144964575767517, 0.0003353208303451538, 0.0003561452031135559, 0.000376969575881958, 0.0003977939486503601, 0.0004186183214187622, 0.0004394426941871643, 0.0004602670669555664, 0.0004810914397239685, 0.0005019158124923706, 0.0005227401852607727, 0.0005435645580291748, 0.0005643889307975769, 0.000585213303565979, 0.0006060376763343811, 0.0006268620491027832, 0.0006476864218711853, 0.0006685107946395874, 0.0006893351674079895, 0.0007101595401763916, 0.0007309839129447937, 0.0007518082857131958, 0.0007726326584815979, 0.00079345703125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 8.0, 8.0, 18.0, 32.0, 51.0, 89.0, 156.0, 322.0, 873.0, 3097.0, 17505.0, 150499.0, 800177.0, 63832.0, 8880.0, 1868.0, 600.0, 257.0, 124.0, 57.0, 37.0, 25.0, 13.0, 10.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.36328125, -4.2144775390625, -4.065673828125, -3.9168701171875, -3.76806640625, -3.6192626953125, -3.470458984375, -3.3216552734375, -3.1728515625, -3.0240478515625, -2.875244140625, -2.7264404296875, -2.57763671875, -2.4288330078125, -2.280029296875, -2.1312255859375, -1.982421875, -1.8336181640625, -1.684814453125, -1.5360107421875, -1.38720703125, -1.2384033203125, -1.089599609375, -0.9407958984375, -0.7919921875, -0.6431884765625, -0.494384765625, -0.3455810546875, -0.19677734375, -0.0479736328125, 0.100830078125, 0.2496337890625, 0.3984375, 0.5472412109375, 0.696044921875, 0.8448486328125, 0.99365234375, 1.1424560546875, 1.291259765625, 1.4400634765625, 1.5888671875, 1.7376708984375, 1.886474609375, 2.0352783203125, 2.18408203125, 2.3328857421875, 2.481689453125, 2.6304931640625, 2.779296875, 2.9281005859375, 3.076904296875, 3.2257080078125, 3.37451171875, 3.5233154296875, 3.672119140625, 3.8209228515625, 3.9697265625, 4.1185302734375, 4.267333984375, 4.4161376953125, 4.56494140625, 4.7137451171875, 4.862548828125, 5.0113525390625, 5.16015625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 4.0, 9.0, 8.0, 17.0, 13.0, 21.0, 23.0, 36.0, 50.0, 83.0, 139.0, 173.0, 129.0, 89.0, 62.0, 48.0, 35.0, 23.0, 13.0, 7.0, 8.0, 4.0, 2.0, 2.0, 8.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.33984375, -4.244781494140625, -4.14971923828125, -4.054656982421875, -3.9595947265625, -3.864532470703125, -3.76947021484375, -3.674407958984375, -3.579345703125, -3.484283447265625, -3.38922119140625, -3.294158935546875, -3.1990966796875, -3.104034423828125, -3.00897216796875, -2.913909912109375, -2.81884765625, -2.723785400390625, -2.62872314453125, -2.533660888671875, -2.4385986328125, -2.343536376953125, -2.24847412109375, -2.153411865234375, -2.058349609375, -1.963287353515625, -1.86822509765625, -1.773162841796875, -1.6781005859375, -1.583038330078125, -1.48797607421875, -1.392913818359375, -1.2978515625, -1.202789306640625, -1.10772705078125, -1.012664794921875, -0.9176025390625, -0.822540283203125, -0.72747802734375, -0.632415771484375, -0.537353515625, -0.442291259765625, -0.34722900390625, -0.252166748046875, -0.1571044921875, -0.062042236328125, 0.03302001953125, 0.128082275390625, 0.22314453125, 0.318206787109375, 0.41326904296875, 0.508331298828125, 0.6033935546875, 0.698455810546875, 0.79351806640625, 0.888580322265625, 0.983642578125, 1.078704833984375, 1.17376708984375, 1.268829345703125, 1.3638916015625, 1.458953857421875, 1.55401611328125, 1.649078369140625, 1.744140625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 13.0, 57.0, 151.0, 337.0, 267.0, 139.0, 32.0, 11.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.07796478271484, -63.710731506347656, -60.34349822998047, -56.97626495361328, -53.609031677246094, -50.241798400878906, -46.874568939208984, -43.5073356628418, -40.14010238647461, -36.77286911010742, -33.405635833740234, -30.03840446472168, -26.671171188354492, -23.303937911987305, -19.93670654296875, -16.569473266601562, -13.202239990234375, -9.835006713867188, -6.467774391174316, -3.1005420684814453, 0.2666912078857422, 3.6339244842529297, 7.001155853271484, 10.368389129638672, 13.73562240600586, 17.102855682373047, 20.470088958740234, 23.83732032775879, 27.204553604125977, 30.571786880493164, 33.93901824951172, 37.306251525878906, 40.673492431640625, 44.04072570800781, 47.407958984375, 50.77519226074219, 54.142425537109375, 57.50965881347656, 60.876888275146484, 64.24412536621094, 67.61135864257812, 70.97859191894531, 74.3458251953125, 77.71305847167969, 81.08029174804688, 84.44752502441406, 87.81475830078125, 91.18199157714844, 94.5492172241211, 97.91645050048828, 101.28368377685547, 104.65091705322266, 108.01815032958984, 111.38538360595703, 114.75260925292969, 118.11984252929688, 121.48707580566406, 124.85430908203125, 128.22154235839844, 131.58877563476562, 134.9560089111328, 138.3232421875, 141.6904754638672, 145.05770874023438, 148.42494201660156]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 6.0, 15.0, 8.0, 14.0, 18.0, 14.0, 22.0, 18.0, 25.0, 29.0, 35.0, 35.0, 38.0, 43.0, 36.0, 46.0, 38.0, 40.0, 44.0, 42.0, 44.0, 49.0, 49.0, 42.0, 22.0, 22.0, 28.0, 28.0, 27.0, 17.0, 18.0, 11.0, 14.0, 11.0, 8.0, 8.0, 5.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.784788131713867, -21.032203674316406, -20.279619216918945, -19.527034759521484, -18.774450302124023, -18.021865844726562, -17.2692813873291, -16.51669692993164, -15.76411247253418, -15.011528015136719, -14.258943557739258, -13.506359100341797, -12.753774642944336, -12.001190185546875, -11.248605728149414, -10.496021270751953, -9.743436813354492, -8.990852355957031, -8.23826789855957, -7.485683441162109, -6.733098983764648, -5.9805145263671875, -5.227930068969727, -4.475345611572266, -3.7227611541748047, -2.9701766967773438, -2.217592239379883, -1.4650077819824219, -0.7124233245849609, 0.0401611328125, 0.7927455902099609, 1.5453300476074219, 2.297914505004883, 3.0504989624023438, 3.8030834197998047, 4.555667877197266, 5.308252334594727, 6.0608367919921875, 6.813421249389648, 7.566005706787109, 8.31859016418457, 9.071174621582031, 9.823759078979492, 10.576343536376953, 11.328927993774414, 12.081512451171875, 12.834096908569336, 13.586681365966797, 14.339265823364258, 15.091850280761719, 15.84443473815918, 16.59701919555664, 17.3496036529541, 18.102188110351562, 18.854772567749023, 19.607357025146484, 20.359941482543945, 21.112525939941406, 21.865110397338867, 22.617694854736328, 23.37027931213379, 24.12286376953125, 24.87544822692871, 25.628032684326172, 26.380617141723633]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 10.0, 11.0, 27.0, 50.0, 75.0, 134.0, 294.0, 655.0, 2136.0, 8203.0, 42437.0, 602763.0, 3441978.0, 77694.0, 13125.0, 3134.0, 916.0, 329.0, 145.0, 71.0, 34.0, 23.0, 10.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8203125, -15.4056396484375, -14.990966796875, -14.5762939453125, -14.16162109375, -13.7469482421875, -13.332275390625, -12.9176025390625, -12.5029296875, -12.0882568359375, -11.673583984375, -11.2589111328125, -10.84423828125, -10.4295654296875, -10.014892578125, -9.6002197265625, -9.185546875, -8.7708740234375, -8.356201171875, -7.9415283203125, -7.52685546875, -7.1121826171875, -6.697509765625, -6.2828369140625, -5.8681640625, -5.4534912109375, -5.038818359375, -4.6241455078125, -4.20947265625, -3.7947998046875, -3.380126953125, -2.9654541015625, -2.55078125, -2.1361083984375, -1.721435546875, -1.3067626953125, -0.89208984375, -0.4774169921875, -0.062744140625, 0.3519287109375, 0.7666015625, 1.1812744140625, 1.595947265625, 2.0106201171875, 2.42529296875, 2.8399658203125, 3.254638671875, 3.6693115234375, 4.083984375, 4.4986572265625, 4.913330078125, 5.3280029296875, 5.74267578125, 6.1573486328125, 6.572021484375, 6.9866943359375, 7.4013671875, 7.8160400390625, 8.230712890625, 8.6453857421875, 9.06005859375, 9.4747314453125, 9.889404296875, 10.3040771484375, 10.71875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 11.0, 8.0, 13.0, 14.0, 21.0, 22.0, 21.0, 21.0, 33.0, 34.0, 33.0, 38.0, 45.0, 45.0, 49.0, 38.0, 52.0, 55.0, 40.0, 49.0, 44.0, 48.0, 39.0, 35.0, 30.0, 26.0, 17.0, 22.0, 18.0, 16.0, 15.0, 11.0, 3.0, 6.0, 2.0, 5.0, 4.0, 3.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.2939453125, -1.257659912109375, -1.22137451171875, -1.185089111328125, -1.1488037109375, -1.112518310546875, -1.07623291015625, -1.039947509765625, -1.003662109375, -0.967376708984375, -0.93109130859375, -0.894805908203125, -0.8585205078125, -0.822235107421875, -0.78594970703125, -0.749664306640625, -0.71337890625, -0.677093505859375, -0.64080810546875, -0.604522705078125, -0.5682373046875, -0.531951904296875, -0.49566650390625, -0.459381103515625, -0.423095703125, -0.386810302734375, -0.35052490234375, -0.314239501953125, -0.2779541015625, -0.241668701171875, -0.20538330078125, -0.169097900390625, -0.1328125, -0.096527099609375, -0.06024169921875, -0.023956298828125, 0.0123291015625, 0.048614501953125, 0.08489990234375, 0.121185302734375, 0.157470703125, 0.193756103515625, 0.23004150390625, 0.266326904296875, 0.3026123046875, 0.338897705078125, 0.37518310546875, 0.411468505859375, 0.44775390625, 0.484039306640625, 0.52032470703125, 0.556610107421875, 0.5928955078125, 0.629180908203125, 0.66546630859375, 0.701751708984375, 0.738037109375, 0.774322509765625, 0.81060791015625, 0.846893310546875, 0.8831787109375, 0.919464111328125, 0.95574951171875, 0.992034912109375, 1.0283203125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 12.0, 31.0, 41.0, 125.0, 268.0, 888.0, 4617.0, 88829.0, 4012001.0, 81729.0, 4443.0, 848.0, 266.0, 97.0, 40.0, 22.0, 12.0, 9.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.71875, -29.00244140625, -28.2861328125, -27.56982421875, -26.853515625, -26.13720703125, -25.4208984375, -24.70458984375, -23.98828125, -23.27197265625, -22.5556640625, -21.83935546875, -21.123046875, -20.40673828125, -19.6904296875, -18.97412109375, -18.2578125, -17.54150390625, -16.8251953125, -16.10888671875, -15.392578125, -14.67626953125, -13.9599609375, -13.24365234375, -12.52734375, -11.81103515625, -11.0947265625, -10.37841796875, -9.662109375, -8.94580078125, -8.2294921875, -7.51318359375, -6.796875, -6.08056640625, -5.3642578125, -4.64794921875, -3.931640625, -3.21533203125, -2.4990234375, -1.78271484375, -1.06640625, -0.35009765625, 0.3662109375, 1.08251953125, 1.798828125, 2.51513671875, 3.2314453125, 3.94775390625, 4.6640625, 5.38037109375, 6.0966796875, 6.81298828125, 7.529296875, 8.24560546875, 8.9619140625, 9.67822265625, 10.39453125, 11.11083984375, 11.8271484375, 12.54345703125, 13.259765625, 13.97607421875, 14.6923828125, 15.40869140625, 16.125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 8.0, 7.0, 12.0, 17.0, 27.0, 52.0, 104.0, 197.0, 553.0, 2067.0, 580.0, 211.0, 101.0, 52.0, 33.0, 16.0, 10.0, 11.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.625, -6.465484619140625, -6.30596923828125, -6.146453857421875, -5.9869384765625, -5.827423095703125, -5.66790771484375, -5.508392333984375, -5.348876953125, -5.189361572265625, -5.02984619140625, -4.870330810546875, -4.7108154296875, -4.551300048828125, -4.39178466796875, -4.232269287109375, -4.07275390625, -3.913238525390625, -3.75372314453125, -3.594207763671875, -3.4346923828125, -3.275177001953125, -3.11566162109375, -2.956146240234375, -2.796630859375, -2.637115478515625, -2.47760009765625, -2.318084716796875, -2.1585693359375, -1.999053955078125, -1.83953857421875, -1.680023193359375, -1.5205078125, -1.360992431640625, -1.20147705078125, -1.041961669921875, -0.8824462890625, -0.722930908203125, -0.56341552734375, -0.403900146484375, -0.244384765625, -0.084869384765625, 0.07464599609375, 0.234161376953125, 0.3936767578125, 0.553192138671875, 0.71270751953125, 0.872222900390625, 1.03173828125, 1.191253662109375, 1.35076904296875, 1.510284423828125, 1.6697998046875, 1.829315185546875, 1.98883056640625, 2.148345947265625, 2.307861328125, 2.467376708984375, 2.62689208984375, 2.786407470703125, 2.9459228515625, 3.105438232421875, 3.26495361328125, 3.424468994140625, 3.583984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 10.0, 14.0, 51.0, 100.0, 228.0, 299.0, 191.0, 85.0, 23.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-74.54891967773438, -73.04124450683594, -71.53357696533203, -70.0259017944336, -68.51822662353516, -67.01055908203125, -65.50288391113281, -63.995208740234375, -62.4875373840332, -60.97986602783203, -59.472190856933594, -57.96451950073242, -56.45684814453125, -54.94917297363281, -53.44150161743164, -51.93383026123047, -50.42615509033203, -48.91848373413086, -47.41080856323242, -45.90313720703125, -44.39546203613281, -42.88779067993164, -41.38011932373047, -39.87244415283203, -38.36477279663086, -36.85710144042969, -35.34942626953125, -33.84175491333008, -32.334083557128906, -30.82640838623047, -29.318737030029297, -27.811063766479492, -26.303388595581055, -24.79571533203125, -23.288043975830078, -21.780370712280273, -20.27269744873047, -18.765024185180664, -17.25735092163086, -15.749679565429688, -14.242006301879883, -12.734333038330078, -11.22666072845459, -9.718988418579102, -8.211315155029297, -6.70364236831665, -5.195969581604004, -3.6882972717285156, -2.180624008178711, -0.6729512214660645, 0.834721565246582, 2.3423943519592285, 3.850067138671875, 5.3577399253845215, 6.865412712097168, 8.373085021972656, 9.880758285522461, 11.388431549072266, 12.896103858947754, 14.403776168823242, 15.911449432373047, 17.41912269592285, 18.926795959472656, 20.434467315673828, 21.942140579223633]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 7.0, 3.0, 8.0, 9.0, 8.0, 13.0, 9.0, 12.0, 13.0, 17.0, 15.0, 27.0, 28.0, 24.0, 36.0, 45.0, 34.0, 34.0, 50.0, 40.0, 46.0, 40.0, 51.0, 32.0, 40.0, 32.0, 37.0, 38.0, 35.0, 27.0, 27.0, 25.0, 34.0, 19.0, 21.0, 12.0, 9.0, 9.0, 7.0, 12.0, 4.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0], "bins": [-13.534879684448242, -13.160469055175781, -12.786059379577637, -12.411648750305176, -12.037239074707031, -11.66282844543457, -11.288418769836426, -10.914008140563965, -10.53959846496582, -10.16518783569336, -9.790778160095215, -9.416367530822754, -9.04195785522461, -8.667547225952148, -8.293137550354004, -7.918726921081543, -7.54431676864624, -7.1699066162109375, -6.795496463775635, -6.421086311340332, -6.046676158905029, -5.672266006469727, -5.297855377197266, -4.923445701599121, -4.54903507232666, -4.174624919891357, -3.8002147674560547, -3.425804615020752, -3.051394462585449, -2.6769843101501465, -2.3025739192962646, -1.928163766860962, -1.5537538528442383, -1.1793437004089355, -0.804933488368988, -0.4305232763290405, -0.05611312389373779, 0.31829702854156494, 0.6927073001861572, 1.06711745262146, 1.4415276050567627, 1.8159377574920654, 2.190347909927368, 2.56475830078125, 2.9391684532165527, 3.3135786056518555, 3.687988758087158, 4.062398910522461, 4.436809062957764, 4.811219215393066, 5.185629367828369, 5.560039520263672, 5.934449672698975, 6.308859825134277, 6.683270454406738, 7.057680130004883, 7.432090759277344, 7.8065009117126465, 8.18091106414795, 8.55532169342041, 8.929731369018555, 9.304141998291016, 9.67855167388916, 10.052962303161621, 10.427371978759766]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 15.0, 13.0, 17.0, 31.0, 41.0, 70.0, 84.0, 169.0, 226.0, 459.0, 922.0, 1757.0, 3930.0, 9064.0, 22341.0, 54310.0, 127743.0, 303071.0, 303368.0, 127761.0, 54100.0, 22414.0, 8982.0, 3779.0, 1844.0, 853.0, 439.0, 256.0, 152.0, 99.0, 83.0, 37.0, 36.0, 25.0, 12.0, 12.0, 4.0, 10.0, 3.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.68359375, -4.5274658203125, -4.371337890625, -4.2152099609375, -4.05908203125, -3.9029541015625, -3.746826171875, -3.5906982421875, -3.4345703125, -3.2784423828125, -3.122314453125, -2.9661865234375, -2.81005859375, -2.6539306640625, -2.497802734375, -2.3416748046875, -2.185546875, -2.0294189453125, -1.873291015625, -1.7171630859375, -1.56103515625, -1.4049072265625, -1.248779296875, -1.0926513671875, -0.9365234375, -0.7803955078125, -0.624267578125, -0.4681396484375, -0.31201171875, -0.1558837890625, 0.000244140625, 0.1563720703125, 0.3125, 0.4686279296875, 0.624755859375, 0.7808837890625, 0.93701171875, 1.0931396484375, 1.249267578125, 1.4053955078125, 1.5615234375, 1.7176513671875, 1.873779296875, 2.0299072265625, 2.18603515625, 2.3421630859375, 2.498291015625, 2.6544189453125, 2.810546875, 2.9666748046875, 3.122802734375, 3.2789306640625, 3.43505859375, 3.5911865234375, 3.747314453125, 3.9034423828125, 4.0595703125, 4.2156982421875, 4.371826171875, 4.5279541015625, 4.68408203125, 4.8402099609375, 4.996337890625, 5.1524658203125, 5.30859375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 9.0, 8.0, 7.0, 7.0, 17.0, 15.0, 16.0, 16.0, 21.0, 22.0, 29.0, 31.0, 29.0, 24.0, 35.0, 42.0, 30.0, 45.0, 35.0, 47.0, 39.0, 55.0, 44.0, 31.0, 33.0, 39.0, 31.0, 30.0, 29.0, 21.0, 23.0, 26.0, 14.0, 16.0, 9.0, 13.0, 16.0, 8.0, 5.0, 5.0, 3.0, 4.0, 6.0, 2.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1953125, -1.1579742431640625, -1.120635986328125, -1.0832977294921875, -1.04595947265625, -1.0086212158203125, -0.971282958984375, -0.9339447021484375, -0.8966064453125, -0.8592681884765625, -0.821929931640625, -0.7845916748046875, -0.74725341796875, -0.7099151611328125, -0.672576904296875, -0.6352386474609375, -0.597900390625, -0.5605621337890625, -0.523223876953125, -0.4858856201171875, -0.44854736328125, -0.4112091064453125, -0.373870849609375, -0.3365325927734375, -0.2991943359375, -0.2618560791015625, -0.224517822265625, -0.1871795654296875, -0.14984130859375, -0.1125030517578125, -0.075164794921875, -0.0378265380859375, -0.00048828125, 0.0368499755859375, 0.074188232421875, 0.1115264892578125, 0.14886474609375, 0.1862030029296875, 0.223541259765625, 0.2608795166015625, 0.2982177734375, 0.3355560302734375, 0.372894287109375, 0.4102325439453125, 0.44757080078125, 0.4849090576171875, 0.522247314453125, 0.5595855712890625, 0.596923828125, 0.6342620849609375, 0.671600341796875, 0.7089385986328125, 0.74627685546875, 0.7836151123046875, 0.820953369140625, 0.8582916259765625, 0.8956298828125, 0.9329681396484375, 0.970306396484375, 1.0076446533203125, 1.04498291015625, 1.0823211669921875, 1.119659423828125, 1.1569976806640625, 1.1943359375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 10.0, 9.0, 17.0, 28.0, 25.0, 40.0, 53.0, 91.0, 148.0, 181.0, 343.0, 515.0, 873.0, 1782.0, 6443.0, 50094.0, 540668.0, 399702.0, 38255.0, 5348.0, 1668.0, 799.0, 489.0, 299.0, 205.0, 147.0, 100.0, 66.0, 44.0, 32.0, 20.0, 18.0, 14.0, 9.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.5, -12.1317138671875, -11.763427734375, -11.3951416015625, -11.02685546875, -10.6585693359375, -10.290283203125, -9.9219970703125, -9.5537109375, -9.1854248046875, -8.817138671875, -8.4488525390625, -8.08056640625, -7.7122802734375, -7.343994140625, -6.9757080078125, -6.607421875, -6.2391357421875, -5.870849609375, -5.5025634765625, -5.13427734375, -4.7659912109375, -4.397705078125, -4.0294189453125, -3.6611328125, -3.2928466796875, -2.924560546875, -2.5562744140625, -2.18798828125, -1.8197021484375, -1.451416015625, -1.0831298828125, -0.71484375, -0.3465576171875, 0.021728515625, 0.3900146484375, 0.75830078125, 1.1265869140625, 1.494873046875, 1.8631591796875, 2.2314453125, 2.5997314453125, 2.968017578125, 3.3363037109375, 3.70458984375, 4.0728759765625, 4.441162109375, 4.8094482421875, 5.177734375, 5.5460205078125, 5.914306640625, 6.2825927734375, 6.65087890625, 7.0191650390625, 7.387451171875, 7.7557373046875, 8.1240234375, 8.4923095703125, 8.860595703125, 9.2288818359375, 9.59716796875, 9.9654541015625, 10.333740234375, 10.7020263671875, 11.0703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 6.0, 10.0, 10.0, 25.0, 22.0, 34.0, 42.0, 31.0, 41.0, 41.0, 43.0, 56.0, 51.0, 54.0, 57.0, 65.0, 63.0, 48.0, 48.0, 40.0, 44.0, 29.0, 20.0, 23.0, 14.0, 12.0, 8.0, 22.0, 6.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.3515625, -9.0740966796875, -8.796630859375, -8.5191650390625, -8.24169921875, -7.9642333984375, -7.686767578125, -7.4093017578125, -7.1318359375, -6.8543701171875, -6.576904296875, -6.2994384765625, -6.02197265625, -5.7445068359375, -5.467041015625, -5.1895751953125, -4.912109375, -4.6346435546875, -4.357177734375, -4.0797119140625, -3.80224609375, -3.5247802734375, -3.247314453125, -2.9698486328125, -2.6923828125, -2.4149169921875, -2.137451171875, -1.8599853515625, -1.58251953125, -1.3050537109375, -1.027587890625, -0.7501220703125, -0.47265625, -0.1951904296875, 0.082275390625, 0.3597412109375, 0.63720703125, 0.9146728515625, 1.192138671875, 1.4696044921875, 1.7470703125, 2.0245361328125, 2.302001953125, 2.5794677734375, 2.85693359375, 3.1343994140625, 3.411865234375, 3.6893310546875, 3.966796875, 4.2442626953125, 4.521728515625, 4.7991943359375, 5.07666015625, 5.3541259765625, 5.631591796875, 5.9090576171875, 6.1865234375, 6.4639892578125, 6.741455078125, 7.0189208984375, 7.29638671875, 7.5738525390625, 7.851318359375, 8.1287841796875, 8.40625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 6.0, 11.0, 10.0, 25.0, 25.0, 37.0, 50.0, 63.0, 136.0, 261.0, 632.0, 1777.0, 6822.0, 40241.0, 388071.0, 549380.0, 49481.0, 8127.0, 2029.0, 656.0, 309.0, 145.0, 84.0, 55.0, 30.0, 24.0, 12.0, 10.0, 9.0, 5.0, 5.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.69140625, -6.48895263671875, -6.2864990234375, -6.08404541015625, -5.881591796875, -5.67913818359375, -5.4766845703125, -5.27423095703125, -5.07177734375, -4.86932373046875, -4.6668701171875, -4.46441650390625, -4.261962890625, -4.05950927734375, -3.8570556640625, -3.65460205078125, -3.4521484375, -3.24969482421875, -3.0472412109375, -2.84478759765625, -2.642333984375, -2.43988037109375, -2.2374267578125, -2.03497314453125, -1.83251953125, -1.63006591796875, -1.4276123046875, -1.22515869140625, -1.022705078125, -0.82025146484375, -0.6177978515625, -0.41534423828125, -0.212890625, -0.01043701171875, 0.1920166015625, 0.39447021484375, 0.596923828125, 0.79937744140625, 1.0018310546875, 1.20428466796875, 1.40673828125, 1.60919189453125, 1.8116455078125, 2.01409912109375, 2.216552734375, 2.41900634765625, 2.6214599609375, 2.82391357421875, 3.0263671875, 3.22882080078125, 3.4312744140625, 3.63372802734375, 3.836181640625, 4.03863525390625, 4.2410888671875, 4.44354248046875, 4.64599609375, 4.84844970703125, 5.0509033203125, 5.25335693359375, 5.455810546875, 5.65826416015625, 5.8607177734375, 6.06317138671875, 6.265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 2.0, 5.0, 2.0, 8.0, 12.0, 15.0, 16.0, 13.0, 11.0, 30.0, 35.0, 37.0, 29.0, 46.0, 67.0, 137.0, 172.0, 64.0, 62.0, 41.0, 37.0, 25.0, 29.0, 21.0, 22.0, 9.0, 16.0, 8.0, 7.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006933212280273438, -0.0006695389747619629, -0.000645756721496582, -0.0006219744682312012, -0.0005981922149658203, -0.0005744099617004395, -0.0005506277084350586, -0.0005268454551696777, -0.0005030632019042969, -0.000479280948638916, -0.00045549869537353516, -0.0004317164421081543, -0.00040793418884277344, -0.0003841519355773926, -0.0003603696823120117, -0.00033658742904663086, -0.00031280517578125, -0.00028902292251586914, -0.0002652406692504883, -0.00024145841598510742, -0.00021767616271972656, -0.0001938939094543457, -0.00017011165618896484, -0.00014632940292358398, -0.00012254714965820312, -9.876489639282227e-05, -7.49826431274414e-05, -5.120038986206055e-05, -2.7418136596679688e-05, -3.635883331298828e-06, 2.014636993408203e-05, 4.392862319946289e-05, 6.771087646484375e-05, 9.149312973022461e-05, 0.00011527538299560547, 0.00013905763626098633, 0.0001628398895263672, 0.00018662214279174805, 0.0002104043960571289, 0.00023418664932250977, 0.0002579689025878906, 0.0002817511558532715, 0.00030553340911865234, 0.0003293156623840332, 0.00035309791564941406, 0.0003768801689147949, 0.0004006624221801758, 0.00042444467544555664, 0.0004482269287109375, 0.00047200918197631836, 0.0004957914352416992, 0.0005195736885070801, 0.0005433559417724609, 0.0005671381950378418, 0.0005909204483032227, 0.0006147027015686035, 0.0006384849548339844, 0.0006622672080993652, 0.0006860494613647461, 0.000709831714630127, 0.0007336139678955078, 0.0007573962211608887, 0.0007811784744262695, 0.0008049607276916504, 0.0008287429809570312]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 5.0, 6.0, 21.0, 38.0, 62.0, 100.0, 179.0, 401.0, 1229.0, 8889.0, 415103.0, 609139.0, 11009.0, 1423.0, 489.0, 204.0, 109.0, 63.0, 41.0, 20.0, 9.0, 3.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8125, -14.41259765625, -14.0126953125, -13.61279296875, -13.212890625, -12.81298828125, -12.4130859375, -12.01318359375, -11.61328125, -11.21337890625, -10.8134765625, -10.41357421875, -10.013671875, -9.61376953125, -9.2138671875, -8.81396484375, -8.4140625, -8.01416015625, -7.6142578125, -7.21435546875, -6.814453125, -6.41455078125, -6.0146484375, -5.61474609375, -5.21484375, -4.81494140625, -4.4150390625, -4.01513671875, -3.615234375, -3.21533203125, -2.8154296875, -2.41552734375, -2.015625, -1.61572265625, -1.2158203125, -0.81591796875, -0.416015625, -0.01611328125, 0.3837890625, 0.78369140625, 1.18359375, 1.58349609375, 1.9833984375, 2.38330078125, 2.783203125, 3.18310546875, 3.5830078125, 3.98291015625, 4.3828125, 4.78271484375, 5.1826171875, 5.58251953125, 5.982421875, 6.38232421875, 6.7822265625, 7.18212890625, 7.58203125, 7.98193359375, 8.3818359375, 8.78173828125, 9.181640625, 9.58154296875, 9.9814453125, 10.38134765625, 10.78125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 10.0, 11.0, 12.0, 16.0, 23.0, 29.0, 33.0, 65.0, 89.0, 123.0, 134.0, 125.0, 90.0, 72.0, 42.0, 34.0, 27.0, 22.0, 15.0, 11.0, 10.0, 5.0, 2.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.265625, -6.08935546875, -5.9130859375, -5.73681640625, -5.560546875, -5.38427734375, -5.2080078125, -5.03173828125, -4.85546875, -4.67919921875, -4.5029296875, -4.32666015625, -4.150390625, -3.97412109375, -3.7978515625, -3.62158203125, -3.4453125, -3.26904296875, -3.0927734375, -2.91650390625, -2.740234375, -2.56396484375, -2.3876953125, -2.21142578125, -2.03515625, -1.85888671875, -1.6826171875, -1.50634765625, -1.330078125, -1.15380859375, -0.9775390625, -0.80126953125, -0.625, -0.44873046875, -0.2724609375, -0.09619140625, 0.080078125, 0.25634765625, 0.4326171875, 0.60888671875, 0.78515625, 0.96142578125, 1.1376953125, 1.31396484375, 1.490234375, 1.66650390625, 1.8427734375, 2.01904296875, 2.1953125, 2.37158203125, 2.5478515625, 2.72412109375, 2.900390625, 3.07666015625, 3.2529296875, 3.42919921875, 3.60546875, 3.78173828125, 3.9580078125, 4.13427734375, 4.310546875, 4.48681640625, 4.6630859375, 4.83935546875, 5.015625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 10.0, 24.0, 92.0, 239.0, 311.0, 206.0, 86.0, 24.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-174.21240234375, -169.92276000976562, -165.63311767578125, -161.34347534179688, -157.0538330078125, -152.76419067382812, -148.47454833984375, -144.18490600585938, -139.895263671875, -135.60562133789062, -131.31597900390625, -127.02633666992188, -122.7366943359375, -118.44705200195312, -114.15741729736328, -109.8677749633789, -105.57814025878906, -101.28849792480469, -96.99885559082031, -92.70921325683594, -88.41957092285156, -84.12992858886719, -79.84029388427734, -75.55065155029297, -71.2610092163086, -66.97136688232422, -62.681724548339844, -58.392086029052734, -54.10244369506836, -49.812801361083984, -45.523162841796875, -41.2335205078125, -36.943885803222656, -32.65424346923828, -28.36460304260254, -24.074962615966797, -19.785320281982422, -15.495677947998047, -11.206037521362305, -6.9163970947265625, -2.6267547607421875, 1.662886619567871, 5.95252799987793, 10.242169380187988, 14.531810760498047, 18.821453094482422, 23.111093521118164, 27.400733947753906, 31.69037628173828, 35.980018615722656, 40.26966094970703, 44.55929946899414, 48.848941802978516, 53.13858413696289, 57.42822265625, 61.717864990234375, 66.00750732421875, 70.29714965820312, 74.5867919921875, 78.87643432617188, 83.16607666015625, 87.45571899414062, 91.74535369873047, 96.03499603271484, 100.32463836669922]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 9.0, 5.0, 12.0, 17.0, 15.0, 15.0, 17.0, 30.0, 30.0, 27.0, 31.0, 34.0, 33.0, 45.0, 35.0, 27.0, 38.0, 49.0, 36.0, 57.0, 41.0, 42.0, 32.0, 35.0, 38.0, 35.0, 22.0, 25.0, 21.0, 17.0, 17.0, 18.0, 12.0, 12.0, 8.0, 10.0, 9.0, 7.0, 6.0, 6.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-37.81949996948242, -36.68879318237305, -35.55809020996094, -34.42738342285156, -33.29668045043945, -32.16597366333008, -31.035268783569336, -29.904563903808594, -28.77385902404785, -27.64315414428711, -26.512449264526367, -25.381744384765625, -24.25103759765625, -23.12033462524414, -21.989627838134766, -20.858922958374023, -19.72821807861328, -18.59751319885254, -17.466808319091797, -16.336103439331055, -15.205397605895996, -14.074692726135254, -12.943986892700195, -11.813282012939453, -10.682577133178711, -9.551872253417969, -8.421167373657227, -7.290461540222168, -6.159756660461426, -5.029051780700684, -3.898346424102783, -2.767641067504883, -1.636932373046875, -0.5062272548675537, 0.6244778633117676, 1.7551829814910889, 2.88588809967041, 4.016592979431152, 5.147298336029053, 6.278003692626953, 7.408708572387695, 8.539413452148438, 9.67011833190918, 10.800824165344238, 11.93152904510498, 13.062233924865723, 14.192939758300781, 15.323644638061523, 16.454349517822266, 17.585054397583008, 18.71575927734375, 19.846464157104492, 20.977169036865234, 22.10787582397461, 23.23858070373535, 24.369285583496094, 25.499990463256836, 26.630695343017578, 27.76140022277832, 28.892105102539062, 30.022811889648438, 31.153514862060547, 32.28422164916992, 33.41492462158203, 34.545631408691406]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 11.0, 8.0, 7.0, 14.0, 21.0, 44.0, 79.0, 123.0, 231.0, 462.0, 1061.0, 2809.0, 8601.0, 33858.0, 219112.0, 3494681.0, 369398.0, 46471.0, 11324.0, 3638.0, 1253.0, 574.0, 226.0, 126.0, 64.0, 36.0, 19.0, 11.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.046875, -10.76068115234375, -10.4744873046875, -10.18829345703125, -9.902099609375, -9.61590576171875, -9.3297119140625, -9.04351806640625, -8.75732421875, -8.47113037109375, -8.1849365234375, -7.89874267578125, -7.612548828125, -7.32635498046875, -7.0401611328125, -6.75396728515625, -6.4677734375, -6.18157958984375, -5.8953857421875, -5.60919189453125, -5.322998046875, -5.03680419921875, -4.7506103515625, -4.46441650390625, -4.17822265625, -3.89202880859375, -3.6058349609375, -3.31964111328125, -3.033447265625, -2.74725341796875, -2.4610595703125, -2.17486572265625, -1.888671875, -1.60247802734375, -1.3162841796875, -1.03009033203125, -0.743896484375, -0.45770263671875, -0.1715087890625, 0.11468505859375, 0.40087890625, 0.68707275390625, 0.9732666015625, 1.25946044921875, 1.545654296875, 1.83184814453125, 2.1180419921875, 2.40423583984375, 2.6904296875, 2.97662353515625, 3.2628173828125, 3.54901123046875, 3.835205078125, 4.12139892578125, 4.4075927734375, 4.69378662109375, 4.97998046875, 5.26617431640625, 5.5523681640625, 5.83856201171875, 6.124755859375, 6.41094970703125, 6.6971435546875, 6.98333740234375, 7.26953125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 3.0, 10.0, 7.0, 12.0, 11.0, 6.0, 22.0, 16.0, 13.0, 21.0, 33.0, 19.0, 43.0, 22.0, 36.0, 47.0, 27.0, 39.0, 43.0, 45.0, 41.0, 34.0, 37.0, 31.0, 40.0, 39.0, 40.0, 31.0, 34.0, 29.0, 19.0, 29.0, 13.0, 24.0, 17.0, 8.0, 9.0, 15.0, 3.0, 5.0, 3.0, 6.0, 3.0, 7.0, 3.0, 3.0, 0.0, 2.0], "bins": [-1.5390625, -1.49676513671875, -1.4544677734375, -1.41217041015625, -1.369873046875, -1.32757568359375, -1.2852783203125, -1.24298095703125, -1.20068359375, -1.15838623046875, -1.1160888671875, -1.07379150390625, -1.031494140625, -0.98919677734375, -0.9468994140625, -0.90460205078125, -0.8623046875, -0.82000732421875, -0.7777099609375, -0.73541259765625, -0.693115234375, -0.65081787109375, -0.6085205078125, -0.56622314453125, -0.52392578125, -0.48162841796875, -0.4393310546875, -0.39703369140625, -0.354736328125, -0.31243896484375, -0.2701416015625, -0.22784423828125, -0.185546875, -0.14324951171875, -0.1009521484375, -0.05865478515625, -0.016357421875, 0.02593994140625, 0.0682373046875, 0.11053466796875, 0.15283203125, 0.19512939453125, 0.2374267578125, 0.27972412109375, 0.322021484375, 0.36431884765625, 0.4066162109375, 0.44891357421875, 0.4912109375, 0.53350830078125, 0.5758056640625, 0.61810302734375, 0.660400390625, 0.70269775390625, 0.7449951171875, 0.78729248046875, 0.82958984375, 0.87188720703125, 0.9141845703125, 0.95648193359375, 0.998779296875, 1.04107666015625, 1.0833740234375, 1.12567138671875, 1.16796875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 13.0, 25.0, 65.0, 138.0, 340.0, 806.0, 2679.0, 13552.0, 166709.0, 3781924.0, 208150.0, 15464.0, 2999.0, 850.0, 318.0, 120.0, 59.0, 19.0, 14.0, 7.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8828125, -13.4127197265625, -12.942626953125, -12.4725341796875, -12.00244140625, -11.5323486328125, -11.062255859375, -10.5921630859375, -10.1220703125, -9.6519775390625, -9.181884765625, -8.7117919921875, -8.24169921875, -7.7716064453125, -7.301513671875, -6.8314208984375, -6.361328125, -5.8912353515625, -5.421142578125, -4.9510498046875, -4.48095703125, -4.0108642578125, -3.540771484375, -3.0706787109375, -2.6005859375, -2.1304931640625, -1.660400390625, -1.1903076171875, -0.72021484375, -0.2501220703125, 0.219970703125, 0.6900634765625, 1.16015625, 1.6302490234375, 2.100341796875, 2.5704345703125, 3.04052734375, 3.5106201171875, 3.980712890625, 4.4508056640625, 4.9208984375, 5.3909912109375, 5.861083984375, 6.3311767578125, 6.80126953125, 7.2713623046875, 7.741455078125, 8.2115478515625, 8.681640625, 9.1517333984375, 9.621826171875, 10.0919189453125, 10.56201171875, 11.0321044921875, 11.502197265625, 11.9722900390625, 12.4423828125, 12.9124755859375, 13.382568359375, 13.8526611328125, 14.32275390625, 14.7928466796875, 15.262939453125, 15.7330322265625, 16.203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 6.0, 8.0, 18.0, 12.0, 12.0, 35.0, 40.0, 59.0, 131.0, 225.0, 459.0, 1242.0, 891.0, 393.0, 209.0, 94.0, 70.0, 49.0, 32.0, 16.0, 11.0, 15.0, 10.0, 7.0, 3.0, 4.0, 7.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.86505126953125, -3.7261962890625, -3.58734130859375, -3.448486328125, -3.30963134765625, -3.1707763671875, -3.03192138671875, -2.89306640625, -2.75421142578125, -2.6153564453125, -2.47650146484375, -2.337646484375, -2.19879150390625, -2.0599365234375, -1.92108154296875, -1.7822265625, -1.64337158203125, -1.5045166015625, -1.36566162109375, -1.226806640625, -1.08795166015625, -0.9490966796875, -0.81024169921875, -0.67138671875, -0.53253173828125, -0.3936767578125, -0.25482177734375, -0.115966796875, 0.02288818359375, 0.1617431640625, 0.30059814453125, 0.439453125, 0.57830810546875, 0.7171630859375, 0.85601806640625, 0.994873046875, 1.13372802734375, 1.2725830078125, 1.41143798828125, 1.55029296875, 1.68914794921875, 1.8280029296875, 1.96685791015625, 2.105712890625, 2.24456787109375, 2.3834228515625, 2.52227783203125, 2.6611328125, 2.79998779296875, 2.9388427734375, 3.07769775390625, 3.216552734375, 3.35540771484375, 3.4942626953125, 3.63311767578125, 3.77197265625, 3.91082763671875, 4.0496826171875, 4.18853759765625, 4.327392578125, 4.46624755859375, 4.6051025390625, 4.74395751953125, 4.8828125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 20.0, 51.0, 145.0, 230.0, 248.0, 169.0, 77.0, 29.0, 14.0, 9.0, 7.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.6103515625, -20.863819122314453, -19.11728858947754, -17.370756149291992, -15.624224662780762, -13.877693176269531, -12.131160736083984, -10.384629249572754, -8.638097763061523, -6.891566276550293, -5.145034313201904, -3.3985023498535156, -1.6519708633422852, 0.09456062316894531, 1.8410930633544922, 3.5876245498657227, 5.334156036376953, 7.080687522888184, 8.827219009399414, 10.573751449584961, 12.320282936096191, 14.066814422607422, 15.813346862792969, 17.559879302978516, 19.30640983581543, 21.052942276000977, 22.79947280883789, 24.546005249023438, 26.292537689208984, 28.0390682220459, 29.785600662231445, 31.53213119506836, 33.278663635253906, 35.02519607543945, 36.771728515625, 38.51825714111328, 40.26478958129883, 42.011322021484375, 43.75785446166992, 45.50438690185547, 47.25091552734375, 48.9974479675293, 50.743980407714844, 52.490509033203125, 54.23704147338867, 55.98357391357422, 57.730106353759766, 59.47663879394531, 61.22317123413086, 62.969703674316406, 64.71623229980469, 66.4627685546875, 68.20929718017578, 69.95582580566406, 71.70236206054688, 73.44889068603516, 75.19542694091797, 76.94195556640625, 78.68849182128906, 80.43502044677734, 82.18155670166016, 83.92808532714844, 85.67462158203125, 87.42115020751953, 89.16767883300781]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 3.0, 9.0, 7.0, 5.0, 12.0, 7.0, 13.0, 13.0, 22.0, 16.0, 23.0, 25.0, 26.0, 24.0, 23.0, 33.0, 30.0, 36.0, 38.0, 44.0, 32.0, 38.0, 40.0, 39.0, 29.0, 38.0, 28.0, 45.0, 44.0, 32.0, 34.0, 28.0, 19.0, 19.0, 16.0, 16.0, 15.0, 20.0, 17.0, 12.0, 7.0, 3.0, 7.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0], "bins": [-16.00847053527832, -15.56777572631836, -15.127079963684082, -14.686385154724121, -14.24569034576416, -13.804994583129883, -13.364299774169922, -12.923604965209961, -12.48291015625, -12.042215347290039, -11.601519584655762, -11.1608247756958, -10.72012996673584, -10.279434204101562, -9.838739395141602, -9.39804458618164, -8.957348823547363, -8.516654014587402, -8.075958251953125, -7.635263442993164, -7.194568634033203, -6.753873348236084, -6.313178062438965, -5.872483253479004, -5.431787967681885, -4.991092681884766, -4.550397872924805, -4.1097025871276855, -3.6690075397491455, -3.2283124923706055, -2.7876172065734863, -2.3469221591949463, -1.9062261581420898, -1.4655311107635498, -1.0248359441757202, -0.5841407775878906, -0.14344573020935059, 0.29724931716918945, 0.7379446029663086, 1.1786396503448486, 1.6193346977233887, 2.0600297451019287, 2.5007247924804688, 2.941420078277588, 3.382115125656128, 3.822810173034668, 4.263505458831787, 4.704200744628906, 5.144895553588867, 5.585590839385986, 6.026285648345947, 6.466980934143066, 6.907675743103027, 7.3483710289001465, 7.789066314697266, 8.229761123657227, 8.670455932617188, 9.111150741577148, 9.551846504211426, 9.992541313171387, 10.433236122131348, 10.873931884765625, 11.314626693725586, 11.755321502685547, 12.196017265319824]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 4.0, 6.0, 7.0, 23.0, 23.0, 36.0, 102.0, 159.0, 263.0, 558.0, 1375.0, 4011.0, 14065.0, 56135.0, 215546.0, 450016.0, 225764.0, 58601.0, 15104.0, 4128.0, 1429.0, 596.0, 266.0, 131.0, 84.0, 46.0, 25.0, 10.0, 16.0, 10.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4765625, -9.23675537109375, -8.9969482421875, -8.75714111328125, -8.517333984375, -8.27752685546875, -8.0377197265625, -7.79791259765625, -7.55810546875, -7.31829833984375, -7.0784912109375, -6.83868408203125, -6.598876953125, -6.35906982421875, -6.1192626953125, -5.87945556640625, -5.6396484375, -5.39984130859375, -5.1600341796875, -4.92022705078125, -4.680419921875, -4.44061279296875, -4.2008056640625, -3.96099853515625, -3.72119140625, -3.48138427734375, -3.2415771484375, -3.00177001953125, -2.761962890625, -2.52215576171875, -2.2823486328125, -2.04254150390625, -1.802734375, -1.56292724609375, -1.3231201171875, -1.08331298828125, -0.843505859375, -0.60369873046875, -0.3638916015625, -0.12408447265625, 0.11572265625, 0.35552978515625, 0.5953369140625, 0.83514404296875, 1.074951171875, 1.31475830078125, 1.5545654296875, 1.79437255859375, 2.0341796875, 2.27398681640625, 2.5137939453125, 2.75360107421875, 2.993408203125, 3.23321533203125, 3.4730224609375, 3.71282958984375, 3.95263671875, 4.19244384765625, 4.4322509765625, 4.67205810546875, 4.911865234375, 5.15167236328125, 5.3914794921875, 5.63128662109375, 5.87109375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 3.0, 6.0, 6.0, 8.0, 11.0, 8.0, 18.0, 8.0, 29.0, 27.0, 32.0, 36.0, 36.0, 37.0, 37.0, 40.0, 40.0, 51.0, 56.0, 44.0, 49.0, 42.0, 41.0, 42.0, 46.0, 38.0, 44.0, 28.0, 30.0, 19.0, 19.0, 16.0, 12.0, 9.0, 6.0, 5.0, 7.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9638671875, -1.906158447265625, -1.84844970703125, -1.790740966796875, -1.7330322265625, -1.675323486328125, -1.61761474609375, -1.559906005859375, -1.502197265625, -1.444488525390625, -1.38677978515625, -1.329071044921875, -1.2713623046875, -1.213653564453125, -1.15594482421875, -1.098236083984375, -1.04052734375, -0.982818603515625, -0.92510986328125, -0.867401123046875, -0.8096923828125, -0.751983642578125, -0.69427490234375, -0.636566162109375, -0.578857421875, -0.521148681640625, -0.46343994140625, -0.405731201171875, -0.3480224609375, -0.290313720703125, -0.23260498046875, -0.174896240234375, -0.1171875, -0.059478759765625, -0.00177001953125, 0.055938720703125, 0.1136474609375, 0.171356201171875, 0.22906494140625, 0.286773681640625, 0.344482421875, 0.402191162109375, 0.45989990234375, 0.517608642578125, 0.5753173828125, 0.633026123046875, 0.69073486328125, 0.748443603515625, 0.80615234375, 0.863861083984375, 0.92156982421875, 0.979278564453125, 1.0369873046875, 1.094696044921875, 1.15240478515625, 1.210113525390625, 1.267822265625, 1.325531005859375, 1.38323974609375, 1.440948486328125, 1.4986572265625, 1.556365966796875, 1.61407470703125, 1.671783447265625, 1.7294921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 5.0, 6.0, 11.0, 14.0, 25.0, 34.0, 34.0, 60.0, 80.0, 111.0, 211.0, 354.0, 613.0, 1242.0, 3735.0, 29766.0, 539051.0, 443295.0, 23853.0, 3357.0, 1183.0, 574.0, 336.0, 188.0, 128.0, 82.0, 64.0, 39.0, 28.0, 20.0, 9.0, 6.0, 5.0, 6.0, 6.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.61376953125, -16.0400390625, -15.46630859375, -14.892578125, -14.31884765625, -13.7451171875, -13.17138671875, -12.59765625, -12.02392578125, -11.4501953125, -10.87646484375, -10.302734375, -9.72900390625, -9.1552734375, -8.58154296875, -8.0078125, -7.43408203125, -6.8603515625, -6.28662109375, -5.712890625, -5.13916015625, -4.5654296875, -3.99169921875, -3.41796875, -2.84423828125, -2.2705078125, -1.69677734375, -1.123046875, -0.54931640625, 0.0244140625, 0.59814453125, 1.171875, 1.74560546875, 2.3193359375, 2.89306640625, 3.466796875, 4.04052734375, 4.6142578125, 5.18798828125, 5.76171875, 6.33544921875, 6.9091796875, 7.48291015625, 8.056640625, 8.63037109375, 9.2041015625, 9.77783203125, 10.3515625, 10.92529296875, 11.4990234375, 12.07275390625, 12.646484375, 13.22021484375, 13.7939453125, 14.36767578125, 14.94140625, 15.51513671875, 16.0888671875, 16.66259765625, 17.236328125, 17.81005859375, 18.3837890625, 18.95751953125, 19.53125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 3.0, 4.0, 8.0, 7.0, 9.0, 10.0, 8.0, 10.0, 23.0, 15.0, 24.0, 17.0, 32.0, 25.0, 21.0, 31.0, 39.0, 34.0, 30.0, 56.0, 39.0, 47.0, 39.0, 44.0, 29.0, 34.0, 44.0, 31.0, 38.0, 34.0, 34.0, 22.0, 17.0, 19.0, 17.0, 20.0, 21.0, 10.0, 12.0, 10.0, 7.0, 8.0, 5.0, 1.0, 10.0, 4.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.7578125, -9.4600830078125, -9.162353515625, -8.8646240234375, -8.56689453125, -8.2691650390625, -7.971435546875, -7.6737060546875, -7.3759765625, -7.0782470703125, -6.780517578125, -6.4827880859375, -6.18505859375, -5.8873291015625, -5.589599609375, -5.2918701171875, -4.994140625, -4.6964111328125, -4.398681640625, -4.1009521484375, -3.80322265625, -3.5054931640625, -3.207763671875, -2.9100341796875, -2.6123046875, -2.3145751953125, -2.016845703125, -1.7191162109375, -1.42138671875, -1.1236572265625, -0.825927734375, -0.5281982421875, -0.23046875, 0.0672607421875, 0.364990234375, 0.6627197265625, 0.96044921875, 1.2581787109375, 1.555908203125, 1.8536376953125, 2.1513671875, 2.4490966796875, 2.746826171875, 3.0445556640625, 3.34228515625, 3.6400146484375, 3.937744140625, 4.2354736328125, 4.533203125, 4.8309326171875, 5.128662109375, 5.4263916015625, 5.72412109375, 6.0218505859375, 6.319580078125, 6.6173095703125, 6.9150390625, 7.2127685546875, 7.510498046875, 7.8082275390625, 8.10595703125, 8.4036865234375, 8.701416015625, 8.9991455078125, 9.296875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 14.0, 14.0, 23.0, 26.0, 63.0, 92.0, 198.0, 428.0, 1538.0, 9497.0, 233438.0, 768077.0, 30826.0, 3019.0, 756.0, 253.0, 134.0, 60.0, 52.0, 11.0, 13.0, 10.0, 1.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0078125, -12.6761474609375, -12.344482421875, -12.0128173828125, -11.68115234375, -11.3494873046875, -11.017822265625, -10.6861572265625, -10.3544921875, -10.0228271484375, -9.691162109375, -9.3594970703125, -9.02783203125, -8.6961669921875, -8.364501953125, -8.0328369140625, -7.701171875, -7.3695068359375, -7.037841796875, -6.7061767578125, -6.37451171875, -6.0428466796875, -5.711181640625, -5.3795166015625, -5.0478515625, -4.7161865234375, -4.384521484375, -4.0528564453125, -3.72119140625, -3.3895263671875, -3.057861328125, -2.7261962890625, -2.39453125, -2.0628662109375, -1.731201171875, -1.3995361328125, -1.06787109375, -0.7362060546875, -0.404541015625, -0.0728759765625, 0.2587890625, 0.5904541015625, 0.922119140625, 1.2537841796875, 1.58544921875, 1.9171142578125, 2.248779296875, 2.5804443359375, 2.912109375, 3.2437744140625, 3.575439453125, 3.9071044921875, 4.23876953125, 4.5704345703125, 4.902099609375, 5.2337646484375, 5.5654296875, 5.8970947265625, 6.228759765625, 6.5604248046875, 6.89208984375, 7.2237548828125, 7.555419921875, 7.8870849609375, 8.21875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 11.0, 7.0, 14.0, 37.0, 38.0, 79.0, 108.0, 137.0, 174.0, 134.0, 90.0, 79.0, 34.0, 22.0, 19.0, 7.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012607574462890625, -0.0012178122997283936, -0.0011748671531677246, -0.0011319220066070557, -0.0010889768600463867, -0.0010460317134857178, -0.0010030865669250488, -0.0009601414203643799, -0.0009171962738037109, -0.000874251127243042, -0.000831305980682373, -0.0007883608341217041, -0.0007454156875610352, -0.0007024705410003662, -0.0006595253944396973, -0.0006165802478790283, -0.0005736351013183594, -0.0005306899547576904, -0.0004877448081970215, -0.00044479966163635254, -0.0004018545150756836, -0.00035890936851501465, -0.0003159642219543457, -0.00027301907539367676, -0.0002300739288330078, -0.00018712878227233887, -0.00014418363571166992, -0.00010123848915100098, -5.829334259033203e-05, -1.5348196029663086e-05, 2.759695053100586e-05, 7.05420970916748e-05, 0.00011348724365234375, 0.0001564323902130127, 0.00019937753677368164, 0.00024232268333435059, 0.00028526782989501953, 0.0003282129764556885, 0.0003711581230163574, 0.00041410326957702637, 0.0004570484161376953, 0.0004999935626983643, 0.0005429387092590332, 0.0005858838558197021, 0.0006288290023803711, 0.00067177414894104, 0.000714719295501709, 0.0007576644420623779, 0.0008006095886230469, 0.0008435547351837158, 0.0008864998817443848, 0.0009294450283050537, 0.0009723901748657227, 0.0010153353214263916, 0.0010582804679870605, 0.0011012256145477295, 0.0011441707611083984, 0.0011871159076690674, 0.0012300610542297363, 0.0012730062007904053, 0.0013159513473510742, 0.0013588964939117432, 0.0014018416404724121, 0.001444786787033081, 0.00148773193359375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 8.0, 11.0, 8.0, 16.0, 28.0, 35.0, 66.0, 110.0, 153.0, 260.0, 448.0, 920.0, 2140.0, 5955.0, 29822.0, 341613.0, 593430.0, 59233.0, 9019.0, 2825.0, 1100.0, 558.0, 277.0, 182.0, 108.0, 79.0, 39.0, 30.0, 21.0, 18.0, 7.0, 7.0, 6.0, 3.0, 1.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2578125, -7.0452880859375, -6.832763671875, -6.6202392578125, -6.40771484375, -6.1951904296875, -5.982666015625, -5.7701416015625, -5.5576171875, -5.3450927734375, -5.132568359375, -4.9200439453125, -4.70751953125, -4.4949951171875, -4.282470703125, -4.0699462890625, -3.857421875, -3.6448974609375, -3.432373046875, -3.2198486328125, -3.00732421875, -2.7947998046875, -2.582275390625, -2.3697509765625, -2.1572265625, -1.9447021484375, -1.732177734375, -1.5196533203125, -1.30712890625, -1.0946044921875, -0.882080078125, -0.6695556640625, -0.45703125, -0.2445068359375, -0.031982421875, 0.1805419921875, 0.39306640625, 0.6055908203125, 0.818115234375, 1.0306396484375, 1.2431640625, 1.4556884765625, 1.668212890625, 1.8807373046875, 2.09326171875, 2.3057861328125, 2.518310546875, 2.7308349609375, 2.943359375, 3.1558837890625, 3.368408203125, 3.5809326171875, 3.79345703125, 4.0059814453125, 4.218505859375, 4.4310302734375, 4.6435546875, 4.8560791015625, 5.068603515625, 5.2811279296875, 5.49365234375, 5.7061767578125, 5.918701171875, 6.1312255859375, 6.34375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 12.0, 17.0, 27.0, 30.0, 56.0, 67.0, 76.0, 86.0, 123.0, 91.0, 85.0, 90.0, 66.0, 52.0, 41.0, 19.0, 17.0, 14.0, 7.0, 5.0, 8.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.53125, -8.336822509765625, -8.14239501953125, -7.947967529296875, -7.7535400390625, -7.559112548828125, -7.36468505859375, -7.170257568359375, -6.975830078125, -6.781402587890625, -6.58697509765625, -6.392547607421875, -6.1981201171875, -6.003692626953125, -5.80926513671875, -5.614837646484375, -5.42041015625, -5.225982666015625, -5.03155517578125, -4.837127685546875, -4.6427001953125, -4.448272705078125, -4.25384521484375, -4.059417724609375, -3.864990234375, -3.670562744140625, -3.47613525390625, -3.281707763671875, -3.0872802734375, -2.892852783203125, -2.69842529296875, -2.503997802734375, -2.3095703125, -2.115142822265625, -1.92071533203125, -1.726287841796875, -1.5318603515625, -1.337432861328125, -1.14300537109375, -0.948577880859375, -0.754150390625, -0.559722900390625, -0.36529541015625, -0.170867919921875, 0.0235595703125, 0.217987060546875, 0.41241455078125, 0.606842041015625, 0.80126953125, 0.995697021484375, 1.19012451171875, 1.384552001953125, 1.5789794921875, 1.773406982421875, 1.96783447265625, 2.162261962890625, 2.356689453125, 2.551116943359375, 2.74554443359375, 2.939971923828125, 3.1343994140625, 3.328826904296875, 3.52325439453125, 3.717681884765625, 3.912109375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 12.0, 25.0, 55.0, 89.0, 186.0, 224.0, 191.0, 123.0, 49.0, 28.0, 7.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-86.39786529541016, -83.01380920410156, -79.62975311279297, -76.24569702148438, -72.86164855957031, -69.47758483886719, -66.09353637695312, -62.70948028564453, -59.32542419433594, -55.941368103027344, -52.55731201171875, -49.17325973510742, -45.78920364379883, -42.405147552490234, -39.021095275878906, -35.63703918457031, -32.25298309326172, -28.868927001953125, -25.484872817993164, -22.100818634033203, -18.71676254272461, -15.332706451416016, -11.948652267456055, -8.564598083496094, -5.1805419921875, -1.7964868545532227, 1.5875682830810547, 4.971623420715332, 8.35567855834961, 11.739734649658203, 15.123788833618164, 18.507843017578125, 21.891891479492188, 25.27594757080078, 28.660001754760742, 32.0440559387207, 35.4281120300293, 38.81216812133789, 42.19622039794922, 45.58027648925781, 48.964332580566406, 52.348388671875, 55.732444763183594, 59.11649703979492, 62.500553131103516, 65.88461303710938, 69.26866149902344, 72.65271759033203, 76.03677368164062, 79.42082977294922, 82.80488586425781, 86.1889419555664, 89.572998046875, 92.95704650878906, 96.34110260009766, 99.72515869140625, 103.10921478271484, 106.49327087402344, 109.87732696533203, 113.26138305664062, 116.64543151855469, 120.02949523925781, 123.41354370117188, 126.79759979248047, 130.18165588378906]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 0.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 8.0, 17.0, 16.0, 15.0, 8.0, 23.0, 19.0, 35.0, 25.0, 32.0, 35.0, 43.0, 44.0, 49.0, 41.0, 49.0, 55.0, 31.0, 38.0, 47.0, 33.0, 38.0, 23.0, 39.0, 29.0, 20.0, 17.0, 23.0, 20.0, 22.0, 16.0, 12.0, 5.0, 10.0, 11.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-49.90693283081055, -48.360836029052734, -46.814735412597656, -45.268638610839844, -43.72254180908203, -42.17644500732422, -40.63034439086914, -39.08424758911133, -37.53814697265625, -35.99205017089844, -34.44594955444336, -32.89985275268555, -31.353755950927734, -29.80765724182129, -28.261558532714844, -26.71546173095703, -25.16936492919922, -23.623266220092773, -22.07716941833496, -20.531070709228516, -18.984973907470703, -17.438875198364258, -15.892776489257812, -14.346678733825684, -12.800580978393555, -11.254483222961426, -9.708385467529297, -8.162286758422852, -6.616189002990723, -5.070091247558594, -3.5239925384521484, -1.9778947830200195, -0.431793212890625, 1.114304780960083, 2.660402774810791, 4.206501007080078, 5.752598762512207, 7.298696517944336, 8.844795227050781, 10.39089298248291, 11.936990737915039, 13.483088493347168, 15.029186248779297, 16.575284957885742, 18.121383666992188, 19.66748046875, 21.213579177856445, 22.75967788696289, 24.305774688720703, 25.85187339782715, 27.39797019958496, 28.944068908691406, 30.49016571044922, 32.03626251220703, 33.58236312866211, 35.12845993041992, 36.674560546875, 38.22065734863281, 39.76675796508789, 41.3128547668457, 42.858951568603516, 44.405052185058594, 45.951148986816406, 47.49724578857422, 49.04334259033203]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 10.0, 16.0, 23.0, 37.0, 57.0, 101.0, 153.0, 362.0, 761.0, 1799.0, 5677.0, 32824.0, 3967602.0, 166161.0, 13238.0, 3128.0, 1192.0, 540.0, 278.0, 145.0, 73.0, 42.0, 24.0, 18.0, 7.0, 1.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-20.90625, -20.449462890625, -19.99267578125, -19.535888671875, -19.0791015625, -18.622314453125, -18.16552734375, -17.708740234375, -17.251953125, -16.795166015625, -16.33837890625, -15.881591796875, -15.4248046875, -14.968017578125, -14.51123046875, -14.054443359375, -13.59765625, -13.140869140625, -12.68408203125, -12.227294921875, -11.7705078125, -11.313720703125, -10.85693359375, -10.400146484375, -9.943359375, -9.486572265625, -9.02978515625, -8.572998046875, -8.1162109375, -7.659423828125, -7.20263671875, -6.745849609375, -6.2890625, -5.832275390625, -5.37548828125, -4.918701171875, -4.4619140625, -4.005126953125, -3.54833984375, -3.091552734375, -2.634765625, -2.177978515625, -1.72119140625, -1.264404296875, -0.8076171875, -0.350830078125, 0.10595703125, 0.562744140625, 1.01953125, 1.476318359375, 1.93310546875, 2.389892578125, 2.8466796875, 3.303466796875, 3.76025390625, 4.217041015625, 4.673828125, 5.130615234375, 5.58740234375, 6.044189453125, 6.5009765625, 6.957763671875, 7.41455078125, 7.871337890625, 8.328125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 5.0, 5.0, 7.0, 11.0, 6.0, 17.0, 18.0, 11.0, 21.0, 25.0, 25.0, 38.0, 27.0, 34.0, 46.0, 36.0, 43.0, 47.0, 38.0, 56.0, 47.0, 50.0, 48.0, 42.0, 46.0, 29.0, 33.0, 31.0, 33.0, 22.0, 18.0, 9.0, 11.0, 9.0, 12.0, 6.0, 11.0, 3.0, 5.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.015625, -1.954925537109375, -1.89422607421875, -1.833526611328125, -1.7728271484375, -1.712127685546875, -1.65142822265625, -1.590728759765625, -1.530029296875, -1.469329833984375, -1.40863037109375, -1.347930908203125, -1.2872314453125, -1.226531982421875, -1.16583251953125, -1.105133056640625, -1.04443359375, -0.983734130859375, -0.92303466796875, -0.862335205078125, -0.8016357421875, -0.740936279296875, -0.68023681640625, -0.619537353515625, -0.558837890625, -0.498138427734375, -0.43743896484375, -0.376739501953125, -0.3160400390625, -0.255340576171875, -0.19464111328125, -0.133941650390625, -0.0732421875, -0.012542724609375, 0.04815673828125, 0.108856201171875, 0.1695556640625, 0.230255126953125, 0.29095458984375, 0.351654052734375, 0.412353515625, 0.473052978515625, 0.53375244140625, 0.594451904296875, 0.6551513671875, 0.715850830078125, 0.77655029296875, 0.837249755859375, 0.89794921875, 0.958648681640625, 1.01934814453125, 1.080047607421875, 1.1407470703125, 1.201446533203125, 1.26214599609375, 1.322845458984375, 1.383544921875, 1.444244384765625, 1.50494384765625, 1.565643310546875, 1.6263427734375, 1.687042236328125, 1.74774169921875, 1.808441162109375, 1.869140625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 16.0, 19.0, 15.0, 34.0, 65.0, 85.0, 160.0, 217.0, 312.0, 494.0, 784.0, 1431.0, 2543.0, 5110.0, 11728.0, 36688.0, 222068.0, 3736067.0, 129769.0, 27262.0, 9534.0, 4366.0, 2196.0, 1259.0, 731.0, 449.0, 283.0, 191.0, 132.0, 74.0, 50.0, 42.0, 23.0, 21.0, 16.0, 8.0, 3.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.56561279296875, -6.3421630859375, -6.11871337890625, -5.895263671875, -5.67181396484375, -5.4483642578125, -5.22491455078125, -5.00146484375, -4.77801513671875, -4.5545654296875, -4.33111572265625, -4.107666015625, -3.88421630859375, -3.6607666015625, -3.43731689453125, -3.2138671875, -2.99041748046875, -2.7669677734375, -2.54351806640625, -2.320068359375, -2.09661865234375, -1.8731689453125, -1.64971923828125, -1.42626953125, -1.20281982421875, -0.9793701171875, -0.75592041015625, -0.532470703125, -0.30902099609375, -0.0855712890625, 0.13787841796875, 0.361328125, 0.58477783203125, 0.8082275390625, 1.03167724609375, 1.255126953125, 1.47857666015625, 1.7020263671875, 1.92547607421875, 2.14892578125, 2.37237548828125, 2.5958251953125, 2.81927490234375, 3.042724609375, 3.26617431640625, 3.4896240234375, 3.71307373046875, 3.9365234375, 4.15997314453125, 4.3834228515625, 4.60687255859375, 4.830322265625, 5.05377197265625, 5.2772216796875, 5.50067138671875, 5.72412109375, 5.94757080078125, 6.1710205078125, 6.39447021484375, 6.617919921875, 6.84136962890625, 7.0648193359375, 7.28826904296875, 7.51171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 11.0, 15.0, 24.0, 35.0, 61.0, 110.0, 304.0, 2885.0, 319.0, 116.0, 67.0, 36.0, 24.0, 21.0, 8.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7177734375, -1.6596221923828125, -1.601470947265625, -1.5433197021484375, -1.48516845703125, -1.4270172119140625, -1.368865966796875, -1.3107147216796875, -1.2525634765625, -1.1944122314453125, -1.136260986328125, -1.0781097412109375, -1.01995849609375, -0.9618072509765625, -0.903656005859375, -0.8455047607421875, -0.787353515625, -0.7292022705078125, -0.671051025390625, -0.6128997802734375, -0.55474853515625, -0.4965972900390625, -0.438446044921875, -0.3802947998046875, -0.3221435546875, -0.2639923095703125, -0.205841064453125, -0.1476898193359375, -0.08953857421875, -0.0313873291015625, 0.026763916015625, 0.0849151611328125, 0.14306640625, 0.2012176513671875, 0.259368896484375, 0.3175201416015625, 0.37567138671875, 0.4338226318359375, 0.491973876953125, 0.5501251220703125, 0.6082763671875, 0.6664276123046875, 0.724578857421875, 0.7827301025390625, 0.84088134765625, 0.8990325927734375, 0.957183837890625, 1.0153350830078125, 1.073486328125, 1.1316375732421875, 1.189788818359375, 1.2479400634765625, 1.30609130859375, 1.3642425537109375, 1.422393798828125, 1.4805450439453125, 1.5386962890625, 1.5968475341796875, 1.654998779296875, 1.7131500244140625, 1.77130126953125, 1.8294525146484375, 1.887603759765625, 1.9457550048828125, 2.00390625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 23.0, 53.0, 118.0, 188.0, 218.0, 189.0, 115.0, 54.0, 19.0, 13.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.867193222045898, -5.43170166015625, -4.996210098266602, -4.560718536376953, -4.125226974487305, -3.6897356510162354, -3.254244089126587, -2.8187525272369385, -2.38326096534729, -1.9477694034576416, -1.5122778415679932, -1.0767863988876343, -0.6412948369979858, -0.20580339431762695, 0.22968816757202148, 0.6651797294616699, 1.1006712913513184, 1.5361628532409668, 1.9716544151306152, 2.4071459770202637, 2.842637538909912, 3.2781288623809814, 3.71362042427063, 4.149111747741699, 4.584603309631348, 5.020094871520996, 5.4555864334106445, 5.891077995300293, 6.326569557189941, 6.76206111907959, 7.197552680969238, 7.633044242858887, 8.068535804748535, 8.504027366638184, 8.939518928527832, 9.37501049041748, 9.810502052307129, 10.245993614196777, 10.681485176086426, 11.116976737976074, 11.552468299865723, 11.987959861755371, 12.42345142364502, 12.858942985534668, 13.294434547424316, 13.729926109313965, 14.165417671203613, 14.600909233093262, 15.036399841308594, 15.471891403198242, 15.90738296508789, 16.34287452697754, 16.778366088867188, 17.213857650756836, 17.649349212646484, 18.084840774536133, 18.52033233642578, 18.95582389831543, 19.391315460205078, 19.826807022094727, 20.262298583984375, 20.697790145874023, 21.133281707763672, 21.56877326965332, 22.00426483154297]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 7.0, 8.0, 1.0, 8.0, 12.0, 12.0, 12.0, 12.0, 23.0, 18.0, 21.0, 22.0, 30.0, 31.0, 33.0, 51.0, 46.0, 48.0, 44.0, 43.0, 40.0, 39.0, 51.0, 45.0, 55.0, 35.0, 37.0, 33.0, 32.0, 12.0, 22.0, 22.0, 25.0, 16.0, 15.0, 11.0, 7.0, 4.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.157932281494141, -4.031371593475342, -3.904810905456543, -3.778250217437744, -3.6516895294189453, -3.5251288414001465, -3.3985681533813477, -3.272007465362549, -3.14544677734375, -3.018886089324951, -2.8923254013061523, -2.7657647132873535, -2.6392040252685547, -2.512643337249756, -2.386082649230957, -2.259521961212158, -2.1329612731933594, -2.0064005851745605, -1.8798398971557617, -1.753279209136963, -1.626718521118164, -1.5001578330993652, -1.3735971450805664, -1.2470364570617676, -1.1204757690429688, -0.9939150810241699, -0.8673543930053711, -0.7407937049865723, -0.6142330169677734, -0.4876723289489746, -0.3611116409301758, -0.23455095291137695, -0.10799074172973633, 0.0185699462890625, 0.14513063430786133, 0.27169132232666016, 0.398252010345459, 0.5248126983642578, 0.6513733863830566, 0.7779340744018555, 0.9044947624206543, 1.0310554504394531, 1.157616138458252, 1.2841768264770508, 1.4107375144958496, 1.5372982025146484, 1.6638588905334473, 1.790419578552246, 1.916980266571045, 2.0435409545898438, 2.1701016426086426, 2.2966623306274414, 2.4232230186462402, 2.549783706665039, 2.676344394683838, 2.8029050827026367, 2.9294657707214355, 3.0560264587402344, 3.182587146759033, 3.309147834777832, 3.435708522796631, 3.5622692108154297, 3.6888298988342285, 3.8153905868530273, 3.941951274871826]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 3.0, 7.0, 10.0, 26.0, 44.0, 66.0, 125.0, 243.0, 491.0, 1301.0, 4181.0, 17210.0, 76444.0, 300523.0, 446208.0, 154308.0, 35400.0, 8222.0, 2267.0, 780.0, 344.0, 138.0, 74.0, 59.0, 28.0, 14.0, 12.0, 6.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.49609375, -7.24822998046875, -7.0003662109375, -6.75250244140625, -6.504638671875, -6.25677490234375, -6.0089111328125, -5.76104736328125, -5.51318359375, -5.26531982421875, -5.0174560546875, -4.76959228515625, -4.521728515625, -4.27386474609375, -4.0260009765625, -3.77813720703125, -3.5302734375, -3.28240966796875, -3.0345458984375, -2.78668212890625, -2.538818359375, -2.29095458984375, -2.0430908203125, -1.79522705078125, -1.54736328125, -1.29949951171875, -1.0516357421875, -0.80377197265625, -0.555908203125, -0.30804443359375, -0.0601806640625, 0.18768310546875, 0.435546875, 0.68341064453125, 0.9312744140625, 1.17913818359375, 1.427001953125, 1.67486572265625, 1.9227294921875, 2.17059326171875, 2.41845703125, 2.66632080078125, 2.9141845703125, 3.16204833984375, 3.409912109375, 3.65777587890625, 3.9056396484375, 4.15350341796875, 4.4013671875, 4.64923095703125, 4.8970947265625, 5.14495849609375, 5.392822265625, 5.64068603515625, 5.8885498046875, 6.13641357421875, 6.38427734375, 6.63214111328125, 6.8800048828125, 7.12786865234375, 7.375732421875, 7.62359619140625, 7.8714599609375, 8.11932373046875, 8.3671875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 8.0, 3.0, 9.0, 8.0, 18.0, 17.0, 14.0, 23.0, 30.0, 23.0, 20.0, 40.0, 41.0, 41.0, 36.0, 53.0, 51.0, 44.0, 59.0, 44.0, 46.0, 46.0, 34.0, 38.0, 47.0, 31.0, 39.0, 21.0, 19.0, 16.0, 20.0, 18.0, 11.0, 3.0, 6.0, 9.0, 4.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.408203125, -2.33807373046875, -2.2679443359375, -2.19781494140625, -2.127685546875, -2.05755615234375, -1.9874267578125, -1.91729736328125, -1.84716796875, -1.77703857421875, -1.7069091796875, -1.63677978515625, -1.566650390625, -1.49652099609375, -1.4263916015625, -1.35626220703125, -1.2861328125, -1.21600341796875, -1.1458740234375, -1.07574462890625, -1.005615234375, -0.93548583984375, -0.8653564453125, -0.79522705078125, -0.72509765625, -0.65496826171875, -0.5848388671875, -0.51470947265625, -0.444580078125, -0.37445068359375, -0.3043212890625, -0.23419189453125, -0.1640625, -0.09393310546875, -0.0238037109375, 0.04632568359375, 0.116455078125, 0.18658447265625, 0.2567138671875, 0.32684326171875, 0.39697265625, 0.46710205078125, 0.5372314453125, 0.60736083984375, 0.677490234375, 0.74761962890625, 0.8177490234375, 0.88787841796875, 0.9580078125, 1.02813720703125, 1.0982666015625, 1.16839599609375, 1.238525390625, 1.30865478515625, 1.3787841796875, 1.44891357421875, 1.51904296875, 1.58917236328125, 1.6593017578125, 1.72943115234375, 1.799560546875, 1.86968994140625, 1.9398193359375, 2.00994873046875, 2.080078125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 4.0, 10.0, 11.0, 11.0, 16.0, 12.0, 29.0, 34.0, 44.0, 75.0, 126.0, 157.0, 224.0, 437.0, 706.0, 1553.0, 5546.0, 59967.0, 733164.0, 227291.0, 14091.0, 2553.0, 965.0, 574.0, 319.0, 198.0, 127.0, 76.0, 59.0, 39.0, 30.0, 24.0, 16.0, 11.0, 11.0, 6.0, 10.0, 3.0, 4.0, 2.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-15.3515625, -14.8824462890625, -14.413330078125, -13.9442138671875, -13.47509765625, -13.0059814453125, -12.536865234375, -12.0677490234375, -11.5986328125, -11.1295166015625, -10.660400390625, -10.1912841796875, -9.72216796875, -9.2530517578125, -8.783935546875, -8.3148193359375, -7.845703125, -7.3765869140625, -6.907470703125, -6.4383544921875, -5.96923828125, -5.5001220703125, -5.031005859375, -4.5618896484375, -4.0927734375, -3.6236572265625, -3.154541015625, -2.6854248046875, -2.21630859375, -1.7471923828125, -1.278076171875, -0.8089599609375, -0.33984375, 0.1292724609375, 0.598388671875, 1.0675048828125, 1.53662109375, 2.0057373046875, 2.474853515625, 2.9439697265625, 3.4130859375, 3.8822021484375, 4.351318359375, 4.8204345703125, 5.28955078125, 5.7586669921875, 6.227783203125, 6.6968994140625, 7.166015625, 7.6351318359375, 8.104248046875, 8.5733642578125, 9.04248046875, 9.5115966796875, 9.980712890625, 10.4498291015625, 10.9189453125, 11.3880615234375, 11.857177734375, 12.3262939453125, 12.79541015625, 13.2645263671875, 13.733642578125, 14.2027587890625, 14.671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 5.0, 2.0, 9.0, 8.0, 11.0, 12.0, 9.0, 12.0, 22.0, 15.0, 19.0, 19.0, 22.0, 20.0, 29.0, 14.0, 24.0, 36.0, 34.0, 46.0, 32.0, 46.0, 37.0, 38.0, 46.0, 39.0, 31.0, 34.0, 26.0, 33.0, 20.0, 37.0, 29.0, 26.0, 24.0, 22.0, 18.0, 16.0, 10.0, 9.0, 11.0, 14.0, 8.0, 4.0, 7.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.1171875, -8.83203125, -8.546875, -8.26171875, -7.9765625, -7.69140625, -7.40625, -7.12109375, -6.8359375, -6.55078125, -6.265625, -5.98046875, -5.6953125, -5.41015625, -5.125, -4.83984375, -4.5546875, -4.26953125, -3.984375, -3.69921875, -3.4140625, -3.12890625, -2.84375, -2.55859375, -2.2734375, -1.98828125, -1.703125, -1.41796875, -1.1328125, -0.84765625, -0.5625, -0.27734375, 0.0078125, 0.29296875, 0.578125, 0.86328125, 1.1484375, 1.43359375, 1.71875, 2.00390625, 2.2890625, 2.57421875, 2.859375, 3.14453125, 3.4296875, 3.71484375, 4.0, 4.28515625, 4.5703125, 4.85546875, 5.140625, 5.42578125, 5.7109375, 5.99609375, 6.28125, 6.56640625, 6.8515625, 7.13671875, 7.421875, 7.70703125, 7.9921875, 8.27734375, 8.5625, 8.84765625, 9.1328125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 6.0, 4.0, 4.0, 9.0, 6.0, 16.0, 22.0, 33.0, 64.0, 128.0, 217.0, 666.0, 1952.0, 9790.0, 102181.0, 766715.0, 150414.0, 12572.0, 2381.0, 735.0, 268.0, 130.0, 68.0, 55.0, 33.0, 21.0, 18.0, 18.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.56640625, -6.3583984375, -6.150390625, -5.9423828125, -5.734375, -5.5263671875, -5.318359375, -5.1103515625, -4.90234375, -4.6943359375, -4.486328125, -4.2783203125, -4.0703125, -3.8623046875, -3.654296875, -3.4462890625, -3.23828125, -3.0302734375, -2.822265625, -2.6142578125, -2.40625, -2.1982421875, -1.990234375, -1.7822265625, -1.57421875, -1.3662109375, -1.158203125, -0.9501953125, -0.7421875, -0.5341796875, -0.326171875, -0.1181640625, 0.08984375, 0.2978515625, 0.505859375, 0.7138671875, 0.921875, 1.1298828125, 1.337890625, 1.5458984375, 1.75390625, 1.9619140625, 2.169921875, 2.3779296875, 2.5859375, 2.7939453125, 3.001953125, 3.2099609375, 3.41796875, 3.6259765625, 3.833984375, 4.0419921875, 4.25, 4.4580078125, 4.666015625, 4.8740234375, 5.08203125, 5.2900390625, 5.498046875, 5.7060546875, 5.9140625, 6.1220703125, 6.330078125, 6.5380859375, 6.74609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 4.0, 5.0, 11.0, 14.0, 21.0, 33.0, 44.0, 53.0, 76.0, 82.0, 78.0, 98.0, 98.0, 97.0, 53.0, 67.0, 52.0, 25.0, 31.0, 14.0, 15.0, 4.0, 8.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009455680847167969, -0.0009210333228111267, -0.0008964985609054565, -0.0008719637989997864, -0.0008474290370941162, -0.000822894275188446, -0.0007983595132827759, -0.0007738247513771057, -0.0007492899894714355, -0.0007247552275657654, -0.0007002204656600952, -0.000675685703754425, -0.0006511509418487549, -0.0006266161799430847, -0.0006020814180374146, -0.0005775466561317444, -0.0005530118942260742, -0.000528477132320404, -0.0005039423704147339, -0.0004794076085090637, -0.00045487284660339355, -0.0004303380846977234, -0.0004058033227920532, -0.00038126856088638306, -0.0003567337989807129, -0.0003321990370750427, -0.00030766427516937256, -0.0002831295132637024, -0.0002585947513580322, -0.00023405998945236206, -0.0002095252275466919, -0.00018499046564102173, -0.00016045570373535156, -0.0001359209418296814, -0.00011138617992401123, -8.685141801834106e-05, -6.23166561126709e-05, -3.778189420700073e-05, -1.3247132301330566e-05, 1.12876296043396e-05, 3.5822391510009766e-05, 6.035715341567993e-05, 8.48919153213501e-05, 0.00010942667722702026, 0.00013396143913269043, 0.0001584962010383606, 0.00018303096294403076, 0.00020756572484970093, 0.0002321004867553711, 0.00025663524866104126, 0.0002811700105667114, 0.0003057047724723816, 0.00033023953437805176, 0.0003547742962837219, 0.0003793090581893921, 0.00040384382009506226, 0.0004283785820007324, 0.0004529133439064026, 0.00047744810581207275, 0.0005019828677177429, 0.0005265176296234131, 0.0005510523915290833, 0.0005755871534347534, 0.0006001219153404236, 0.0006246566772460938]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 2.0, 5.0, 9.0, 20.0, 29.0, 61.0, 118.0, 303.0, 976.0, 5807.0, 393321.0, 638204.0, 7971.0, 1150.0, 299.0, 121.0, 69.0, 34.0, 23.0, 14.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.421875, -11.0418701171875, -10.661865234375, -10.2818603515625, -9.90185546875, -9.5218505859375, -9.141845703125, -8.7618408203125, -8.3818359375, -8.0018310546875, -7.621826171875, -7.2418212890625, -6.86181640625, -6.4818115234375, -6.101806640625, -5.7218017578125, -5.341796875, -4.9617919921875, -4.581787109375, -4.2017822265625, -3.82177734375, -3.4417724609375, -3.061767578125, -2.6817626953125, -2.3017578125, -1.9217529296875, -1.541748046875, -1.1617431640625, -0.78173828125, -0.4017333984375, -0.021728515625, 0.3582763671875, 0.73828125, 1.1182861328125, 1.498291015625, 1.8782958984375, 2.25830078125, 2.6383056640625, 3.018310546875, 3.3983154296875, 3.7783203125, 4.1583251953125, 4.538330078125, 4.9183349609375, 5.29833984375, 5.6783447265625, 6.058349609375, 6.4383544921875, 6.818359375, 7.1983642578125, 7.578369140625, 7.9583740234375, 8.33837890625, 8.7183837890625, 9.098388671875, 9.4783935546875, 9.8583984375, 10.2384033203125, 10.618408203125, 10.9984130859375, 11.37841796875, 11.7584228515625, 12.138427734375, 12.5184326171875, 12.8984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 4.0, 8.0, 8.0, 11.0, 12.0, 11.0, 25.0, 26.0, 29.0, 41.0, 55.0, 46.0, 70.0, 90.0, 92.0, 80.0, 73.0, 55.0, 57.0, 55.0, 32.0, 24.0, 20.0, 23.0, 13.0, 7.0, 6.0, 3.0, 6.0, 5.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9921875, -3.86956787109375, -3.7469482421875, -3.62432861328125, -3.501708984375, -3.37908935546875, -3.2564697265625, -3.13385009765625, -3.01123046875, -2.88861083984375, -2.7659912109375, -2.64337158203125, -2.520751953125, -2.39813232421875, -2.2755126953125, -2.15289306640625, -2.0302734375, -1.90765380859375, -1.7850341796875, -1.66241455078125, -1.539794921875, -1.41717529296875, -1.2945556640625, -1.17193603515625, -1.04931640625, -0.92669677734375, -0.8040771484375, -0.68145751953125, -0.558837890625, -0.43621826171875, -0.3135986328125, -0.19097900390625, -0.068359375, 0.05426025390625, 0.1768798828125, 0.29949951171875, 0.422119140625, 0.54473876953125, 0.6673583984375, 0.78997802734375, 0.91259765625, 1.03521728515625, 1.1578369140625, 1.28045654296875, 1.403076171875, 1.52569580078125, 1.6483154296875, 1.77093505859375, 1.8935546875, 2.01617431640625, 2.1387939453125, 2.26141357421875, 2.384033203125, 2.50665283203125, 2.6292724609375, 2.75189208984375, 2.87451171875, 2.99713134765625, 3.1197509765625, 3.24237060546875, 3.364990234375, 3.48760986328125, 3.6102294921875, 3.73284912109375, 3.85546875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 31.0, 73.0, 144.0, 223.0, 244.0, 185.0, 57.0, 24.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.04737854003906, -118.25071716308594, -114.45406341552734, -110.65740203857422, -106.86074829101562, -103.0640869140625, -99.26742553710938, -95.47077178955078, -91.67411804199219, -87.87745666503906, -84.08080291748047, -80.28414154052734, -76.48748779296875, -72.69082641601562, -68.8941650390625, -65.0975112915039, -61.30084991455078, -57.50419235229492, -53.70753479003906, -49.91087341308594, -46.114219665527344, -42.31755828857422, -38.52090072631836, -34.7242431640625, -30.92758560180664, -27.13092803955078, -23.334270477294922, -19.53761100769043, -15.74095344543457, -11.944295883178711, -8.147636413574219, -4.350978851318359, -0.5543212890625, 3.2423367500305176, 7.038994789123535, 10.835653305053711, 14.63231086730957, 18.42896842956543, 22.225627899169922, 26.02228546142578, 29.81894302368164, 33.6156005859375, 37.41225814819336, 41.20891571044922, 45.005577087402344, 48.80223083496094, 52.59889221191406, 56.39554977416992, 60.19220733642578, 63.98886489868164, 67.7855224609375, 71.58218383789062, 75.37883758544922, 79.17549896240234, 82.97215270996094, 86.76881408691406, 90.56547546386719, 94.36213684082031, 98.1587905883789, 101.95545196533203, 105.75210571289062, 109.54876708984375, 113.34542846679688, 117.14208221435547, 120.93873596191406]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 5.0, 4.0, 6.0, 7.0, 6.0, 9.0, 10.0, 5.0, 16.0, 15.0, 25.0, 23.0, 31.0, 34.0, 31.0, 30.0, 37.0, 42.0, 38.0, 48.0, 56.0, 51.0, 49.0, 41.0, 42.0, 33.0, 42.0, 43.0, 32.0, 34.0, 24.0, 29.0, 10.0, 15.0, 12.0, 20.0, 11.0, 8.0, 7.0, 3.0, 5.0, 1.0, 4.0, 7.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-51.25354766845703, -49.56117248535156, -47.86880111694336, -46.17642593383789, -44.48405456542969, -42.79167938232422, -41.09930419921875, -39.40692901611328, -37.71455764770508, -36.02218246459961, -34.329811096191406, -32.63743591308594, -30.9450626373291, -29.252689361572266, -27.560314178466797, -25.86794090270996, -24.175567626953125, -22.48319435119629, -20.790821075439453, -19.098445892333984, -17.40607261657715, -15.713699340820312, -14.02132511138916, -12.328950881958008, -10.636577606201172, -8.944204330444336, -7.251830101013184, -5.5594563484191895, -3.8670825958251953, -2.1747093200683594, -0.48233509063720703, 1.2100391387939453, 2.9024124145507812, 4.594786167144775, 6.2871599197387695, 7.979533672332764, 9.671907424926758, 11.364280700683594, 13.056654930114746, 14.749029159545898, 16.441402435302734, 18.13377571105957, 19.826148986816406, 21.518524169921875, 23.21089744567871, 24.903270721435547, 26.595645904541016, 28.28801918029785, 29.980392456054688, 31.672765731811523, 33.36513900756836, 35.05751419067383, 36.74988555908203, 38.4422607421875, 40.13463592529297, 41.82701110839844, 43.51938247680664, 45.21175765991211, 46.90412902832031, 48.59650421142578, 50.28887939453125, 51.98125076293945, 53.67362594604492, 55.365997314453125, 57.058372497558594]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 4.0, 3.0, 4.0, 5.0, 5.0, 8.0, 12.0, 14.0, 24.0, 23.0, 39.0, 52.0, 88.0, 164.0, 252.0, 534.0, 1290.0, 4231.0, 19191.0, 196668.0, 3902564.0, 55774.0, 9163.0, 2376.0, 834.0, 382.0, 189.0, 127.0, 80.0, 51.0, 40.0, 30.0, 17.0, 11.0, 12.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1171875, -9.782958984375, -9.44873046875, -9.114501953125, -8.7802734375, -8.446044921875, -8.11181640625, -7.777587890625, -7.443359375, -7.109130859375, -6.77490234375, -6.440673828125, -6.1064453125, -5.772216796875, -5.43798828125, -5.103759765625, -4.76953125, -4.435302734375, -4.10107421875, -3.766845703125, -3.4326171875, -3.098388671875, -2.76416015625, -2.429931640625, -2.095703125, -1.761474609375, -1.42724609375, -1.093017578125, -0.7587890625, -0.424560546875, -0.09033203125, 0.243896484375, 0.578125, 0.912353515625, 1.24658203125, 1.580810546875, 1.9150390625, 2.249267578125, 2.58349609375, 2.917724609375, 3.251953125, 3.586181640625, 3.92041015625, 4.254638671875, 4.5888671875, 4.923095703125, 5.25732421875, 5.591552734375, 5.92578125, 6.260009765625, 6.59423828125, 6.928466796875, 7.2626953125, 7.596923828125, 7.93115234375, 8.265380859375, 8.599609375, 8.933837890625, 9.26806640625, 9.602294921875, 9.9365234375, 10.270751953125, 10.60498046875, 10.939208984375, 11.2734375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 8.0, 7.0, 8.0, 10.0, 11.0, 15.0, 18.0, 17.0, 15.0, 31.0, 24.0, 39.0, 41.0, 40.0, 46.0, 36.0, 40.0, 39.0, 42.0, 53.0, 38.0, 35.0, 48.0, 39.0, 30.0, 31.0, 25.0, 27.0, 29.0, 27.0, 26.0, 19.0, 14.0, 11.0, 7.0, 7.0, 7.0, 7.0, 5.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0], "bins": [-2.12109375, -2.0618438720703125, -2.002593994140625, -1.9433441162109375, -1.88409423828125, -1.8248443603515625, -1.765594482421875, -1.7063446044921875, -1.6470947265625, -1.5878448486328125, -1.528594970703125, -1.4693450927734375, -1.41009521484375, -1.3508453369140625, -1.291595458984375, -1.2323455810546875, -1.173095703125, -1.1138458251953125, -1.054595947265625, -0.9953460693359375, -0.93609619140625, -0.8768463134765625, -0.817596435546875, -0.7583465576171875, -0.6990966796875, -0.6398468017578125, -0.580596923828125, -0.5213470458984375, -0.46209716796875, -0.4028472900390625, -0.343597412109375, -0.2843475341796875, -0.22509765625, -0.1658477783203125, -0.106597900390625, -0.0473480224609375, 0.01190185546875, 0.0711517333984375, 0.130401611328125, 0.1896514892578125, 0.2489013671875, 0.3081512451171875, 0.367401123046875, 0.4266510009765625, 0.48590087890625, 0.5451507568359375, 0.604400634765625, 0.6636505126953125, 0.722900390625, 0.7821502685546875, 0.841400146484375, 0.9006500244140625, 0.95989990234375, 1.0191497802734375, 1.078399658203125, 1.1376495361328125, 1.1968994140625, 1.2561492919921875, 1.315399169921875, 1.3746490478515625, 1.43389892578125, 1.4931488037109375, 1.552398681640625, 1.6116485595703125, 1.6708984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 11.0, 17.0, 15.0, 18.0, 32.0, 47.0, 56.0, 82.0, 127.0, 172.0, 244.0, 327.0, 532.0, 725.0, 996.0, 1529.0, 2358.0, 3633.0, 6048.0, 9873.0, 17649.0, 34577.0, 79256.0, 261926.0, 3306847.0, 298885.0, 85799.0, 36462.0, 18398.0, 10246.0, 6086.0, 3821.0, 2444.0, 1597.0, 1063.0, 707.0, 489.0, 343.0, 256.0, 165.0, 110.0, 84.0, 64.0, 50.0, 28.0, 34.0, 10.0, 13.0, 10.0, 6.0, 5.0, 2.0, 7.0, 4.0, 1.0], "bins": [-3.490234375, -3.38616943359375, -3.2821044921875, -3.17803955078125, -3.073974609375, -2.96990966796875, -2.8658447265625, -2.76177978515625, -2.65771484375, -2.55364990234375, -2.4495849609375, -2.34552001953125, -2.241455078125, -2.13739013671875, -2.0333251953125, -1.92926025390625, -1.8251953125, -1.72113037109375, -1.6170654296875, -1.51300048828125, -1.408935546875, -1.30487060546875, -1.2008056640625, -1.09674072265625, -0.99267578125, -0.88861083984375, -0.7845458984375, -0.68048095703125, -0.576416015625, -0.47235107421875, -0.3682861328125, -0.26422119140625, -0.16015625, -0.05609130859375, 0.0479736328125, 0.15203857421875, 0.256103515625, 0.36016845703125, 0.4642333984375, 0.56829833984375, 0.67236328125, 0.77642822265625, 0.8804931640625, 0.98455810546875, 1.088623046875, 1.19268798828125, 1.2967529296875, 1.40081787109375, 1.5048828125, 1.60894775390625, 1.7130126953125, 1.81707763671875, 1.921142578125, 2.02520751953125, 2.1292724609375, 2.23333740234375, 2.33740234375, 2.44146728515625, 2.5455322265625, 2.64959716796875, 2.753662109375, 2.85772705078125, 2.9617919921875, 3.06585693359375, 3.169921875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 3.0, 2.0, 8.0, 10.0, 15.0, 16.0, 20.0, 22.0, 41.0, 65.0, 82.0, 189.0, 458.0, 2463.0, 282.0, 145.0, 69.0, 49.0, 27.0, 24.0, 18.0, 12.0, 15.0, 6.0, 4.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.61328125, -1.566253662109375, -1.51922607421875, -1.472198486328125, -1.4251708984375, -1.378143310546875, -1.33111572265625, -1.284088134765625, -1.237060546875, -1.190032958984375, -1.14300537109375, -1.095977783203125, -1.0489501953125, -1.001922607421875, -0.95489501953125, -0.907867431640625, -0.86083984375, -0.813812255859375, -0.76678466796875, -0.719757080078125, -0.6727294921875, -0.625701904296875, -0.57867431640625, -0.531646728515625, -0.484619140625, -0.437591552734375, -0.39056396484375, -0.343536376953125, -0.2965087890625, -0.249481201171875, -0.20245361328125, -0.155426025390625, -0.1083984375, -0.061370849609375, -0.01434326171875, 0.032684326171875, 0.0797119140625, 0.126739501953125, 0.17376708984375, 0.220794677734375, 0.267822265625, 0.314849853515625, 0.36187744140625, 0.408905029296875, 0.4559326171875, 0.502960205078125, 0.54998779296875, 0.597015380859375, 0.64404296875, 0.691070556640625, 0.73809814453125, 0.785125732421875, 0.8321533203125, 0.879180908203125, 0.92620849609375, 0.973236083984375, 1.020263671875, 1.067291259765625, 1.11431884765625, 1.161346435546875, 1.2083740234375, 1.255401611328125, 1.30242919921875, 1.349456787109375, 1.396484375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 16.0, 7.0, 22.0, 78.0, 158.0, 241.0, 237.0, 148.0, 48.0, 28.0, 7.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.13353729248047, -23.561254501342773, -22.988969802856445, -22.41668701171875, -21.844404220581055, -21.272119522094727, -20.69983673095703, -20.127552032470703, -19.555269241333008, -18.982986450195312, -18.410701751708984, -17.83841896057129, -17.266136169433594, -16.693851470947266, -16.12156867980957, -15.549284934997559, -14.977002143859863, -14.404718399047852, -13.832435607910156, -13.260151863098145, -12.687868118286133, -12.115585327148438, -11.543301582336426, -10.971017837524414, -10.398735046386719, -9.826451301574707, -9.254168510437012, -8.681884765625, -8.109601020812988, -7.537317752838135, -6.965034484863281, -6.3927507400512695, -5.820466041564941, -5.248182773590088, -4.675899028778076, -4.103615760803223, -3.53133225440979, -2.9590487480163574, -2.386765480041504, -1.8144817352294922, -1.2421984672546387, -0.6699150204658508, -0.09763157367706299, 0.4746518135070801, 1.0469353199005127, 1.6192188262939453, 2.191502094268799, 2.7637858390808105, 3.336069107055664, 3.9083526134490967, 4.480636119842529, 5.052919387817383, 5.6252031326293945, 6.197486400604248, 6.769769668579102, 7.342053413391113, 7.914336681365967, 8.48661994934082, 9.058903694152832, 9.631187438964844, 10.203470230102539, 10.77575397491455, 11.348037719726562, 11.920320510864258, 12.49260425567627]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 2.0, 4.0, 7.0, 6.0, 12.0, 11.0, 23.0, 16.0, 27.0, 31.0, 26.0, 41.0, 38.0, 39.0, 32.0, 48.0, 46.0, 47.0, 36.0, 61.0, 51.0, 56.0, 45.0, 43.0, 36.0, 31.0, 31.0, 31.0, 21.0, 12.0, 23.0, 14.0, 17.0, 14.0, 9.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.349039077758789, -5.192065715789795, -5.035092353820801, -4.878118991851807, -4.7211456298828125, -4.564172744750977, -4.407199382781982, -4.250226020812988, -4.093252658843994, -3.936279296875, -3.779305934906006, -3.622332811355591, -3.4653594493865967, -3.3083860874176025, -3.1514129638671875, -2.9944396018981934, -2.837466239929199, -2.680492877960205, -2.523519515991211, -2.366546392440796, -2.2095730304718018, -2.0525996685028076, -1.895626425743103, -1.7386531829833984, -1.5816798210144043, -1.4247064590454102, -1.2677332162857056, -1.110759973526001, -0.9537866115570068, -0.7968133091926575, -0.6398400068283081, -0.4828667640686035, -0.3258934020996094, -0.16892009973526, -0.011946797370910645, 0.14502650499343872, 0.3019998073577881, 0.45897310972213745, 0.6159464120864868, 0.7729196548461914, 0.9298930168151855, 1.0868663787841797, 1.2438396215438843, 1.4008128643035889, 1.557786226272583, 1.7147595882415771, 1.8717328310012817, 2.0287060737609863, 2.1856794357299805, 2.3426527976989746, 2.4996261596679688, 2.656599283218384, 2.813572645187378, 2.970546007156372, 3.127519130706787, 3.2844924926757812, 3.4414658546447754, 3.5984392166137695, 3.7554125785827637, 3.9123857021331787, 4.069358825683594, 4.226332187652588, 4.383305549621582, 4.540278911590576, 4.69725227355957]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 8.0, 10.0, 21.0, 35.0, 52.0, 124.0, 187.0, 394.0, 866.0, 2095.0, 5873.0, 19168.0, 70460.0, 233557.0, 408964.0, 216881.0, 63398.0, 17465.0, 5443.0, 1958.0, 789.0, 387.0, 189.0, 100.0, 56.0, 26.0, 18.0, 16.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.09765625, -6.9222412109375, -6.746826171875, -6.5714111328125, -6.39599609375, -6.2205810546875, -6.045166015625, -5.8697509765625, -5.6943359375, -5.5189208984375, -5.343505859375, -5.1680908203125, -4.99267578125, -4.8172607421875, -4.641845703125, -4.4664306640625, -4.291015625, -4.1156005859375, -3.940185546875, -3.7647705078125, -3.58935546875, -3.4139404296875, -3.238525390625, -3.0631103515625, -2.8876953125, -2.7122802734375, -2.536865234375, -2.3614501953125, -2.18603515625, -2.0106201171875, -1.835205078125, -1.6597900390625, -1.484375, -1.3089599609375, -1.133544921875, -0.9581298828125, -0.78271484375, -0.6072998046875, -0.431884765625, -0.2564697265625, -0.0810546875, 0.0943603515625, 0.269775390625, 0.4451904296875, 0.62060546875, 0.7960205078125, 0.971435546875, 1.1468505859375, 1.322265625, 1.4976806640625, 1.673095703125, 1.8485107421875, 2.02392578125, 2.1993408203125, 2.374755859375, 2.5501708984375, 2.7255859375, 2.9010009765625, 3.076416015625, 3.2518310546875, 3.42724609375, 3.6026611328125, 3.778076171875, 3.9534912109375, 4.12890625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 4.0, 10.0, 6.0, 11.0, 8.0, 15.0, 25.0, 19.0, 23.0, 26.0, 28.0, 38.0, 50.0, 45.0, 57.0, 54.0, 49.0, 49.0, 60.0, 44.0, 57.0, 42.0, 43.0, 40.0, 32.0, 26.0, 26.0, 23.0, 21.0, 19.0, 7.0, 4.0, 5.0, 14.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.794921875, -2.719970703125, -2.64501953125, -2.570068359375, -2.4951171875, -2.420166015625, -2.34521484375, -2.270263671875, -2.1953125, -2.120361328125, -2.04541015625, -1.970458984375, -1.8955078125, -1.820556640625, -1.74560546875, -1.670654296875, -1.595703125, -1.520751953125, -1.44580078125, -1.370849609375, -1.2958984375, -1.220947265625, -1.14599609375, -1.071044921875, -0.99609375, -0.921142578125, -0.84619140625, -0.771240234375, -0.6962890625, -0.621337890625, -0.54638671875, -0.471435546875, -0.396484375, -0.321533203125, -0.24658203125, -0.171630859375, -0.0966796875, -0.021728515625, 0.05322265625, 0.128173828125, 0.203125, 0.278076171875, 0.35302734375, 0.427978515625, 0.5029296875, 0.577880859375, 0.65283203125, 0.727783203125, 0.802734375, 0.877685546875, 0.95263671875, 1.027587890625, 1.1025390625, 1.177490234375, 1.25244140625, 1.327392578125, 1.40234375, 1.477294921875, 1.55224609375, 1.627197265625, 1.7021484375, 1.777099609375, 1.85205078125, 1.927001953125, 2.001953125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 7.0, 3.0, 14.0, 20.0, 17.0, 29.0, 45.0, 58.0, 101.0, 136.0, 248.0, 365.0, 686.0, 1307.0, 4045.0, 45275.0, 855899.0, 129840.0, 6735.0, 1675.0, 817.0, 463.0, 236.0, 148.0, 110.0, 77.0, 51.0, 40.0, 26.0, 13.0, 17.0, 8.0, 8.0, 7.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.328125, -15.8427734375, -15.357421875, -14.8720703125, -14.38671875, -13.9013671875, -13.416015625, -12.9306640625, -12.4453125, -11.9599609375, -11.474609375, -10.9892578125, -10.50390625, -10.0185546875, -9.533203125, -9.0478515625, -8.5625, -8.0771484375, -7.591796875, -7.1064453125, -6.62109375, -6.1357421875, -5.650390625, -5.1650390625, -4.6796875, -4.1943359375, -3.708984375, -3.2236328125, -2.73828125, -2.2529296875, -1.767578125, -1.2822265625, -0.796875, -0.3115234375, 0.173828125, 0.6591796875, 1.14453125, 1.6298828125, 2.115234375, 2.6005859375, 3.0859375, 3.5712890625, 4.056640625, 4.5419921875, 5.02734375, 5.5126953125, 5.998046875, 6.4833984375, 6.96875, 7.4541015625, 7.939453125, 8.4248046875, 8.91015625, 9.3955078125, 9.880859375, 10.3662109375, 10.8515625, 11.3369140625, 11.822265625, 12.3076171875, 12.79296875, 13.2783203125, 13.763671875, 14.2490234375, 14.734375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 12.0, 11.0, 9.0, 12.0, 11.0, 15.0, 18.0, 18.0, 22.0, 32.0, 29.0, 23.0, 46.0, 39.0, 28.0, 39.0, 33.0, 43.0, 48.0, 41.0, 42.0, 33.0, 25.0, 38.0, 29.0, 45.0, 28.0, 22.0, 20.0, 40.0, 27.0, 24.0, 25.0, 12.0, 10.0, 6.0, 7.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.140625, -7.864990234375, -7.58935546875, -7.313720703125, -7.0380859375, -6.762451171875, -6.48681640625, -6.211181640625, -5.935546875, -5.659912109375, -5.38427734375, -5.108642578125, -4.8330078125, -4.557373046875, -4.28173828125, -4.006103515625, -3.73046875, -3.454833984375, -3.17919921875, -2.903564453125, -2.6279296875, -2.352294921875, -2.07666015625, -1.801025390625, -1.525390625, -1.249755859375, -0.97412109375, -0.698486328125, -0.4228515625, -0.147216796875, 0.12841796875, 0.404052734375, 0.6796875, 0.955322265625, 1.23095703125, 1.506591796875, 1.7822265625, 2.057861328125, 2.33349609375, 2.609130859375, 2.884765625, 3.160400390625, 3.43603515625, 3.711669921875, 3.9873046875, 4.262939453125, 4.53857421875, 4.814208984375, 5.08984375, 5.365478515625, 5.64111328125, 5.916748046875, 6.1923828125, 6.468017578125, 6.74365234375, 7.019287109375, 7.294921875, 7.570556640625, 7.84619140625, 8.121826171875, 8.3974609375, 8.673095703125, 8.94873046875, 9.224365234375, 9.5]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 3.0, 9.0, 11.0, 17.0, 20.0, 21.0, 28.0, 36.0, 56.0, 87.0, 117.0, 191.0, 326.0, 687.0, 1629.0, 6589.0, 50595.0, 668681.0, 291984.0, 21266.0, 3786.0, 1142.0, 484.0, 278.0, 154.0, 88.0, 70.0, 59.0, 44.0, 26.0, 14.0, 15.0, 9.0, 11.0, 7.0, 5.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.28515625, -5.10174560546875, -4.9183349609375, -4.73492431640625, -4.551513671875, -4.36810302734375, -4.1846923828125, -4.00128173828125, -3.81787109375, -3.63446044921875, -3.4510498046875, -3.26763916015625, -3.084228515625, -2.90081787109375, -2.7174072265625, -2.53399658203125, -2.3505859375, -2.16717529296875, -1.9837646484375, -1.80035400390625, -1.616943359375, -1.43353271484375, -1.2501220703125, -1.06671142578125, -0.88330078125, -0.69989013671875, -0.5164794921875, -0.33306884765625, -0.149658203125, 0.03375244140625, 0.2171630859375, 0.40057373046875, 0.583984375, 0.76739501953125, 0.9508056640625, 1.13421630859375, 1.317626953125, 1.50103759765625, 1.6844482421875, 1.86785888671875, 2.05126953125, 2.23468017578125, 2.4180908203125, 2.60150146484375, 2.784912109375, 2.96832275390625, 3.1517333984375, 3.33514404296875, 3.5185546875, 3.70196533203125, 3.8853759765625, 4.06878662109375, 4.252197265625, 4.43560791015625, 4.6190185546875, 4.80242919921875, 4.98583984375, 5.16925048828125, 5.3526611328125, 5.53607177734375, 5.719482421875, 5.90289306640625, 6.0863037109375, 6.26971435546875, 6.453125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 6.0, 10.0, 7.0, 8.0, 16.0, 11.0, 20.0, 27.0, 32.0, 39.0, 44.0, 56.0, 58.0, 88.0, 88.0, 76.0, 88.0, 84.0, 51.0, 34.0, 34.0, 35.0, 18.0, 14.0, 7.0, 16.0, 16.0, 4.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006055831909179688, -0.0005870312452316284, -0.0005684792995452881, -0.0005499273538589478, -0.0005313754081726074, -0.0005128234624862671, -0.0004942715167999268, -0.0004757195711135864, -0.0004571676254272461, -0.00043861567974090576, -0.00042006373405456543, -0.0004015117883682251, -0.00038295984268188477, -0.00036440789699554443, -0.0003458559513092041, -0.00032730400562286377, -0.00030875205993652344, -0.0002902001142501831, -0.0002716481685638428, -0.00025309622287750244, -0.0002345442771911621, -0.00021599233150482178, -0.00019744038581848145, -0.0001788884401321411, -0.00016033649444580078, -0.00014178454875946045, -0.00012323260307312012, -0.00010468065738677979, -8.612871170043945e-05, -6.757676601409912e-05, -4.902482032775879e-05, -3.0472874641418457e-05, -1.1920928955078125e-05, 6.631016731262207e-06, 2.518296241760254e-05, 4.373490810394287e-05, 6.22868537902832e-05, 8.083879947662354e-05, 9.939074516296387e-05, 0.0001179426908493042, 0.00013649463653564453, 0.00015504658222198486, 0.0001735985279083252, 0.00019215047359466553, 0.00021070241928100586, 0.0002292543649673462, 0.0002478063106536865, 0.00026635825634002686, 0.0002849102020263672, 0.0003034621477127075, 0.00032201409339904785, 0.0003405660390853882, 0.0003591179847717285, 0.00037766993045806885, 0.0003962218761444092, 0.0004147738218307495, 0.00043332576751708984, 0.0004518777132034302, 0.0004704296588897705, 0.0004889816045761108, 0.0005075335502624512, 0.0005260854959487915, 0.0005446374416351318, 0.0005631893873214722, 0.0005817413330078125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 9.0, 12.0, 18.0, 28.0, 47.0, 77.0, 175.0, 357.0, 1002.0, 4351.0, 127155.0, 895661.0, 16645.0, 1904.0, 581.0, 257.0, 104.0, 62.0, 39.0, 18.0, 13.0, 11.0, 7.0, 3.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4765625, -10.13037109375, -9.7841796875, -9.43798828125, -9.091796875, -8.74560546875, -8.3994140625, -8.05322265625, -7.70703125, -7.36083984375, -7.0146484375, -6.66845703125, -6.322265625, -5.97607421875, -5.6298828125, -5.28369140625, -4.9375, -4.59130859375, -4.2451171875, -3.89892578125, -3.552734375, -3.20654296875, -2.8603515625, -2.51416015625, -2.16796875, -1.82177734375, -1.4755859375, -1.12939453125, -0.783203125, -0.43701171875, -0.0908203125, 0.25537109375, 0.6015625, 0.94775390625, 1.2939453125, 1.64013671875, 1.986328125, 2.33251953125, 2.6787109375, 3.02490234375, 3.37109375, 3.71728515625, 4.0634765625, 4.40966796875, 4.755859375, 5.10205078125, 5.4482421875, 5.79443359375, 6.140625, 6.48681640625, 6.8330078125, 7.17919921875, 7.525390625, 7.87158203125, 8.2177734375, 8.56396484375, 8.91015625, 9.25634765625, 9.6025390625, 9.94873046875, 10.294921875, 10.64111328125, 10.9873046875, 11.33349609375, 11.6796875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 7.0, 12.0, 13.0, 17.0, 27.0, 27.0, 47.0, 58.0, 67.0, 67.0, 90.0, 91.0, 103.0, 82.0, 65.0, 49.0, 40.0, 35.0, 15.0, 15.0, 13.0, 8.0, 9.0, 2.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4296875, -4.300384521484375, -4.17108154296875, -4.041778564453125, -3.9124755859375, -3.783172607421875, -3.65386962890625, -3.524566650390625, -3.395263671875, -3.265960693359375, -3.13665771484375, -3.007354736328125, -2.8780517578125, -2.748748779296875, -2.61944580078125, -2.490142822265625, -2.36083984375, -2.231536865234375, -2.10223388671875, -1.972930908203125, -1.8436279296875, -1.714324951171875, -1.58502197265625, -1.455718994140625, -1.326416015625, -1.197113037109375, -1.06781005859375, -0.938507080078125, -0.8092041015625, -0.679901123046875, -0.55059814453125, -0.421295166015625, -0.2919921875, -0.162689208984375, -0.03338623046875, 0.095916748046875, 0.2252197265625, 0.354522705078125, 0.48382568359375, 0.613128662109375, 0.742431640625, 0.871734619140625, 1.00103759765625, 1.130340576171875, 1.2596435546875, 1.388946533203125, 1.51824951171875, 1.647552490234375, 1.77685546875, 1.906158447265625, 2.03546142578125, 2.164764404296875, 2.2940673828125, 2.423370361328125, 2.55267333984375, 2.681976318359375, 2.811279296875, 2.940582275390625, 3.06988525390625, 3.199188232421875, 3.3284912109375, 3.457794189453125, 3.58709716796875, 3.716400146484375, 3.845703125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 30.0, 177.0, 419.0, 280.0, 74.0, 11.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-305.6329345703125, -299.8376770019531, -294.04241943359375, -288.2471618652344, -282.451904296875, -276.6566467285156, -270.86138916015625, -265.0661315917969, -259.2708740234375, -253.47561645507812, -247.68035888671875, -241.88510131835938, -236.08984375, -230.29458618164062, -224.49932861328125, -218.70407104492188, -212.9088134765625, -207.11355590820312, -201.31829833984375, -195.52304077148438, -189.727783203125, -183.93252563476562, -178.13726806640625, -172.34201049804688, -166.54673767089844, -160.75148010253906, -154.9562225341797, -149.1609649658203, -143.36570739746094, -137.57044982910156, -131.7751922607422, -125.97993469238281, -120.18467712402344, -114.38941955566406, -108.59416198730469, -102.79890441894531, -97.00364685058594, -91.20838928222656, -85.41313171386719, -79.61787414550781, -73.82261657714844, -68.02735900878906, -62.23210144042969, -56.43684387207031, -50.64158630371094, -44.84632873535156, -39.05106735229492, -33.25580978393555, -27.460548400878906, -21.66529083251953, -15.87003231048584, -10.074773788452148, -4.279516220092773, 1.5157413482666016, 7.311000823974609, 13.106258392333984, 18.90151596069336, 24.696773529052734, 30.49203109741211, 36.28729248046875, 42.082550048828125, 47.8778076171875, 53.673065185546875, 59.46832275390625, 65.26358032226562]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 10.0, 4.0, 10.0, 18.0, 10.0, 20.0, 19.0, 27.0, 32.0, 40.0, 31.0, 45.0, 46.0, 48.0, 55.0, 52.0, 63.0, 50.0, 53.0, 51.0, 34.0, 32.0, 41.0, 22.0, 30.0, 25.0, 22.0, 22.0, 18.0, 13.0, 13.0, 10.0, 9.0, 4.0, 4.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.66792297363281, -47.11891174316406, -45.56990051269531, -44.02089309692383, -42.47188186645508, -40.92287063598633, -39.373863220214844, -37.824851989746094, -36.275840759277344, -34.726829528808594, -33.177818298339844, -31.62881088256836, -30.07979965209961, -28.53078842163086, -26.981779098510742, -25.432769775390625, -23.883758544921875, -22.334747314453125, -20.785737991333008, -19.23672866821289, -17.68771743774414, -16.13870620727539, -14.589696884155273, -13.04068660736084, -11.491676330566406, -9.942666053771973, -8.393655776977539, -6.8446455001831055, -5.295635223388672, -3.7466249465942383, -2.1976146697998047, -0.6486043930053711, 0.9004058837890625, 2.449416160583496, 3.9984264373779297, 5.547436714172363, 7.096446990966797, 8.64545726776123, 10.194467544555664, 11.743477821350098, 13.292488098144531, 14.841498374938965, 16.3905086517334, 17.939517974853516, 19.488529205322266, 21.037540435791016, 22.586549758911133, 24.13555908203125, 25.6845703125, 27.23358154296875, 28.782590866088867, 30.331600189208984, 31.880611419677734, 33.429622650146484, 34.97863006591797, 36.52764129638672, 38.07665252685547, 39.62566375732422, 41.17467498779297, 42.72368240356445, 44.2726936340332, 45.82170486450195, 47.37071228027344, 48.91972351074219, 50.46873474121094]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 8.0, 8.0, 8.0, 8.0, 15.0, 15.0, 21.0, 35.0, 47.0, 59.0, 79.0, 147.0, 201.0, 355.0, 579.0, 1144.0, 2490.0, 5965.0, 18715.0, 122030.0, 3970428.0, 51750.0, 11986.0, 4202.0, 1764.0, 863.0, 446.0, 297.0, 176.0, 135.0, 92.0, 67.0, 39.0, 26.0, 25.0, 11.0, 5.0, 14.0, 9.0, 4.0, 3.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.3125, -8.0552978515625, -7.798095703125, -7.5408935546875, -7.28369140625, -7.0264892578125, -6.769287109375, -6.5120849609375, -6.2548828125, -5.9976806640625, -5.740478515625, -5.4832763671875, -5.22607421875, -4.9688720703125, -4.711669921875, -4.4544677734375, -4.197265625, -3.9400634765625, -3.682861328125, -3.4256591796875, -3.16845703125, -2.9112548828125, -2.654052734375, -2.3968505859375, -2.1396484375, -1.8824462890625, -1.625244140625, -1.3680419921875, -1.11083984375, -0.8536376953125, -0.596435546875, -0.3392333984375, -0.08203125, 0.1751708984375, 0.432373046875, 0.6895751953125, 0.94677734375, 1.2039794921875, 1.461181640625, 1.7183837890625, 1.9755859375, 2.2327880859375, 2.489990234375, 2.7471923828125, 3.00439453125, 3.2615966796875, 3.518798828125, 3.7760009765625, 4.033203125, 4.2904052734375, 4.547607421875, 4.8048095703125, 5.06201171875, 5.3192138671875, 5.576416015625, 5.8336181640625, 6.0908203125, 6.3480224609375, 6.605224609375, 6.8624267578125, 7.11962890625, 7.3768310546875, 7.634033203125, 7.8912353515625, 8.1484375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 5.0, 3.0, 11.0, 13.0, 22.0, 22.0, 18.0, 26.0, 33.0, 32.0, 40.0, 48.0, 62.0, 52.0, 49.0, 55.0, 54.0, 54.0, 45.0, 61.0, 33.0, 31.0, 34.0, 19.0, 28.0, 34.0, 21.0, 17.0, 10.0, 14.0, 8.0, 7.0, 10.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.736328125, -2.66058349609375, -2.5848388671875, -2.50909423828125, -2.433349609375, -2.35760498046875, -2.2818603515625, -2.20611572265625, -2.13037109375, -2.05462646484375, -1.9788818359375, -1.90313720703125, -1.827392578125, -1.75164794921875, -1.6759033203125, -1.60015869140625, -1.5244140625, -1.44866943359375, -1.3729248046875, -1.29718017578125, -1.221435546875, -1.14569091796875, -1.0699462890625, -0.99420166015625, -0.91845703125, -0.84271240234375, -0.7669677734375, -0.69122314453125, -0.615478515625, -0.53973388671875, -0.4639892578125, -0.38824462890625, -0.3125, -0.23675537109375, -0.1610107421875, -0.08526611328125, -0.009521484375, 0.06622314453125, 0.1419677734375, 0.21771240234375, 0.29345703125, 0.36920166015625, 0.4449462890625, 0.52069091796875, 0.596435546875, 0.67218017578125, 0.7479248046875, 0.82366943359375, 0.8994140625, 0.97515869140625, 1.0509033203125, 1.12664794921875, 1.202392578125, 1.27813720703125, 1.3538818359375, 1.42962646484375, 1.50537109375, 1.58111572265625, 1.6568603515625, 1.73260498046875, 1.808349609375, 1.88409423828125, 1.9598388671875, 2.03558349609375, 2.111328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 4.0, 6.0, 22.0, 19.0, 24.0, 39.0, 51.0, 68.0, 118.0, 179.0, 273.0, 367.0, 608.0, 910.0, 1530.0, 2499.0, 4362.0, 8400.0, 20387.0, 69791.0, 3698927.0, 313438.0, 42041.0, 14343.0, 6766.0, 3526.0, 1981.0, 1225.0, 781.0, 537.0, 317.0, 245.0, 150.0, 104.0, 72.0, 61.0, 30.0, 30.0, 12.0, 13.0, 11.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.97265625, -4.80010986328125, -4.6275634765625, -4.45501708984375, -4.282470703125, -4.10992431640625, -3.9373779296875, -3.76483154296875, -3.59228515625, -3.41973876953125, -3.2471923828125, -3.07464599609375, -2.902099609375, -2.72955322265625, -2.5570068359375, -2.38446044921875, -2.2119140625, -2.03936767578125, -1.8668212890625, -1.69427490234375, -1.521728515625, -1.34918212890625, -1.1766357421875, -1.00408935546875, -0.83154296875, -0.65899658203125, -0.4864501953125, -0.31390380859375, -0.141357421875, 0.03118896484375, 0.2037353515625, 0.37628173828125, 0.548828125, 0.72137451171875, 0.8939208984375, 1.06646728515625, 1.239013671875, 1.41156005859375, 1.5841064453125, 1.75665283203125, 1.92919921875, 2.10174560546875, 2.2742919921875, 2.44683837890625, 2.619384765625, 2.79193115234375, 2.9644775390625, 3.13702392578125, 3.3095703125, 3.48211669921875, 3.6546630859375, 3.82720947265625, 3.999755859375, 4.17230224609375, 4.3448486328125, 4.51739501953125, 4.68994140625, 4.86248779296875, 5.0350341796875, 5.20758056640625, 5.380126953125, 5.55267333984375, 5.7252197265625, 5.89776611328125, 6.0703125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 7.0, 2.0, 9.0, 8.0, 10.0, 15.0, 33.0, 50.0, 129.0, 572.0, 2897.0, 174.0, 51.0, 35.0, 26.0, 10.0, 11.0, 8.0, 8.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4814453125, -1.4224395751953125, -1.363433837890625, -1.3044281005859375, -1.24542236328125, -1.1864166259765625, -1.127410888671875, -1.0684051513671875, -1.0093994140625, -0.9503936767578125, -0.891387939453125, -0.8323822021484375, -0.77337646484375, -0.7143707275390625, -0.655364990234375, -0.5963592529296875, -0.537353515625, -0.4783477783203125, -0.419342041015625, -0.3603363037109375, -0.30133056640625, -0.2423248291015625, -0.183319091796875, -0.1243133544921875, -0.0653076171875, -0.0063018798828125, 0.052703857421875, 0.1117095947265625, 0.17071533203125, 0.2297210693359375, 0.288726806640625, 0.3477325439453125, 0.40673828125, 0.4657440185546875, 0.524749755859375, 0.5837554931640625, 0.64276123046875, 0.7017669677734375, 0.760772705078125, 0.8197784423828125, 0.8787841796875, 0.9377899169921875, 0.996795654296875, 1.0558013916015625, 1.11480712890625, 1.1738128662109375, 1.232818603515625, 1.2918243408203125, 1.350830078125, 1.4098358154296875, 1.468841552734375, 1.5278472900390625, 1.58685302734375, 1.6458587646484375, 1.704864501953125, 1.7638702392578125, 1.8228759765625, 1.8818817138671875, 1.940887451171875, 1.9998931884765625, 2.05889892578125, 2.1179046630859375, 2.176910400390625, 2.2359161376953125, 2.294921875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 5.0, 14.0, 67.0, 216.0, 339.0, 244.0, 75.0, 30.0, 8.0, 11.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.962778091430664, -5.252849578857422, -4.5429205894470215, -3.8329918384552, -3.123063087463379, -2.4131343364715576, -1.7032055854797363, -0.9932765960693359, -0.28334808349609375, 0.42658066749572754, 1.1365094184875488, 1.8464381694793701, 2.5563669204711914, 3.2662956714630127, 3.976224422454834, 4.686153411865234, 5.396081924438477, 6.106010437011719, 6.815939426422119, 7.5258684158325195, 8.235796928405762, 8.945725440979004, 9.655654907226562, 10.365583419799805, 11.075511932373047, 11.785440444946289, 12.495368957519531, 13.20529842376709, 13.915226936340332, 14.625155448913574, 15.335084915161133, 16.045013427734375, 16.75494384765625, 17.464872360229492, 18.174800872802734, 18.884729385375977, 19.59465789794922, 20.304588317871094, 21.014516830444336, 21.724445343017578, 22.43437385559082, 23.144302368164062, 23.854230880737305, 24.564159393310547, 25.274089813232422, 25.984018325805664, 26.693946838378906, 27.40387535095215, 28.11380386352539, 28.823732376098633, 29.533660888671875, 30.243589401245117, 30.95351791381836, 31.663448333740234, 32.373374938964844, 33.08330535888672, 33.793235778808594, 34.50316619873047, 35.21309280395508, 35.92302322387695, 36.63294982910156, 37.34288024902344, 38.05280685424805, 38.76273727416992, 39.47266387939453]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 6.0, 3.0, 10.0, 14.0, 10.0, 10.0, 17.0, 19.0, 26.0, 20.0, 26.0, 33.0, 35.0, 37.0, 39.0, 48.0, 43.0, 41.0, 42.0, 41.0, 42.0, 39.0, 43.0, 57.0, 42.0, 40.0, 29.0, 25.0, 20.0, 21.0, 18.0, 20.0, 18.0, 21.0, 17.0, 8.0, 6.0, 5.0, 3.0, 6.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.661427974700928, -4.5208024978637695, -4.380177021026611, -4.239551544189453, -4.098926067352295, -3.9583005905151367, -3.8176753520965576, -3.6770498752593994, -3.536424398422241, -3.395798921585083, -3.255173444747925, -3.1145479679107666, -2.9739227294921875, -2.8332972526550293, -2.692671775817871, -2.552046298980713, -2.4114208221435547, -2.2707953453063965, -2.1301698684692383, -1.9895445108413696, -1.8489190340042114, -1.7082935571670532, -1.5676681995391846, -1.4270427227020264, -1.2864172458648682, -1.14579176902771, -1.0051662921905518, -0.8645409345626831, -0.7239154577255249, -0.5832899808883667, -0.44266456365585327, -0.30203914642333984, -0.16141319274902344, -0.020787745714187622, 0.1198377013206482, 0.260463148355484, 0.4010885953903198, 0.541714072227478, 0.6823394894599915, 0.8229649066925049, 0.9635903835296631, 1.1042158603668213, 1.2448413372039795, 1.3854666948318481, 1.5260921716690063, 1.6667176485061646, 1.8073430061340332, 1.9479684829711914, 2.0885939598083496, 2.229219436645508, 2.369844913482666, 2.510470390319824, 2.6510958671569824, 2.7917213439941406, 2.9323465824127197, 3.072972059249878, 3.213597536087036, 3.3542230129241943, 3.4948484897613525, 3.6354739665985107, 3.77609920501709, 3.916724681854248, 4.057350158691406, 4.1979756355285645, 4.338601112365723]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 2.0, 6.0, 8.0, 13.0, 22.0, 20.0, 45.0, 72.0, 117.0, 209.0, 430.0, 961.0, 2584.0, 8421.0, 32531.0, 136434.0, 438241.0, 317310.0, 82388.0, 20065.0, 5428.0, 1814.0, 666.0, 334.0, 173.0, 96.0, 66.0, 38.0, 18.0, 17.0, 12.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.23046875, -5.04248046875, -4.8544921875, -4.66650390625, -4.478515625, -4.29052734375, -4.1025390625, -3.91455078125, -3.7265625, -3.53857421875, -3.3505859375, -3.16259765625, -2.974609375, -2.78662109375, -2.5986328125, -2.41064453125, -2.22265625, -2.03466796875, -1.8466796875, -1.65869140625, -1.470703125, -1.28271484375, -1.0947265625, -0.90673828125, -0.71875, -0.53076171875, -0.3427734375, -0.15478515625, 0.033203125, 0.22119140625, 0.4091796875, 0.59716796875, 0.78515625, 0.97314453125, 1.1611328125, 1.34912109375, 1.537109375, 1.72509765625, 1.9130859375, 2.10107421875, 2.2890625, 2.47705078125, 2.6650390625, 2.85302734375, 3.041015625, 3.22900390625, 3.4169921875, 3.60498046875, 3.79296875, 3.98095703125, 4.1689453125, 4.35693359375, 4.544921875, 4.73291015625, 4.9208984375, 5.10888671875, 5.296875, 5.48486328125, 5.6728515625, 5.86083984375, 6.048828125, 6.23681640625, 6.4248046875, 6.61279296875, 6.80078125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 7.0, 3.0, 5.0, 5.0, 7.0, 19.0, 25.0, 19.0, 29.0, 26.0, 37.0, 36.0, 52.0, 43.0, 52.0, 60.0, 59.0, 56.0, 60.0, 44.0, 49.0, 42.0, 37.0, 32.0, 35.0, 24.0, 26.0, 18.0, 15.0, 25.0, 16.0, 10.0, 6.0, 5.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.173828125, -3.09100341796875, -3.0081787109375, -2.92535400390625, -2.842529296875, -2.75970458984375, -2.6768798828125, -2.59405517578125, -2.51123046875, -2.42840576171875, -2.3455810546875, -2.26275634765625, -2.179931640625, -2.09710693359375, -2.0142822265625, -1.93145751953125, -1.8486328125, -1.76580810546875, -1.6829833984375, -1.60015869140625, -1.517333984375, -1.43450927734375, -1.3516845703125, -1.26885986328125, -1.18603515625, -1.10321044921875, -1.0203857421875, -0.93756103515625, -0.854736328125, -0.77191162109375, -0.6890869140625, -0.60626220703125, -0.5234375, -0.44061279296875, -0.3577880859375, -0.27496337890625, -0.192138671875, -0.10931396484375, -0.0264892578125, 0.05633544921875, 0.13916015625, 0.22198486328125, 0.3048095703125, 0.38763427734375, 0.470458984375, 0.55328369140625, 0.6361083984375, 0.71893310546875, 0.8017578125, 0.88458251953125, 0.9674072265625, 1.05023193359375, 1.133056640625, 1.21588134765625, 1.2987060546875, 1.38153076171875, 1.46435546875, 1.54718017578125, 1.6300048828125, 1.71282958984375, 1.795654296875, 1.87847900390625, 1.9613037109375, 2.04412841796875, 2.126953125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 13.0, 19.0, 25.0, 40.0, 59.0, 97.0, 163.0, 238.0, 487.0, 1142.0, 3488.0, 70514.0, 947764.0, 20345.0, 2261.0, 873.0, 430.0, 220.0, 136.0, 95.0, 45.0, 39.0, 18.0, 14.0, 6.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.78125, -17.106689453125, -16.43212890625, -15.757568359375, -15.0830078125, -14.408447265625, -13.73388671875, -13.059326171875, -12.384765625, -11.710205078125, -11.03564453125, -10.361083984375, -9.6865234375, -9.011962890625, -8.33740234375, -7.662841796875, -6.98828125, -6.313720703125, -5.63916015625, -4.964599609375, -4.2900390625, -3.615478515625, -2.94091796875, -2.266357421875, -1.591796875, -0.917236328125, -0.24267578125, 0.431884765625, 1.1064453125, 1.781005859375, 2.45556640625, 3.130126953125, 3.8046875, 4.479248046875, 5.15380859375, 5.828369140625, 6.5029296875, 7.177490234375, 7.85205078125, 8.526611328125, 9.201171875, 9.875732421875, 10.55029296875, 11.224853515625, 11.8994140625, 12.573974609375, 13.24853515625, 13.923095703125, 14.59765625, 15.272216796875, 15.94677734375, 16.621337890625, 17.2958984375, 17.970458984375, 18.64501953125, 19.319580078125, 19.994140625, 20.668701171875, 21.34326171875, 22.017822265625, 22.6923828125, 23.366943359375, 24.04150390625, 24.716064453125, 25.390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 12.0, 7.0, 14.0, 17.0, 19.0, 23.0, 34.0, 39.0, 43.0, 55.0, 58.0, 72.0, 71.0, 72.0, 68.0, 62.0, 53.0, 49.0, 40.0, 44.0, 42.0, 25.0, 18.0, 11.0, 12.0, 12.0, 10.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7421875, -14.2249755859375, -13.707763671875, -13.1905517578125, -12.67333984375, -12.1561279296875, -11.638916015625, -11.1217041015625, -10.6044921875, -10.0872802734375, -9.570068359375, -9.0528564453125, -8.53564453125, -8.0184326171875, -7.501220703125, -6.9840087890625, -6.466796875, -5.9495849609375, -5.432373046875, -4.9151611328125, -4.39794921875, -3.8807373046875, -3.363525390625, -2.8463134765625, -2.3291015625, -1.8118896484375, -1.294677734375, -0.7774658203125, -0.26025390625, 0.2569580078125, 0.774169921875, 1.2913818359375, 1.80859375, 2.3258056640625, 2.843017578125, 3.3602294921875, 3.87744140625, 4.3946533203125, 4.911865234375, 5.4290771484375, 5.9462890625, 6.4635009765625, 6.980712890625, 7.4979248046875, 8.01513671875, 8.5323486328125, 9.049560546875, 9.5667724609375, 10.083984375, 10.6011962890625, 11.118408203125, 11.6356201171875, 12.15283203125, 12.6700439453125, 13.187255859375, 13.7044677734375, 14.2216796875, 14.7388916015625, 15.256103515625, 15.7733154296875, 16.29052734375, 16.8077392578125, 17.324951171875, 17.8421630859375, 18.359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 9.0, 8.0, 8.0, 6.0, 12.0, 20.0, 31.0, 26.0, 31.0, 48.0, 79.0, 110.0, 186.0, 367.0, 692.0, 2494.0, 37324.0, 966614.0, 36357.0, 2487.0, 672.0, 347.0, 190.0, 125.0, 83.0, 67.0, 49.0, 28.0, 20.0, 18.0, 12.0, 11.0, 9.0, 5.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.8828125, -11.528076171875, -11.17333984375, -10.818603515625, -10.4638671875, -10.109130859375, -9.75439453125, -9.399658203125, -9.044921875, -8.690185546875, -8.33544921875, -7.980712890625, -7.6259765625, -7.271240234375, -6.91650390625, -6.561767578125, -6.20703125, -5.852294921875, -5.49755859375, -5.142822265625, -4.7880859375, -4.433349609375, -4.07861328125, -3.723876953125, -3.369140625, -3.014404296875, -2.65966796875, -2.304931640625, -1.9501953125, -1.595458984375, -1.24072265625, -0.885986328125, -0.53125, -0.176513671875, 0.17822265625, 0.532958984375, 0.8876953125, 1.242431640625, 1.59716796875, 1.951904296875, 2.306640625, 2.661376953125, 3.01611328125, 3.370849609375, 3.7255859375, 4.080322265625, 4.43505859375, 4.789794921875, 5.14453125, 5.499267578125, 5.85400390625, 6.208740234375, 6.5634765625, 6.918212890625, 7.27294921875, 7.627685546875, 7.982421875, 8.337158203125, 8.69189453125, 9.046630859375, 9.4013671875, 9.756103515625, 10.11083984375, 10.465576171875, 10.8203125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 7.0, 12.0, 17.0, 18.0, 22.0, 36.0, 32.0, 62.0, 63.0, 93.0, 127.0, 99.0, 91.0, 74.0, 49.0, 42.0, 26.0, 26.0, 19.0, 8.0, 11.0, 14.0, 7.0, 4.0, 6.0, 7.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0007557868957519531, -0.0007353052496910095, -0.0007148236036300659, -0.0006943419575691223, -0.0006738603115081787, -0.0006533786654472351, -0.0006328970193862915, -0.0006124153733253479, -0.0005919337272644043, -0.0005714520812034607, -0.0005509704351425171, -0.0005304887890815735, -0.0005100071430206299, -0.0004895254969596863, -0.0004690438508987427, -0.00044856220483779907, -0.00042808055877685547, -0.00040759891271591187, -0.00038711726665496826, -0.00036663562059402466, -0.00034615397453308105, -0.00032567232847213745, -0.00030519068241119385, -0.00028470903635025024, -0.00026422739028930664, -0.00024374574422836304, -0.00022326409816741943, -0.00020278245210647583, -0.00018230080604553223, -0.00016181915998458862, -0.00014133751392364502, -0.00012085586786270142, -0.00010037422180175781, -7.989257574081421e-05, -5.9410929679870605e-05, -3.8929283618927e-05, -1.84476375579834e-05, 2.034008502960205e-06, 2.251565456390381e-05, 4.299730062484741e-05, 6.347894668579102e-05, 8.396059274673462e-05, 0.00010444223880767822, 0.00012492388486862183, 0.00014540553092956543, 0.00016588717699050903, 0.00018636882305145264, 0.00020685046911239624, 0.00022733211517333984, 0.00024781376123428345, 0.00026829540729522705, 0.00028877705335617065, 0.00030925869941711426, 0.00032974034547805786, 0.00035022199153900146, 0.00037070363759994507, 0.00039118528366088867, 0.0004116669297218323, 0.0004321485757827759, 0.0004526302218437195, 0.0004731118679046631, 0.0004935935139656067, 0.0005140751600265503, 0.0005345568060874939, 0.0005550384521484375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 4.0, 3.0, 10.0, 5.0, 12.0, 10.0, 18.0, 29.0, 38.0, 46.0, 63.0, 94.0, 149.0, 218.0, 449.0, 1191.0, 5102.0, 68749.0, 928578.0, 37895.0, 3863.0, 962.0, 420.0, 224.0, 123.0, 78.0, 62.0, 45.0, 28.0, 18.0, 16.0, 7.0, 9.0, 12.0, 5.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.1640625, -8.8525390625, -8.541015625, -8.2294921875, -7.91796875, -7.6064453125, -7.294921875, -6.9833984375, -6.671875, -6.3603515625, -6.048828125, -5.7373046875, -5.42578125, -5.1142578125, -4.802734375, -4.4912109375, -4.1796875, -3.8681640625, -3.556640625, -3.2451171875, -2.93359375, -2.6220703125, -2.310546875, -1.9990234375, -1.6875, -1.3759765625, -1.064453125, -0.7529296875, -0.44140625, -0.1298828125, 0.181640625, 0.4931640625, 0.8046875, 1.1162109375, 1.427734375, 1.7392578125, 2.05078125, 2.3623046875, 2.673828125, 2.9853515625, 3.296875, 3.6083984375, 3.919921875, 4.2314453125, 4.54296875, 4.8544921875, 5.166015625, 5.4775390625, 5.7890625, 6.1005859375, 6.412109375, 6.7236328125, 7.03515625, 7.3466796875, 7.658203125, 7.9697265625, 8.28125, 8.5927734375, 8.904296875, 9.2158203125, 9.52734375, 9.8388671875, 10.150390625, 10.4619140625, 10.7734375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 6.0, 5.0, 3.0, 5.0, 5.0, 7.0, 17.0, 19.0, 17.0, 17.0, 28.0, 42.0, 56.0, 81.0, 110.0, 92.0, 106.0, 76.0, 82.0, 58.0, 53.0, 26.0, 17.0, 17.0, 16.0, 3.0, 8.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.390625, -3.24261474609375, -3.0946044921875, -2.94659423828125, -2.798583984375, -2.65057373046875, -2.5025634765625, -2.35455322265625, -2.20654296875, -2.05853271484375, -1.9105224609375, -1.76251220703125, -1.614501953125, -1.46649169921875, -1.3184814453125, -1.17047119140625, -1.0224609375, -0.87445068359375, -0.7264404296875, -0.57843017578125, -0.430419921875, -0.28240966796875, -0.1343994140625, 0.01361083984375, 0.16162109375, 0.30963134765625, 0.4576416015625, 0.60565185546875, 0.753662109375, 0.90167236328125, 1.0496826171875, 1.19769287109375, 1.345703125, 1.49371337890625, 1.6417236328125, 1.78973388671875, 1.937744140625, 2.08575439453125, 2.2337646484375, 2.38177490234375, 2.52978515625, 2.67779541015625, 2.8258056640625, 2.97381591796875, 3.121826171875, 3.26983642578125, 3.4178466796875, 3.56585693359375, 3.7138671875, 3.86187744140625, 4.0098876953125, 4.15789794921875, 4.305908203125, 4.45391845703125, 4.6019287109375, 4.74993896484375, 4.89794921875, 5.04595947265625, 5.1939697265625, 5.34197998046875, 5.489990234375, 5.63800048828125, 5.7860107421875, 5.93402099609375, 6.08203125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 11.0, 73.0, 493.0, 366.0, 49.0, 8.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-329.33428955078125, -321.27410888671875, -313.21392822265625, -305.15374755859375, -297.09356689453125, -289.03338623046875, -280.97320556640625, -272.91302490234375, -264.85284423828125, -256.79266357421875, -248.73248291015625, -240.67230224609375, -232.61212158203125, -224.55194091796875, -216.49176025390625, -208.43157958984375, -200.37139892578125, -192.31121826171875, -184.25103759765625, -176.19085693359375, -168.13067626953125, -160.07049560546875, -152.01031494140625, -143.95013427734375, -135.88995361328125, -127.82977294921875, -119.76959228515625, -111.70941162109375, -103.64923095703125, -95.58905029296875, -87.52886962890625, -79.46868896484375, -71.40850830078125, -63.34832763671875, -55.28814697265625, -47.22796630859375, -39.16778564453125, -31.10760498046875, -23.04742431640625, -14.98724365234375, -6.92706298828125, 1.13311767578125, 9.19329833984375, 17.25347900390625, 25.31365966796875, 33.37384033203125, 41.43402099609375, 49.49420166015625, 57.55438232421875, 65.61456298828125, 73.67474365234375, 81.73492431640625, 89.79510498046875, 97.85528564453125, 105.91546630859375, 113.97564697265625, 122.03582763671875, 130.09600830078125, 138.15618896484375, 146.21636962890625, 154.27655029296875, 162.33673095703125, 170.39691162109375, 178.45709228515625, 186.51727294921875]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 8.0, 4.0, 9.0, 9.0, 15.0, 19.0, 21.0, 21.0, 20.0, 19.0, 33.0, 29.0, 46.0, 41.0, 43.0, 49.0, 50.0, 48.0, 51.0, 57.0, 57.0, 51.0, 37.0, 37.0, 44.0, 23.0, 31.0, 22.0, 13.0, 22.0, 16.0, 15.0, 10.0, 9.0, 7.0, 4.0, 1.0, 3.0, 4.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.81565856933594, -48.26628112792969, -46.71690368652344, -45.16752624511719, -43.61814880371094, -42.06877136230469, -40.51939392089844, -38.97001647949219, -37.42063903808594, -35.87126159667969, -34.32188415527344, -32.77250671386719, -31.223129272460938, -29.673751831054688, -28.124372482299805, -26.574995040893555, -25.025615692138672, -23.476238250732422, -21.926860809326172, -20.377483367919922, -18.828105926513672, -17.278728485107422, -15.729349136352539, -14.179971694946289, -12.630594253540039, -11.081216812133789, -9.531839370727539, -7.982460975646973, -6.433083534240723, -4.883706092834473, -3.3343276977539062, -1.7849502563476562, -0.23557281494140625, 1.3138048648834229, 2.863182544708252, 4.41256046295166, 5.96193790435791, 7.51131534576416, 9.060693740844727, 10.610071182250977, 12.159448623657227, 13.708826065063477, 15.258203506469727, 16.80758285522461, 18.35696029663086, 19.90633773803711, 21.45571517944336, 23.00509262084961, 24.55447006225586, 26.10384750366211, 27.65322494506836, 29.20260238647461, 30.75197982788086, 32.30135726928711, 33.850738525390625, 35.400115966796875, 36.949493408203125, 38.498870849609375, 40.048248291015625, 41.597625732421875, 43.147003173828125, 44.696380615234375, 46.245758056640625, 47.795135498046875, 49.344512939453125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 6.0, 8.0, 14.0, 21.0, 35.0, 53.0, 125.0, 283.0, 566.0, 1196.0, 3206.0, 10790.0, 70577.0, 3980442.0, 107092.0, 13591.0, 3684.0, 1397.0, 639.0, 267.0, 126.0, 58.0, 38.0, 32.0, 12.0, 9.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.578125, -7.269775390625, -6.96142578125, -6.653076171875, -6.3447265625, -6.036376953125, -5.72802734375, -5.419677734375, -5.111328125, -4.802978515625, -4.49462890625, -4.186279296875, -3.8779296875, -3.569580078125, -3.26123046875, -2.952880859375, -2.64453125, -2.336181640625, -2.02783203125, -1.719482421875, -1.4111328125, -1.102783203125, -0.79443359375, -0.486083984375, -0.177734375, 0.130615234375, 0.43896484375, 0.747314453125, 1.0556640625, 1.364013671875, 1.67236328125, 1.980712890625, 2.2890625, 2.597412109375, 2.90576171875, 3.214111328125, 3.5224609375, 3.830810546875, 4.13916015625, 4.447509765625, 4.755859375, 5.064208984375, 5.37255859375, 5.680908203125, 5.9892578125, 6.297607421875, 6.60595703125, 6.914306640625, 7.22265625, 7.531005859375, 7.83935546875, 8.147705078125, 8.4560546875, 8.764404296875, 9.07275390625, 9.381103515625, 9.689453125, 9.997802734375, 10.30615234375, 10.614501953125, 10.9228515625, 11.231201171875, 11.53955078125, 11.847900390625, 12.15625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 7.0, 9.0, 11.0, 17.0, 16.0, 38.0, 35.0, 45.0, 49.0, 58.0, 71.0, 63.0, 82.0, 70.0, 65.0, 62.0, 49.0, 53.0, 38.0, 40.0, 27.0, 31.0, 14.0, 9.0, 10.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.57421875, -3.47149658203125, -3.3687744140625, -3.26605224609375, -3.163330078125, -3.06060791015625, -2.9578857421875, -2.85516357421875, -2.75244140625, -2.64971923828125, -2.5469970703125, -2.44427490234375, -2.341552734375, -2.23883056640625, -2.1361083984375, -2.03338623046875, -1.9306640625, -1.82794189453125, -1.7252197265625, -1.62249755859375, -1.519775390625, -1.41705322265625, -1.3143310546875, -1.21160888671875, -1.10888671875, -1.00616455078125, -0.9034423828125, -0.80072021484375, -0.697998046875, -0.59527587890625, -0.4925537109375, -0.38983154296875, -0.287109375, -0.18438720703125, -0.0816650390625, 0.02105712890625, 0.123779296875, 0.22650146484375, 0.3292236328125, 0.43194580078125, 0.53466796875, 0.63739013671875, 0.7401123046875, 0.84283447265625, 0.945556640625, 1.04827880859375, 1.1510009765625, 1.25372314453125, 1.3564453125, 1.45916748046875, 1.5618896484375, 1.66461181640625, 1.767333984375, 1.87005615234375, 1.9727783203125, 2.07550048828125, 2.17822265625, 2.28094482421875, 2.3836669921875, 2.48638916015625, 2.589111328125, 2.69183349609375, 2.7945556640625, 2.89727783203125, 3.0]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 11.0, 10.0, 21.0, 22.0, 47.0, 77.0, 102.0, 153.0, 245.0, 378.0, 617.0, 1042.0, 1818.0, 3225.0, 5954.0, 12542.0, 31417.0, 105187.0, 3124845.0, 778957.0, 78756.0, 25483.0, 11099.0, 5540.0, 2691.0, 1608.0, 939.0, 533.0, 359.0, 221.0, 131.0, 69.0, 61.0, 39.0, 27.0, 18.0, 12.0, 8.0, 9.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.716796875, -3.583587646484375, -3.45037841796875, -3.317169189453125, -3.1839599609375, -3.050750732421875, -2.91754150390625, -2.784332275390625, -2.651123046875, -2.517913818359375, -2.38470458984375, -2.251495361328125, -2.1182861328125, -1.985076904296875, -1.85186767578125, -1.718658447265625, -1.58544921875, -1.452239990234375, -1.31903076171875, -1.185821533203125, -1.0526123046875, -0.919403076171875, -0.78619384765625, -0.652984619140625, -0.519775390625, -0.386566162109375, -0.25335693359375, -0.120147705078125, 0.0130615234375, 0.146270751953125, 0.27947998046875, 0.412689208984375, 0.5458984375, 0.679107666015625, 0.81231689453125, 0.945526123046875, 1.0787353515625, 1.211944580078125, 1.34515380859375, 1.478363037109375, 1.611572265625, 1.744781494140625, 1.87799072265625, 2.011199951171875, 2.1444091796875, 2.277618408203125, 2.41082763671875, 2.544036865234375, 2.67724609375, 2.810455322265625, 2.94366455078125, 3.076873779296875, 3.2100830078125, 3.343292236328125, 3.47650146484375, 3.609710693359375, 3.742919921875, 3.876129150390625, 4.00933837890625, 4.142547607421875, 4.2757568359375, 4.408966064453125, 4.54217529296875, 4.675384521484375, 4.80859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 7.0, 13.0, 15.0, 16.0, 23.0, 33.0, 29.0, 49.0, 105.0, 153.0, 509.0, 2357.0, 391.0, 144.0, 71.0, 38.0, 26.0, 19.0, 18.0, 11.0, 9.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.904296875, -1.829315185546875, -1.75433349609375, -1.679351806640625, -1.6043701171875, -1.529388427734375, -1.45440673828125, -1.379425048828125, -1.304443359375, -1.229461669921875, -1.15447998046875, -1.079498291015625, -1.0045166015625, -0.929534912109375, -0.85455322265625, -0.779571533203125, -0.70458984375, -0.629608154296875, -0.55462646484375, -0.479644775390625, -0.4046630859375, -0.329681396484375, -0.25469970703125, -0.179718017578125, -0.104736328125, -0.029754638671875, 0.04522705078125, 0.120208740234375, 0.1951904296875, 0.270172119140625, 0.34515380859375, 0.420135498046875, 0.4951171875, 0.570098876953125, 0.64508056640625, 0.720062255859375, 0.7950439453125, 0.870025634765625, 0.94500732421875, 1.019989013671875, 1.094970703125, 1.169952392578125, 1.24493408203125, 1.319915771484375, 1.3948974609375, 1.469879150390625, 1.54486083984375, 1.619842529296875, 1.69482421875, 1.769805908203125, 1.84478759765625, 1.919769287109375, 1.9947509765625, 2.069732666015625, 2.14471435546875, 2.219696044921875, 2.294677734375, 2.369659423828125, 2.44464111328125, 2.519622802734375, 2.5946044921875, 2.669586181640625, 2.74456787109375, 2.819549560546875, 2.89453125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 9.0, 9.0, 23.0, 56.0, 83.0, 121.0, 149.0, 198.0, 152.0, 90.0, 46.0, 25.0, 13.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.088930130004883, -17.51546859741211, -16.942007064819336, -16.368547439575195, -15.795085906982422, -15.221624374389648, -14.648162841796875, -14.074701309204102, -13.501240730285645, -12.927779197692871, -12.354318618774414, -11.78085708618164, -11.207395553588867, -10.63393497467041, -10.060473442077637, -9.48701286315918, -8.913551330566406, -8.340089797973633, -7.766629219055176, -7.193167686462402, -6.619706630706787, -6.046245574951172, -5.472784042358398, -4.899322986602783, -4.325861930847168, -3.7524008750915527, -3.1789395809173584, -2.605478286743164, -2.032017230987549, -1.4585561752319336, -0.8850948810577393, -0.3116335868835449, 0.2618293762207031, 0.8352905511856079, 1.4087517261505127, 1.9822129011154175, 2.5556740760803223, 3.1291351318359375, 3.702596426010132, 4.276057720184326, 4.849518775939941, 5.422979831695557, 5.996440887451172, 6.569902420043945, 7.1433634757995605, 7.716824531555176, 8.29028606414795, 8.863746643066406, 9.43720817565918, 10.010669708251953, 10.58413028717041, 11.157591819763184, 11.73105239868164, 12.304513931274414, 12.877975463867188, 13.451436996459961, 14.024897575378418, 14.598359107971191, 15.171819686889648, 15.745281219482422, 16.318742752075195, 16.89220428466797, 17.46566390991211, 18.039125442504883, 18.612586975097656]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 2.0, 3.0, 9.0, 6.0, 8.0, 11.0, 16.0, 16.0, 26.0, 18.0, 13.0, 28.0, 33.0, 24.0, 27.0, 39.0, 38.0, 55.0, 42.0, 53.0, 55.0, 48.0, 47.0, 41.0, 45.0, 49.0, 49.0, 46.0, 27.0, 25.0, 17.0, 13.0, 12.0, 14.0, 10.0, 9.0, 4.0, 8.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.451807975769043, -7.198174953460693, -6.944541931152344, -6.690908908843994, -6.4372758865356445, -6.183642864227295, -5.930009841918945, -5.676377296447754, -5.422743797302246, -5.1691107749938965, -4.915477752685547, -4.661844730377197, -4.408211708068848, -4.154578685760498, -3.9009459018707275, -3.647312879562378, -3.3936800956726074, -3.140047073364258, -2.886414051055908, -2.6327810287475586, -2.379148006439209, -2.1255149841308594, -1.8718822002410889, -1.6182491779327393, -1.3646161556243896, -1.11098313331604, -0.8573501706123352, -0.6037172079086304, -0.35008418560028076, -0.09645116329193115, 0.1571817398071289, 0.4108147621154785, 0.6644477844238281, 0.9180808067321777, 1.1717138290405273, 1.4253467321395874, 1.678979754447937, 1.9326127767562866, 2.1862456798553467, 2.4398787021636963, 2.693511724472046, 2.9471447467803955, 3.200777769088745, 3.4544105529785156, 3.7080435752868652, 3.961676597595215, 4.2153096199035645, 4.468942642211914, 4.722575664520264, 4.976208686828613, 5.229841709136963, 5.4834747314453125, 5.737107753753662, 5.990740776062012, 6.244373321533203, 6.498006820678711, 6.751639366149902, 7.005272388458252, 7.258905410766602, 7.512538433074951, 7.766171455383301, 8.019804000854492, 8.2734375, 8.527070045471191, 8.7807035446167]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 10.0, 7.0, 11.0, 11.0, 27.0, 32.0, 55.0, 92.0, 210.0, 412.0, 921.0, 2381.0, 7499.0, 30427.0, 152786.0, 563725.0, 230037.0, 44414.0, 10188.0, 3058.0, 1123.0, 512.0, 263.0, 122.0, 82.0, 46.0, 21.0, 12.0, 12.0, 13.0, 8.0, 2.0, 8.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5390625, -9.2635498046875, -8.988037109375, -8.7125244140625, -8.43701171875, -8.1614990234375, -7.885986328125, -7.6104736328125, -7.3349609375, -7.0594482421875, -6.783935546875, -6.5084228515625, -6.23291015625, -5.9573974609375, -5.681884765625, -5.4063720703125, -5.130859375, -4.8553466796875, -4.579833984375, -4.3043212890625, -4.02880859375, -3.7532958984375, -3.477783203125, -3.2022705078125, -2.9267578125, -2.6512451171875, -2.375732421875, -2.1002197265625, -1.82470703125, -1.5491943359375, -1.273681640625, -0.9981689453125, -0.72265625, -0.4471435546875, -0.171630859375, 0.1038818359375, 0.37939453125, 0.6549072265625, 0.930419921875, 1.2059326171875, 1.4814453125, 1.7569580078125, 2.032470703125, 2.3079833984375, 2.58349609375, 2.8590087890625, 3.134521484375, 3.4100341796875, 3.685546875, 3.9610595703125, 4.236572265625, 4.5120849609375, 4.78759765625, 5.0631103515625, 5.338623046875, 5.6141357421875, 5.8896484375, 6.1651611328125, 6.440673828125, 6.7161865234375, 6.99169921875, 7.2672119140625, 7.542724609375, 7.8182373046875, 8.09375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 4.0, 6.0, 9.0, 16.0, 14.0, 17.0, 23.0, 37.0, 41.0, 52.0, 53.0, 65.0, 87.0, 76.0, 70.0, 75.0, 61.0, 49.0, 55.0, 44.0, 38.0, 31.0, 19.0, 20.0, 16.0, 7.0, 6.0, 1.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.19921875, -4.085784912109375, -3.97235107421875, -3.858917236328125, -3.7454833984375, -3.632049560546875, -3.51861572265625, -3.405181884765625, -3.291748046875, -3.178314208984375, -3.06488037109375, -2.951446533203125, -2.8380126953125, -2.724578857421875, -2.61114501953125, -2.497711181640625, -2.38427734375, -2.270843505859375, -2.15740966796875, -2.043975830078125, -1.9305419921875, -1.817108154296875, -1.70367431640625, -1.590240478515625, -1.476806640625, -1.363372802734375, -1.24993896484375, -1.136505126953125, -1.0230712890625, -0.909637451171875, -0.79620361328125, -0.682769775390625, -0.5693359375, -0.455902099609375, -0.34246826171875, -0.229034423828125, -0.1156005859375, -0.002166748046875, 0.11126708984375, 0.224700927734375, 0.338134765625, 0.451568603515625, 0.56500244140625, 0.678436279296875, 0.7918701171875, 0.905303955078125, 1.01873779296875, 1.132171630859375, 1.24560546875, 1.359039306640625, 1.47247314453125, 1.585906982421875, 1.6993408203125, 1.812774658203125, 1.92620849609375, 2.039642333984375, 2.153076171875, 2.266510009765625, 2.37994384765625, 2.493377685546875, 2.6068115234375, 2.720245361328125, 2.83367919921875, 2.947113037109375, 3.060546875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 5.0, 8.0, 4.0, 10.0, 24.0, 34.0, 29.0, 45.0, 96.0, 141.0, 295.0, 580.0, 1759.0, 11364.0, 889173.0, 138482.0, 4453.0, 1080.0, 420.0, 219.0, 92.0, 78.0, 49.0, 30.0, 22.0, 18.0, 15.0, 11.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-34.625, -33.708984375, -32.79296875, -31.876953125, -30.9609375, -30.044921875, -29.12890625, -28.212890625, -27.296875, -26.380859375, -25.46484375, -24.548828125, -23.6328125, -22.716796875, -21.80078125, -20.884765625, -19.96875, -19.052734375, -18.13671875, -17.220703125, -16.3046875, -15.388671875, -14.47265625, -13.556640625, -12.640625, -11.724609375, -10.80859375, -9.892578125, -8.9765625, -8.060546875, -7.14453125, -6.228515625, -5.3125, -4.396484375, -3.48046875, -2.564453125, -1.6484375, -0.732421875, 0.18359375, 1.099609375, 2.015625, 2.931640625, 3.84765625, 4.763671875, 5.6796875, 6.595703125, 7.51171875, 8.427734375, 9.34375, 10.259765625, 11.17578125, 12.091796875, 13.0078125, 13.923828125, 14.83984375, 15.755859375, 16.671875, 17.587890625, 18.50390625, 19.419921875, 20.3359375, 21.251953125, 22.16796875, 23.083984375, 24.0]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 6.0, 12.0, 13.0, 18.0, 19.0, 19.0, 26.0, 29.0, 33.0, 30.0, 44.0, 34.0, 64.0, 57.0, 49.0, 62.0, 38.0, 53.0, 50.0, 47.0, 51.0, 37.0, 29.0, 39.0, 24.0, 26.0, 18.0, 10.0, 14.0, 14.0, 10.0, 3.0, 5.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0], "bins": [-15.828125, -15.431640625, -15.03515625, -14.638671875, -14.2421875, -13.845703125, -13.44921875, -13.052734375, -12.65625, -12.259765625, -11.86328125, -11.466796875, -11.0703125, -10.673828125, -10.27734375, -9.880859375, -9.484375, -9.087890625, -8.69140625, -8.294921875, -7.8984375, -7.501953125, -7.10546875, -6.708984375, -6.3125, -5.916015625, -5.51953125, -5.123046875, -4.7265625, -4.330078125, -3.93359375, -3.537109375, -3.140625, -2.744140625, -2.34765625, -1.951171875, -1.5546875, -1.158203125, -0.76171875, -0.365234375, 0.03125, 0.427734375, 0.82421875, 1.220703125, 1.6171875, 2.013671875, 2.41015625, 2.806640625, 3.203125, 3.599609375, 3.99609375, 4.392578125, 4.7890625, 5.185546875, 5.58203125, 5.978515625, 6.375, 6.771484375, 7.16796875, 7.564453125, 7.9609375, 8.357421875, 8.75390625, 9.150390625, 9.546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 8.0, 8.0, 17.0, 14.0, 17.0, 41.0, 52.0, 92.0, 141.0, 321.0, 799.0, 4276.0, 81453.0, 939799.0, 18371.0, 2060.0, 540.0, 215.0, 102.0, 62.0, 38.0, 21.0, 25.0, 11.0, 20.0, 14.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.59375, -10.244140625, -9.89453125, -9.544921875, -9.1953125, -8.845703125, -8.49609375, -8.146484375, -7.796875, -7.447265625, -7.09765625, -6.748046875, -6.3984375, -6.048828125, -5.69921875, -5.349609375, -5.0, -4.650390625, -4.30078125, -3.951171875, -3.6015625, -3.251953125, -2.90234375, -2.552734375, -2.203125, -1.853515625, -1.50390625, -1.154296875, -0.8046875, -0.455078125, -0.10546875, 0.244140625, 0.59375, 0.943359375, 1.29296875, 1.642578125, 1.9921875, 2.341796875, 2.69140625, 3.041015625, 3.390625, 3.740234375, 4.08984375, 4.439453125, 4.7890625, 5.138671875, 5.48828125, 5.837890625, 6.1875, 6.537109375, 6.88671875, 7.236328125, 7.5859375, 7.935546875, 8.28515625, 8.634765625, 8.984375, 9.333984375, 9.68359375, 10.033203125, 10.3828125, 10.732421875, 11.08203125, 11.431640625, 11.78125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 14.0, 35.0, 28.0, 55.0, 70.0, 138.0, 253.0, 158.0, 66.0, 68.0, 32.0, 17.0, 25.0, 17.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001239776611328125, -0.0011930614709854126, -0.0011463463306427002, -0.0010996311902999878, -0.0010529160499572754, -0.001006200909614563, -0.0009594857692718506, -0.0009127706289291382, -0.0008660554885864258, -0.0008193403482437134, -0.000772625207901001, -0.0007259100675582886, -0.0006791949272155762, -0.0006324797868728638, -0.0005857646465301514, -0.000539049506187439, -0.0004923343658447266, -0.00044561922550201416, -0.00039890408515930176, -0.00035218894481658936, -0.00030547380447387695, -0.00025875866413116455, -0.00021204352378845215, -0.00016532838344573975, -0.00011861324310302734, -7.189810276031494e-05, -2.518296241760254e-05, 2.1532177925109863e-05, 6.824731826782227e-05, 0.00011496245861053467, 0.00016167759895324707, 0.00020839273929595947, 0.0002551078796386719, 0.0003018230199813843, 0.0003485381603240967, 0.0003952533006668091, 0.0004419684410095215, 0.0004886835813522339, 0.0005353987216949463, 0.0005821138620376587, 0.0006288290023803711, 0.0006755441427230835, 0.0007222592830657959, 0.0007689744234085083, 0.0008156895637512207, 0.0008624047040939331, 0.0009091198444366455, 0.0009558349847793579, 0.0010025501251220703, 0.0010492652654647827, 0.0010959804058074951, 0.0011426955461502075, 0.00118941068649292, 0.0012361258268356323, 0.0012828409671783447, 0.0013295561075210571, 0.0013762712478637695, 0.001422986388206482, 0.0014697015285491943, 0.0015164166688919067, 0.0015631318092346191, 0.0016098469495773315, 0.001656562089920044, 0.0017032772302627563, 0.0017499923706054688]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 7.0, 7.0, 6.0, 14.0, 12.0, 23.0, 31.0, 38.0, 79.0, 150.0, 290.0, 747.0, 2968.0, 20613.0, 957549.0, 59105.0, 4904.0, 1163.0, 379.0, 165.0, 91.0, 69.0, 32.0, 21.0, 25.0, 17.0, 16.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6015625, -9.212158203125, -8.82275390625, -8.433349609375, -8.0439453125, -7.654541015625, -7.26513671875, -6.875732421875, -6.486328125, -6.096923828125, -5.70751953125, -5.318115234375, -4.9287109375, -4.539306640625, -4.14990234375, -3.760498046875, -3.37109375, -2.981689453125, -2.59228515625, -2.202880859375, -1.8134765625, -1.424072265625, -1.03466796875, -0.645263671875, -0.255859375, 0.133544921875, 0.52294921875, 0.912353515625, 1.3017578125, 1.691162109375, 2.08056640625, 2.469970703125, 2.859375, 3.248779296875, 3.63818359375, 4.027587890625, 4.4169921875, 4.806396484375, 5.19580078125, 5.585205078125, 5.974609375, 6.364013671875, 6.75341796875, 7.142822265625, 7.5322265625, 7.921630859375, 8.31103515625, 8.700439453125, 9.08984375, 9.479248046875, 9.86865234375, 10.258056640625, 10.6474609375, 11.036865234375, 11.42626953125, 11.815673828125, 12.205078125, 12.594482421875, 12.98388671875, 13.373291015625, 13.7626953125, 14.152099609375, 14.54150390625, 14.930908203125, 15.3203125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 10.0, 10.0, 36.0, 53.0, 97.0, 190.0, 273.0, 134.0, 87.0, 36.0, 22.0, 13.0, 2.0, 7.0, 5.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4765625, -8.1768798828125, -7.877197265625, -7.5775146484375, -7.27783203125, -6.9781494140625, -6.678466796875, -6.3787841796875, -6.0791015625, -5.7794189453125, -5.479736328125, -5.1800537109375, -4.88037109375, -4.5806884765625, -4.281005859375, -3.9813232421875, -3.681640625, -3.3819580078125, -3.082275390625, -2.7825927734375, -2.48291015625, -2.1832275390625, -1.883544921875, -1.5838623046875, -1.2841796875, -0.9844970703125, -0.684814453125, -0.3851318359375, -0.08544921875, 0.2142333984375, 0.513916015625, 0.8135986328125, 1.11328125, 1.4129638671875, 1.712646484375, 2.0123291015625, 2.31201171875, 2.6116943359375, 2.911376953125, 3.2110595703125, 3.5107421875, 3.8104248046875, 4.110107421875, 4.4097900390625, 4.70947265625, 5.0091552734375, 5.308837890625, 5.6085205078125, 5.908203125, 6.2078857421875, 6.507568359375, 6.8072509765625, 7.10693359375, 7.4066162109375, 7.706298828125, 8.0059814453125, 8.3056640625, 8.6053466796875, 8.905029296875, 9.2047119140625, 9.50439453125, 9.8040771484375, 10.103759765625, 10.4034423828125, 10.703125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 14.0, 54.0, 177.0, 362.0, 260.0, 86.0, 28.0, 7.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.8398895263672, -154.28648376464844, -148.73306274414062, -143.17965698242188, -137.62623596191406, -132.0728302001953, -126.51941680908203, -120.96600341796875, -115.41259002685547, -109.85917663574219, -104.3057632446289, -98.75234985351562, -93.19894409179688, -87.64552307128906, -82.09211730957031, -76.53870391845703, -70.98529052734375, -65.43187713623047, -59.87846374511719, -54.32505416870117, -48.77164077758789, -43.21822738647461, -37.664817810058594, -32.11140441894531, -26.55799102783203, -21.00457763671875, -15.451166152954102, -9.897754669189453, -4.344341278076172, 1.2090721130371094, 6.762481689453125, 12.315895080566406, 17.86932373046875, 23.42273712158203, 28.97614860534668, 34.52956008911133, 40.08297348022461, 45.63638687133789, 51.189796447753906, 56.74320983886719, 62.29662322998047, 67.85003662109375, 73.40345001220703, 78.95686340332031, 84.51026916503906, 90.06369018554688, 95.61709594726562, 101.1705093383789, 106.72392272949219, 112.27733612060547, 117.83074951171875, 123.3841552734375, 128.9375762939453, 134.49098205566406, 140.04440307617188, 145.59780883789062, 151.15121459960938, 156.70462036132812, 162.25804138183594, 167.8114471435547, 173.3648681640625, 178.91827392578125, 184.4716796875, 190.0251007080078, 195.57852172851562]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 5.0, 9.0, 6.0, 10.0, 12.0, 14.0, 29.0, 23.0, 23.0, 27.0, 33.0, 39.0, 43.0, 53.0, 38.0, 49.0, 47.0, 61.0, 52.0, 42.0, 55.0, 45.0, 46.0, 45.0, 26.0, 23.0, 36.0, 25.0, 16.0, 20.0, 13.0, 3.0, 11.0, 8.0, 9.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-63.142215728759766, -61.37267303466797, -59.60313034057617, -57.833587646484375, -56.064048767089844, -54.29450225830078, -52.52496337890625, -50.75542068481445, -48.985877990722656, -47.21633529663086, -45.44679260253906, -43.677249908447266, -41.90770721435547, -40.13816833496094, -38.36862564086914, -36.599082946777344, -34.82954025268555, -33.05999755859375, -31.290454864501953, -29.52091407775879, -27.751371383666992, -25.981828689575195, -24.21228790283203, -22.442745208740234, -20.673202514648438, -18.90365982055664, -17.134117126464844, -15.36457633972168, -13.595033645629883, -11.825490951538086, -10.055949211120605, -8.286407470703125, -6.516864776611328, -4.7473225593566895, -2.977780342102051, -1.208238124847412, 0.5613040924072266, 2.3308467864990234, 4.100388526916504, 5.869930267333984, 7.639472961425781, 9.409015655517578, 11.178557395935059, 12.948099136352539, 14.717641830444336, 16.487184524536133, 18.256725311279297, 20.026268005371094, 21.79581069946289, 23.565353393554688, 25.334896087646484, 27.10443687438965, 28.873979568481445, 30.643522262573242, 32.413063049316406, 34.1826057434082, 35.9521484375, 37.7216911315918, 39.491233825683594, 41.26077651977539, 43.03031921386719, 44.79985809326172, 46.569400787353516, 48.33894348144531, 50.10848617553711]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 7.0, 8.0, 12.0, 16.0, 35.0, 57.0, 90.0, 139.0, 259.0, 482.0, 1113.0, 2927.0, 10357.0, 54134.0, 833698.0, 3109158.0, 153093.0, 20739.0, 4924.0, 1633.0, 665.0, 313.0, 179.0, 84.0, 55.0, 27.0, 23.0, 17.0, 8.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.64453125, -6.4317626953125, -6.218994140625, -6.0062255859375, -5.79345703125, -5.5806884765625, -5.367919921875, -5.1551513671875, -4.9423828125, -4.7296142578125, -4.516845703125, -4.3040771484375, -4.09130859375, -3.8785400390625, -3.665771484375, -3.4530029296875, -3.240234375, -3.0274658203125, -2.814697265625, -2.6019287109375, -2.38916015625, -2.1763916015625, -1.963623046875, -1.7508544921875, -1.5380859375, -1.3253173828125, -1.112548828125, -0.8997802734375, -0.68701171875, -0.4742431640625, -0.261474609375, -0.0487060546875, 0.1640625, 0.3768310546875, 0.589599609375, 0.8023681640625, 1.01513671875, 1.2279052734375, 1.440673828125, 1.6534423828125, 1.8662109375, 2.0789794921875, 2.291748046875, 2.5045166015625, 2.71728515625, 2.9300537109375, 3.142822265625, 3.3555908203125, 3.568359375, 3.7811279296875, 3.993896484375, 4.2066650390625, 4.41943359375, 4.6322021484375, 4.844970703125, 5.0577392578125, 5.2705078125, 5.4832763671875, 5.696044921875, 5.9088134765625, 6.12158203125, 6.3343505859375, 6.547119140625, 6.7598876953125, 6.97265625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 2.0, 8.0, 13.0, 13.0, 22.0, 34.0, 45.0, 52.0, 56.0, 56.0, 75.0, 76.0, 84.0, 92.0, 79.0, 67.0, 50.0, 42.0, 44.0, 29.0, 11.0, 20.0, 11.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.994140625, -3.874176025390625, -3.75421142578125, -3.634246826171875, -3.5142822265625, -3.394317626953125, -3.27435302734375, -3.154388427734375, -3.034423828125, -2.914459228515625, -2.79449462890625, -2.674530029296875, -2.5545654296875, -2.434600830078125, -2.31463623046875, -2.194671630859375, -2.07470703125, -1.954742431640625, -1.83477783203125, -1.714813232421875, -1.5948486328125, -1.474884033203125, -1.35491943359375, -1.234954833984375, -1.114990234375, -0.995025634765625, -0.87506103515625, -0.755096435546875, -0.6351318359375, -0.515167236328125, -0.39520263671875, -0.275238037109375, -0.1552734375, -0.035308837890625, 0.08465576171875, 0.204620361328125, 0.3245849609375, 0.444549560546875, 0.56451416015625, 0.684478759765625, 0.804443359375, 0.924407958984375, 1.04437255859375, 1.164337158203125, 1.2843017578125, 1.404266357421875, 1.52423095703125, 1.644195556640625, 1.76416015625, 1.884124755859375, 2.00408935546875, 2.124053955078125, 2.2440185546875, 2.363983154296875, 2.48394775390625, 2.603912353515625, 2.723876953125, 2.843841552734375, 2.96380615234375, 3.083770751953125, 3.2037353515625, 3.323699951171875, 3.44366455078125, 3.563629150390625, 3.68359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 8.0, 4.0, 6.0, 16.0, 22.0, 29.0, 48.0, 65.0, 146.0, 409.0, 1966.0, 15730.0, 557515.0, 3569467.0, 43748.0, 3921.0, 700.0, 206.0, 103.0, 49.0, 28.0, 22.0, 19.0, 13.0, 6.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-11.75, -11.347412109375, -10.94482421875, -10.542236328125, -10.1396484375, -9.737060546875, -9.33447265625, -8.931884765625, -8.529296875, -8.126708984375, -7.72412109375, -7.321533203125, -6.9189453125, -6.516357421875, -6.11376953125, -5.711181640625, -5.30859375, -4.906005859375, -4.50341796875, -4.100830078125, -3.6982421875, -3.295654296875, -2.89306640625, -2.490478515625, -2.087890625, -1.685302734375, -1.28271484375, -0.880126953125, -0.4775390625, -0.074951171875, 0.32763671875, 0.730224609375, 1.1328125, 1.535400390625, 1.93798828125, 2.340576171875, 2.7431640625, 3.145751953125, 3.54833984375, 3.950927734375, 4.353515625, 4.756103515625, 5.15869140625, 5.561279296875, 5.9638671875, 6.366455078125, 6.76904296875, 7.171630859375, 7.57421875, 7.976806640625, 8.37939453125, 8.781982421875, 9.1845703125, 9.587158203125, 9.98974609375, 10.392333984375, 10.794921875, 11.197509765625, 11.60009765625, 12.002685546875, 12.4052734375, 12.807861328125, 13.21044921875, 13.613037109375, 14.015625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 5.0, 4.0, 1.0, 3.0, 8.0, 7.0, 14.0, 13.0, 17.0, 25.0, 54.0, 58.0, 85.0, 159.0, 310.0, 523.0, 922.0, 800.0, 418.0, 240.0, 156.0, 85.0, 46.0, 33.0, 22.0, 13.0, 17.0, 6.0, 9.0, 2.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.8707275390625, -5.651611328125, -5.4324951171875, -5.21337890625, -4.9942626953125, -4.775146484375, -4.5560302734375, -4.3369140625, -4.1177978515625, -3.898681640625, -3.6795654296875, -3.46044921875, -3.2413330078125, -3.022216796875, -2.8031005859375, -2.583984375, -2.3648681640625, -2.145751953125, -1.9266357421875, -1.70751953125, -1.4884033203125, -1.269287109375, -1.0501708984375, -0.8310546875, -0.6119384765625, -0.392822265625, -0.1737060546875, 0.04541015625, 0.2645263671875, 0.483642578125, 0.7027587890625, 0.921875, 1.1409912109375, 1.360107421875, 1.5792236328125, 1.79833984375, 2.0174560546875, 2.236572265625, 2.4556884765625, 2.6748046875, 2.8939208984375, 3.113037109375, 3.3321533203125, 3.55126953125, 3.7703857421875, 3.989501953125, 4.2086181640625, 4.427734375, 4.6468505859375, 4.865966796875, 5.0850830078125, 5.30419921875, 5.5233154296875, 5.742431640625, 5.9615478515625, 6.1806640625, 6.3997802734375, 6.618896484375, 6.8380126953125, 7.05712890625, 7.2762451171875, 7.495361328125, 7.7144775390625, 7.93359375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 8.0, 18.0, 91.0, 268.0, 346.0, 178.0, 46.0, 21.0, 8.0, 11.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.11561584472656, -88.12002563476562, -84.12442779541016, -80.12883758544922, -76.13324737548828, -72.13764953613281, -68.14205932617188, -64.14646911621094, -60.15087890625, -56.1552848815918, -52.15969467163086, -48.164100646972656, -44.16851043701172, -40.172916412353516, -36.17732238769531, -32.181732177734375, -28.186138153076172, -24.1905460357666, -20.19495391845703, -16.199359893798828, -12.203768730163574, -8.208175659179688, -4.212583541870117, -0.21699142456054688, 3.7786006927490234, 7.774192810058594, 11.769784927368164, 15.76537799835205, 19.760971069335938, 23.756563186645508, 27.752155303955078, 31.74774742126465, 35.74333953857422, 39.73893356323242, 43.73452377319336, 47.73011779785156, 51.7257080078125, 55.7213020324707, 59.716896057128906, 63.712486267089844, 67.70807647705078, 71.70366668701172, 75.69926452636719, 79.69485473632812, 83.69044494628906, 87.68603515625, 91.68163299560547, 95.6772232055664, 99.67282104492188, 103.66841125488281, 107.66400909423828, 111.65959930419922, 115.65518951416016, 119.65078735351562, 123.64637756347656, 127.6419677734375, 131.63755798339844, 135.63314819335938, 139.6287384033203, 143.62432861328125, 147.61993408203125, 151.6155242919922, 155.61111450195312, 159.60670471191406, 163.602294921875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 3.0, 3.0, 7.0, 6.0, 11.0, 18.0, 11.0, 15.0, 23.0, 28.0, 29.0, 45.0, 33.0, 45.0, 48.0, 54.0, 55.0, 50.0, 55.0, 52.0, 56.0, 54.0, 43.0, 39.0, 35.0, 33.0, 26.0, 26.0, 14.0, 19.0, 14.0, 14.0, 7.0, 8.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.814090728759766, -33.72774124145508, -32.64139175415039, -31.55504035949707, -30.46868896484375, -29.382339477539062, -28.295989990234375, -27.209640502929688, -26.123289108276367, -25.03693962097168, -23.95058822631836, -22.864238739013672, -21.777889251708984, -20.691537857055664, -19.605188369750977, -18.518836975097656, -17.43248748779297, -16.34613800048828, -15.259786605834961, -14.173437118530273, -13.08708667755127, -12.000736236572266, -10.914386749267578, -9.828036308288574, -8.74168586730957, -7.655335426330566, -6.568985462188721, -5.482635498046875, -4.396285057067871, -3.309934616088867, -2.2235846519470215, -1.1372346878051758, -0.05088043212890625, 1.0354697704315186, 2.1218199729919434, 3.208170175552368, 4.294520378112793, 5.380870819091797, 6.467220783233643, 7.553570747375488, 8.639921188354492, 9.726271629333496, 10.8126220703125, 11.898971557617188, 12.985321998596191, 14.071672439575195, 15.158021926879883, 16.244373321533203, 17.33072280883789, 18.417072296142578, 19.5034236907959, 20.589773178100586, 21.676124572753906, 22.762474060058594, 23.84882354736328, 24.93517303466797, 26.02152442932129, 27.107873916625977, 28.194225311279297, 29.280574798583984, 30.366924285888672, 31.453275680541992, 32.53962707519531, 33.6259765625, 34.71232604980469]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 13.0, 13.0, 12.0, 26.0, 24.0, 47.0, 66.0, 87.0, 191.0, 364.0, 751.0, 1890.0, 5773.0, 23243.0, 134485.0, 677896.0, 165468.0, 27767.0, 6602.0, 2088.0, 813.0, 379.0, 219.0, 90.0, 70.0, 51.0, 37.0, 22.0, 15.0, 13.0, 9.0, 0.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.71875, -10.3790283203125, -10.039306640625, -9.6995849609375, -9.35986328125, -9.0201416015625, -8.680419921875, -8.3406982421875, -8.0009765625, -7.6612548828125, -7.321533203125, -6.9818115234375, -6.64208984375, -6.3023681640625, -5.962646484375, -5.6229248046875, -5.283203125, -4.9434814453125, -4.603759765625, -4.2640380859375, -3.92431640625, -3.5845947265625, -3.244873046875, -2.9051513671875, -2.5654296875, -2.2257080078125, -1.885986328125, -1.5462646484375, -1.20654296875, -0.8668212890625, -0.527099609375, -0.1873779296875, 0.15234375, 0.4920654296875, 0.831787109375, 1.1715087890625, 1.51123046875, 1.8509521484375, 2.190673828125, 2.5303955078125, 2.8701171875, 3.2098388671875, 3.549560546875, 3.8892822265625, 4.22900390625, 4.5687255859375, 4.908447265625, 5.2481689453125, 5.587890625, 5.9276123046875, 6.267333984375, 6.6070556640625, 6.94677734375, 7.2864990234375, 7.626220703125, 7.9659423828125, 8.3056640625, 8.6453857421875, 8.985107421875, 9.3248291015625, 9.66455078125, 10.0042724609375, 10.343994140625, 10.6837158203125, 11.0234375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 8.0, 5.0, 12.0, 16.0, 24.0, 29.0, 46.0, 49.0, 62.0, 73.0, 72.0, 82.0, 91.0, 91.0, 77.0, 56.0, 65.0, 44.0, 34.0, 20.0, 13.0, 13.0, 8.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.04296875, -4.910552978515625, -4.77813720703125, -4.645721435546875, -4.5133056640625, -4.380889892578125, -4.24847412109375, -4.116058349609375, -3.983642578125, -3.851226806640625, -3.71881103515625, -3.586395263671875, -3.4539794921875, -3.321563720703125, -3.18914794921875, -3.056732177734375, -2.92431640625, -2.791900634765625, -2.65948486328125, -2.527069091796875, -2.3946533203125, -2.262237548828125, -2.12982177734375, -1.997406005859375, -1.864990234375, -1.732574462890625, -1.60015869140625, -1.467742919921875, -1.3353271484375, -1.202911376953125, -1.07049560546875, -0.938079833984375, -0.8056640625, -0.673248291015625, -0.54083251953125, -0.408416748046875, -0.2760009765625, -0.143585205078125, -0.01116943359375, 0.121246337890625, 0.253662109375, 0.386077880859375, 0.51849365234375, 0.650909423828125, 0.7833251953125, 0.915740966796875, 1.04815673828125, 1.180572509765625, 1.31298828125, 1.445404052734375, 1.57781982421875, 1.710235595703125, 1.8426513671875, 1.975067138671875, 2.10748291015625, 2.239898681640625, 2.372314453125, 2.504730224609375, 2.63714599609375, 2.769561767578125, 2.9019775390625, 3.034393310546875, 3.16680908203125, 3.299224853515625, 3.431640625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 4.0, 8.0, 11.0, 17.0, 14.0, 25.0, 39.0, 72.0, 113.0, 147.0, 314.0, 682.0, 1975.0, 10567.0, 795646.0, 229221.0, 6901.0, 1505.0, 543.0, 301.0, 155.0, 89.0, 61.0, 51.0, 29.0, 15.0, 14.0, 8.0, 2.0, 5.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.3125, -33.23681640625, -32.1611328125, -31.08544921875, -30.009765625, -28.93408203125, -27.8583984375, -26.78271484375, -25.70703125, -24.63134765625, -23.5556640625, -22.47998046875, -21.404296875, -20.32861328125, -19.2529296875, -18.17724609375, -17.1015625, -16.02587890625, -14.9501953125, -13.87451171875, -12.798828125, -11.72314453125, -10.6474609375, -9.57177734375, -8.49609375, -7.42041015625, -6.3447265625, -5.26904296875, -4.193359375, -3.11767578125, -2.0419921875, -0.96630859375, 0.109375, 1.18505859375, 2.2607421875, 3.33642578125, 4.412109375, 5.48779296875, 6.5634765625, 7.63916015625, 8.71484375, 9.79052734375, 10.8662109375, 11.94189453125, 13.017578125, 14.09326171875, 15.1689453125, 16.24462890625, 17.3203125, 18.39599609375, 19.4716796875, 20.54736328125, 21.623046875, 22.69873046875, 23.7744140625, 24.85009765625, 25.92578125, 27.00146484375, 28.0771484375, 29.15283203125, 30.228515625, 31.30419921875, 32.3798828125, 33.45556640625, 34.53125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 5.0, 10.0, 17.0, 20.0, 26.0, 35.0, 65.0, 59.0, 74.0, 99.0, 115.0, 108.0, 99.0, 64.0, 54.0, 30.0, 33.0, 24.0, 16.0, 10.0, 5.0, 4.0, 5.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.28125, -21.40966796875, -20.5380859375, -19.66650390625, -18.794921875, -17.92333984375, -17.0517578125, -16.18017578125, -15.30859375, -14.43701171875, -13.5654296875, -12.69384765625, -11.822265625, -10.95068359375, -10.0791015625, -9.20751953125, -8.3359375, -7.46435546875, -6.5927734375, -5.72119140625, -4.849609375, -3.97802734375, -3.1064453125, -2.23486328125, -1.36328125, -0.49169921875, 0.3798828125, 1.25146484375, 2.123046875, 2.99462890625, 3.8662109375, 4.73779296875, 5.609375, 6.48095703125, 7.3525390625, 8.22412109375, 9.095703125, 9.96728515625, 10.8388671875, 11.71044921875, 12.58203125, 13.45361328125, 14.3251953125, 15.19677734375, 16.068359375, 16.93994140625, 17.8115234375, 18.68310546875, 19.5546875, 20.42626953125, 21.2978515625, 22.16943359375, 23.041015625, 23.91259765625, 24.7841796875, 25.65576171875, 26.52734375, 27.39892578125, 28.2705078125, 29.14208984375, 30.013671875, 30.88525390625, 31.7568359375, 32.62841796875, 33.5]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 4.0, 11.0, 14.0, 18.0, 36.0, 51.0, 72.0, 101.0, 194.0, 362.0, 757.0, 2588.0, 16349.0, 696351.0, 315645.0, 12200.0, 2247.0, 723.0, 307.0, 185.0, 100.0, 59.0, 37.0, 31.0, 24.0, 16.0, 15.0, 5.0, 7.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-11.7578125, -11.4212646484375, -11.084716796875, -10.7481689453125, -10.41162109375, -10.0750732421875, -9.738525390625, -9.4019775390625, -9.0654296875, -8.7288818359375, -8.392333984375, -8.0557861328125, -7.71923828125, -7.3826904296875, -7.046142578125, -6.7095947265625, -6.373046875, -6.0364990234375, -5.699951171875, -5.3634033203125, -5.02685546875, -4.6903076171875, -4.353759765625, -4.0172119140625, -3.6806640625, -3.3441162109375, -3.007568359375, -2.6710205078125, -2.33447265625, -1.9979248046875, -1.661376953125, -1.3248291015625, -0.98828125, -0.6517333984375, -0.315185546875, 0.0213623046875, 0.35791015625, 0.6944580078125, 1.031005859375, 1.3675537109375, 1.7041015625, 2.0406494140625, 2.377197265625, 2.7137451171875, 3.05029296875, 3.3868408203125, 3.723388671875, 4.0599365234375, 4.396484375, 4.7330322265625, 5.069580078125, 5.4061279296875, 5.74267578125, 6.0792236328125, 6.415771484375, 6.7523193359375, 7.0888671875, 7.4254150390625, 7.761962890625, 8.0985107421875, 8.43505859375, 8.7716064453125, 9.108154296875, 9.4447021484375, 9.78125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 12.0, 8.0, 3.0, 17.0, 20.0, 23.0, 34.0, 30.0, 55.0, 73.0, 147.0, 215.0, 108.0, 64.0, 31.0, 32.0, 27.0, 14.0, 13.0, 16.0, 11.0, 4.0, 15.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001430511474609375, -0.001392170786857605, -0.001353830099105835, -0.001315489411354065, -0.001277148723602295, -0.001238808035850525, -0.0012004673480987549, -0.0011621266603469849, -0.0011237859725952148, -0.0010854452848434448, -0.0010471045970916748, -0.0010087639093399048, -0.0009704232215881348, -0.0009320825338363647, -0.0008937418460845947, -0.0008554011583328247, -0.0008170604705810547, -0.0007787197828292847, -0.0007403790950775146, -0.0007020384073257446, -0.0006636977195739746, -0.0006253570318222046, -0.0005870163440704346, -0.0005486756563186646, -0.0005103349685668945, -0.0004719942808151245, -0.0004336535930633545, -0.00039531290531158447, -0.00035697221755981445, -0.00031863152980804443, -0.0002802908420562744, -0.0002419501543045044, -0.00020360946655273438, -0.00016526877880096436, -0.00012692809104919434, -8.858740329742432e-05, -5.02467155456543e-05, -1.1906027793884277e-05, 2.6434659957885742e-05, 6.477534770965576e-05, 0.00010311603546142578, 0.0001414567232131958, 0.00017979741096496582, 0.00021813809871673584, 0.00025647878646850586, 0.0002948194742202759, 0.0003331601619720459, 0.0003715008497238159, 0.00040984153747558594, 0.00044818222522735596, 0.000486522912979126, 0.000524863600730896, 0.000563204288482666, 0.000601544976234436, 0.0006398856639862061, 0.0006782263517379761, 0.0007165670394897461, 0.0007549077272415161, 0.0007932484149932861, 0.0008315891027450562, 0.0008699297904968262, 0.0009082704782485962, 0.0009466111660003662, 0.0009849518537521362, 0.0010232925415039062]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 8.0, 11.0, 17.0, 24.0, 20.0, 22.0, 29.0, 41.0, 73.0, 87.0, 164.0, 262.0, 489.0, 937.0, 2388.0, 7707.0, 43829.0, 872827.0, 101647.0, 12018.0, 3220.0, 1293.0, 581.0, 310.0, 189.0, 91.0, 61.0, 47.0, 38.0, 27.0, 17.0, 17.0, 18.0, 5.0, 6.0, 6.0, 5.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.625, -9.3389892578125, -9.052978515625, -8.7669677734375, -8.48095703125, -8.1949462890625, -7.908935546875, -7.6229248046875, -7.3369140625, -7.0509033203125, -6.764892578125, -6.4788818359375, -6.19287109375, -5.9068603515625, -5.620849609375, -5.3348388671875, -5.048828125, -4.7628173828125, -4.476806640625, -4.1907958984375, -3.90478515625, -3.6187744140625, -3.332763671875, -3.0467529296875, -2.7607421875, -2.4747314453125, -2.188720703125, -1.9027099609375, -1.61669921875, -1.3306884765625, -1.044677734375, -0.7586669921875, -0.47265625, -0.1866455078125, 0.099365234375, 0.3853759765625, 0.67138671875, 0.9573974609375, 1.243408203125, 1.5294189453125, 1.8154296875, 2.1014404296875, 2.387451171875, 2.6734619140625, 2.95947265625, 3.2454833984375, 3.531494140625, 3.8175048828125, 4.103515625, 4.3895263671875, 4.675537109375, 4.9615478515625, 5.24755859375, 5.5335693359375, 5.819580078125, 6.1055908203125, 6.3916015625, 6.6776123046875, 6.963623046875, 7.2496337890625, 7.53564453125, 7.8216552734375, 8.107666015625, 8.3936767578125, 8.6796875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 4.0, 5.0, 4.0, 4.0, 5.0, 7.0, 11.0, 15.0, 31.0, 38.0, 68.0, 89.0, 113.0, 166.0, 126.0, 93.0, 61.0, 53.0, 33.0, 11.0, 14.0, 7.0, 3.0, 7.0, 5.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.41796875, -7.19671630859375, -6.9754638671875, -6.75421142578125, -6.532958984375, -6.31170654296875, -6.0904541015625, -5.86920166015625, -5.64794921875, -5.42669677734375, -5.2054443359375, -4.98419189453125, -4.762939453125, -4.54168701171875, -4.3204345703125, -4.09918212890625, -3.8779296875, -3.65667724609375, -3.4354248046875, -3.21417236328125, -2.992919921875, -2.77166748046875, -2.5504150390625, -2.32916259765625, -2.10791015625, -1.88665771484375, -1.6654052734375, -1.44415283203125, -1.222900390625, -1.00164794921875, -0.7803955078125, -0.55914306640625, -0.337890625, -0.11663818359375, 0.1046142578125, 0.32586669921875, 0.547119140625, 0.76837158203125, 0.9896240234375, 1.21087646484375, 1.43212890625, 1.65338134765625, 1.8746337890625, 2.09588623046875, 2.317138671875, 2.53839111328125, 2.7596435546875, 2.98089599609375, 3.2021484375, 3.42340087890625, 3.6446533203125, 3.86590576171875, 4.087158203125, 4.30841064453125, 4.5296630859375, 4.75091552734375, 4.97216796875, 5.19342041015625, 5.4146728515625, 5.63592529296875, 5.857177734375, 6.07843017578125, 6.2996826171875, 6.52093505859375, 6.7421875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 20.0, 43.0, 134.0, 257.0, 274.0, 159.0, 61.0, 16.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.55878448486328, -115.14765930175781, -110.73652648925781, -106.32540130615234, -101.91427612304688, -97.50314331054688, -93.0920181274414, -88.68089294433594, -84.26976013183594, -79.85863494873047, -75.44750213623047, -71.036376953125, -66.625244140625, -62.21411895751953, -57.80299377441406, -53.39186477661133, -48.980735778808594, -44.56960678100586, -40.158477783203125, -35.747352600097656, -31.336223602294922, -26.925094604492188, -22.513967514038086, -18.102840423583984, -13.69171142578125, -9.280583381652832, -4.869455337524414, -0.4583272933959961, 3.952800750732422, 8.363929748535156, 12.775056838989258, 17.18618392944336, 21.597305297851562, 26.008434295654297, 30.4195613861084, 34.8306884765625, 39.241817474365234, 43.65294647216797, 48.06407165527344, 52.47520065307617, 56.886329650878906, 61.29745864868164, 65.70858764648438, 70.11971282958984, 74.53083801269531, 78.94197082519531, 83.35309600830078, 87.76422119140625, 92.17535400390625, 96.58647918701172, 100.99761199951172, 105.40873718261719, 109.81986999511719, 114.23099517822266, 118.64212036132812, 123.05325317382812, 127.4643783569336, 131.87550354003906, 136.28663635253906, 140.69776916503906, 145.10888671875, 149.52001953125, 153.93115234375, 158.34226989746094, 162.75340270996094]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 6.0, 12.0, 17.0, 18.0, 13.0, 15.0, 22.0, 31.0, 37.0, 26.0, 28.0, 39.0, 41.0, 45.0, 46.0, 54.0, 45.0, 63.0, 59.0, 44.0, 31.0, 44.0, 32.0, 32.0, 24.0, 26.0, 22.0, 20.0, 19.0, 11.0, 14.0, 11.0, 8.0, 6.0, 7.0, 6.0, 1.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.614585876464844, -48.00837707519531, -46.40216827392578, -44.795963287353516, -43.189754486083984, -41.58354568481445, -39.97734069824219, -38.371131896972656, -36.764923095703125, -35.158714294433594, -33.55250549316406, -31.946300506591797, -30.340091705322266, -28.733882904052734, -27.127676010131836, -25.521469116210938, -23.915260314941406, -22.309051513671875, -20.702844619750977, -19.096637725830078, -17.490428924560547, -15.884221076965332, -14.278013229370117, -12.671805381774902, -11.065597534179688, -9.459389686584473, -7.853181838989258, -6.246973991394043, -4.640766143798828, -3.0345582962036133, -1.4283504486083984, 0.1778573989868164, 1.7840614318847656, 3.3902692794799805, 4.996477127075195, 6.60268497467041, 8.208892822265625, 9.81510066986084, 11.421308517456055, 13.02751636505127, 14.633724212646484, 16.239933013916016, 17.846139907836914, 19.452346801757812, 21.058555603027344, 22.664764404296875, 24.270971298217773, 25.877178192138672, 27.483386993408203, 29.089595794677734, 30.695802688598633, 32.30200958251953, 33.90821838378906, 35.514427185058594, 37.120635986328125, 38.72684097290039, 40.33304977416992, 41.93925857543945, 43.54546356201172, 45.15167236328125, 46.75788116455078, 48.36408996582031, 49.970298767089844, 51.57650375366211, 53.18271255493164]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 9.0, 6.0, 5.0, 8.0, 17.0, 20.0, 24.0, 42.0, 55.0, 111.0, 166.0, 339.0, 769.0, 3438.0, 66978.0, 4064155.0, 53953.0, 2872.0, 618.0, 269.0, 145.0, 91.0, 67.0, 46.0, 26.0, 16.0, 8.0, 9.0, 8.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6875, -14.171630859375, -13.65576171875, -13.139892578125, -12.6240234375, -12.108154296875, -11.59228515625, -11.076416015625, -10.560546875, -10.044677734375, -9.52880859375, -9.012939453125, -8.4970703125, -7.981201171875, -7.46533203125, -6.949462890625, -6.43359375, -5.917724609375, -5.40185546875, -4.885986328125, -4.3701171875, -3.854248046875, -3.33837890625, -2.822509765625, -2.306640625, -1.790771484375, -1.27490234375, -0.759033203125, -0.2431640625, 0.272705078125, 0.78857421875, 1.304443359375, 1.8203125, 2.336181640625, 2.85205078125, 3.367919921875, 3.8837890625, 4.399658203125, 4.91552734375, 5.431396484375, 5.947265625, 6.463134765625, 6.97900390625, 7.494873046875, 8.0107421875, 8.526611328125, 9.04248046875, 9.558349609375, 10.07421875, 10.590087890625, 11.10595703125, 11.621826171875, 12.1376953125, 12.653564453125, 13.16943359375, 13.685302734375, 14.201171875, 14.717041015625, 15.23291015625, 15.748779296875, 16.2646484375, 16.780517578125, 17.29638671875, 17.812255859375, 18.328125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 13.0, 16.0, 22.0, 39.0, 63.0, 67.0, 91.0, 96.0, 98.0, 95.0, 94.0, 91.0, 81.0, 41.0, 42.0, 20.0, 20.0, 7.0, 4.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1484375, -4.9818115234375, -4.815185546875, -4.6485595703125, -4.48193359375, -4.3153076171875, -4.148681640625, -3.9820556640625, -3.8154296875, -3.6488037109375, -3.482177734375, -3.3155517578125, -3.14892578125, -2.9822998046875, -2.815673828125, -2.6490478515625, -2.482421875, -2.3157958984375, -2.149169921875, -1.9825439453125, -1.81591796875, -1.6492919921875, -1.482666015625, -1.3160400390625, -1.1494140625, -0.9827880859375, -0.816162109375, -0.6495361328125, -0.48291015625, -0.3162841796875, -0.149658203125, 0.0169677734375, 0.18359375, 0.3502197265625, 0.516845703125, 0.6834716796875, 0.85009765625, 1.0167236328125, 1.183349609375, 1.3499755859375, 1.5166015625, 1.6832275390625, 1.849853515625, 2.0164794921875, 2.18310546875, 2.3497314453125, 2.516357421875, 2.6829833984375, 2.849609375, 3.0162353515625, 3.182861328125, 3.3494873046875, 3.51611328125, 3.6827392578125, 3.849365234375, 4.0159912109375, 4.1826171875, 4.3492431640625, 4.515869140625, 4.6824951171875, 4.84912109375, 5.0157470703125, 5.182373046875, 5.3489990234375, 5.515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 11.0, 8.0, 10.0, 32.0, 60.0, 113.0, 282.0, 1056.0, 5905.0, 68094.0, 3743887.0, 357624.0, 14348.0, 2008.0, 457.0, 177.0, 96.0, 47.0, 26.0, 20.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.078125, -10.663330078125, -10.24853515625, -9.833740234375, -9.4189453125, -9.004150390625, -8.58935546875, -8.174560546875, -7.759765625, -7.344970703125, -6.93017578125, -6.515380859375, -6.1005859375, -5.685791015625, -5.27099609375, -4.856201171875, -4.44140625, -4.026611328125, -3.61181640625, -3.197021484375, -2.7822265625, -2.367431640625, -1.95263671875, -1.537841796875, -1.123046875, -0.708251953125, -0.29345703125, 0.121337890625, 0.5361328125, 0.950927734375, 1.36572265625, 1.780517578125, 2.1953125, 2.610107421875, 3.02490234375, 3.439697265625, 3.8544921875, 4.269287109375, 4.68408203125, 5.098876953125, 5.513671875, 5.928466796875, 6.34326171875, 6.758056640625, 7.1728515625, 7.587646484375, 8.00244140625, 8.417236328125, 8.83203125, 9.246826171875, 9.66162109375, 10.076416015625, 10.4912109375, 10.906005859375, 11.32080078125, 11.735595703125, 12.150390625, 12.565185546875, 12.97998046875, 13.394775390625, 13.8095703125, 14.224365234375, 14.63916015625, 15.053955078125, 15.46875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 8.0, 11.0, 11.0, 19.0, 21.0, 26.0, 37.0, 85.0, 107.0, 205.0, 377.0, 694.0, 875.0, 653.0, 381.0, 223.0, 112.0, 49.0, 49.0, 43.0, 24.0, 20.0, 6.0, 9.0, 5.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.4609375, -7.23126220703125, -7.0015869140625, -6.77191162109375, -6.542236328125, -6.31256103515625, -6.0828857421875, -5.85321044921875, -5.62353515625, -5.39385986328125, -5.1641845703125, -4.93450927734375, -4.704833984375, -4.47515869140625, -4.2454833984375, -4.01580810546875, -3.7861328125, -3.55645751953125, -3.3267822265625, -3.09710693359375, -2.867431640625, -2.63775634765625, -2.4080810546875, -2.17840576171875, -1.94873046875, -1.71905517578125, -1.4893798828125, -1.25970458984375, -1.030029296875, -0.80035400390625, -0.5706787109375, -0.34100341796875, -0.111328125, 0.11834716796875, 0.3480224609375, 0.57769775390625, 0.807373046875, 1.03704833984375, 1.2667236328125, 1.49639892578125, 1.72607421875, 1.95574951171875, 2.1854248046875, 2.41510009765625, 2.644775390625, 2.87445068359375, 3.1041259765625, 3.33380126953125, 3.5634765625, 3.79315185546875, 4.0228271484375, 4.25250244140625, 4.482177734375, 4.71185302734375, 4.9415283203125, 5.17120361328125, 5.40087890625, 5.63055419921875, 5.8602294921875, 6.08990478515625, 6.319580078125, 6.54925537109375, 6.7789306640625, 7.00860595703125, 7.23828125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 11.0, 29.0, 63.0, 198.0, 285.0, 239.0, 91.0, 44.0, 13.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.26390075683594, -42.34092712402344, -39.41795349121094, -36.49497985839844, -33.57200622558594, -30.649032592773438, -27.72606086730957, -24.80308723449707, -21.88011360168457, -18.95713996887207, -16.03416633605957, -13.111193656921387, -10.188220024108887, -7.265246391296387, -4.342273712158203, -1.4193000793457031, 1.5036735534667969, 4.426647186279297, 7.349620342254639, 10.27259349822998, 13.19556713104248, 16.118541717529297, 19.041513442993164, 21.964487075805664, 24.887460708618164, 27.810434341430664, 30.733407974243164, 33.65637969970703, 36.57935333251953, 39.50232696533203, 42.42530059814453, 45.34827423095703, 48.27124786376953, 51.19422149658203, 54.11719512939453, 57.04016876220703, 59.96314239501953, 62.88611602783203, 65.80908966064453, 68.73206329345703, 71.65503692626953, 74.57801055908203, 77.50098419189453, 80.42395782470703, 83.34693145751953, 86.26990509033203, 89.19287872314453, 92.11585235595703, 95.038818359375, 97.9617919921875, 100.884765625, 103.8077392578125, 106.730712890625, 109.6536865234375, 112.57666015625, 115.4996337890625, 118.422607421875, 121.3455810546875, 124.2685546875, 127.1915283203125, 130.114501953125, 133.0374755859375, 135.96044921875, 138.8834228515625, 141.806396484375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 8.0, 4.0, 10.0, 14.0, 21.0, 28.0, 15.0, 30.0, 34.0, 31.0, 39.0, 42.0, 53.0, 43.0, 47.0, 57.0, 65.0, 53.0, 53.0, 53.0, 42.0, 39.0, 29.0, 34.0, 32.0, 27.0, 18.0, 16.0, 14.0, 13.0, 4.0, 7.0, 6.0, 9.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.59016418457031, -33.624176025390625, -32.65818786621094, -31.692201614379883, -30.726213455200195, -29.76022720336914, -28.794239044189453, -27.828250885009766, -26.862262725830078, -25.89627456665039, -24.930288314819336, -23.96430015563965, -22.99831199645996, -22.032325744628906, -21.06633758544922, -20.10034942626953, -19.134363174438477, -18.16837501525879, -17.202388763427734, -16.236400604248047, -15.27041244506836, -14.304425239562988, -13.338438034057617, -12.37244987487793, -11.406462669372559, -10.440475463867188, -9.4744873046875, -8.508500099182129, -7.5425124168396, -6.57652473449707, -5.610537528991699, -4.64454984664917, -3.6785621643066406, -2.7125744819641113, -1.7465870380401611, -0.7805995941162109, 0.18538808822631836, 1.1513757705688477, 2.1173629760742188, 3.083350658416748, 4.049338340759277, 5.015326023101807, 5.981313705444336, 6.947300910949707, 7.913288593292236, 8.879276275634766, 9.845263481140137, 10.811250686645508, 11.777238845825195, 12.743226051330566, 13.709214210510254, 14.675201416015625, 15.641189575195312, 16.607177734375, 17.573163986206055, 18.539152145385742, 19.505138397216797, 20.471126556396484, 21.43711280822754, 22.403100967407227, 23.369089126586914, 24.33507537841797, 25.301063537597656, 26.267051696777344, 27.23303985595703]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 13.0, 13.0, 25.0, 25.0, 34.0, 74.0, 106.0, 198.0, 335.0, 680.0, 1764.0, 5657.0, 23538.0, 156728.0, 710792.0, 121356.0, 19346.0, 4847.0, 1549.0, 655.0, 315.0, 186.0, 100.0, 70.0, 39.0, 34.0, 13.0, 16.0, 10.0, 6.0, 5.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5625, -10.2265625, -9.890625, -9.5546875, -9.21875, -8.8828125, -8.546875, -8.2109375, -7.875, -7.5390625, -7.203125, -6.8671875, -6.53125, -6.1953125, -5.859375, -5.5234375, -5.1875, -4.8515625, -4.515625, -4.1796875, -3.84375, -3.5078125, -3.171875, -2.8359375, -2.5, -2.1640625, -1.828125, -1.4921875, -1.15625, -0.8203125, -0.484375, -0.1484375, 0.1875, 0.5234375, 0.859375, 1.1953125, 1.53125, 1.8671875, 2.203125, 2.5390625, 2.875, 3.2109375, 3.546875, 3.8828125, 4.21875, 4.5546875, 4.890625, 5.2265625, 5.5625, 5.8984375, 6.234375, 6.5703125, 6.90625, 7.2421875, 7.578125, 7.9140625, 8.25, 8.5859375, 8.921875, 9.2578125, 9.59375, 9.9296875, 10.265625, 10.6015625, 10.9375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 11.0, 13.0, 31.0, 48.0, 51.0, 82.0, 101.0, 99.0, 100.0, 99.0, 101.0, 74.0, 65.0, 48.0, 27.0, 13.0, 17.0, 9.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3203125, -5.14617919921875, -4.9720458984375, -4.79791259765625, -4.623779296875, -4.44964599609375, -4.2755126953125, -4.10137939453125, -3.92724609375, -3.75311279296875, -3.5789794921875, -3.40484619140625, -3.230712890625, -3.05657958984375, -2.8824462890625, -2.70831298828125, -2.5341796875, -2.36004638671875, -2.1859130859375, -2.01177978515625, -1.837646484375, -1.66351318359375, -1.4893798828125, -1.31524658203125, -1.14111328125, -0.96697998046875, -0.7928466796875, -0.61871337890625, -0.444580078125, -0.27044677734375, -0.0963134765625, 0.07781982421875, 0.251953125, 0.42608642578125, 0.6002197265625, 0.77435302734375, 0.948486328125, 1.12261962890625, 1.2967529296875, 1.47088623046875, 1.64501953125, 1.81915283203125, 1.9932861328125, 2.16741943359375, 2.341552734375, 2.51568603515625, 2.6898193359375, 2.86395263671875, 3.0380859375, 3.21221923828125, 3.3863525390625, 3.56048583984375, 3.734619140625, 3.90875244140625, 4.0828857421875, 4.25701904296875, 4.43115234375, 4.60528564453125, 4.7794189453125, 4.95355224609375, 5.127685546875, 5.30181884765625, 5.4759521484375, 5.65008544921875, 5.82421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 5.0, 12.0, 10.0, 26.0, 36.0, 70.0, 121.0, 222.0, 547.0, 1639.0, 7500.0, 255366.0, 768439.0, 11240.0, 2090.0, 642.0, 282.0, 115.0, 67.0, 42.0, 21.0, 16.0, 14.0, 12.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.984375, -28.021240234375, -27.05810546875, -26.094970703125, -25.1318359375, -24.168701171875, -23.20556640625, -22.242431640625, -21.279296875, -20.316162109375, -19.35302734375, -18.389892578125, -17.4267578125, -16.463623046875, -15.50048828125, -14.537353515625, -13.57421875, -12.611083984375, -11.64794921875, -10.684814453125, -9.7216796875, -8.758544921875, -7.79541015625, -6.832275390625, -5.869140625, -4.906005859375, -3.94287109375, -2.979736328125, -2.0166015625, -1.053466796875, -0.09033203125, 0.872802734375, 1.8359375, 2.799072265625, 3.76220703125, 4.725341796875, 5.6884765625, 6.651611328125, 7.61474609375, 8.577880859375, 9.541015625, 10.504150390625, 11.46728515625, 12.430419921875, 13.3935546875, 14.356689453125, 15.31982421875, 16.282958984375, 17.24609375, 18.209228515625, 19.17236328125, 20.135498046875, 21.0986328125, 22.061767578125, 23.02490234375, 23.988037109375, 24.951171875, 25.914306640625, 26.87744140625, 27.840576171875, 28.8037109375, 29.766845703125, 30.72998046875, 31.693115234375, 32.65625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 3.0, 4.0, 4.0, 7.0, 7.0, 9.0, 22.0, 23.0, 33.0, 46.0, 55.0, 59.0, 89.0, 100.0, 85.0, 95.0, 86.0, 79.0, 41.0, 40.0, 38.0, 17.0, 17.0, 13.0, 10.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-24.109375, -23.426025390625, -22.74267578125, -22.059326171875, -21.3759765625, -20.692626953125, -20.00927734375, -19.325927734375, -18.642578125, -17.959228515625, -17.27587890625, -16.592529296875, -15.9091796875, -15.225830078125, -14.54248046875, -13.859130859375, -13.17578125, -12.492431640625, -11.80908203125, -11.125732421875, -10.4423828125, -9.759033203125, -9.07568359375, -8.392333984375, -7.708984375, -7.025634765625, -6.34228515625, -5.658935546875, -4.9755859375, -4.292236328125, -3.60888671875, -2.925537109375, -2.2421875, -1.558837890625, -0.87548828125, -0.192138671875, 0.4912109375, 1.174560546875, 1.85791015625, 2.541259765625, 3.224609375, 3.907958984375, 4.59130859375, 5.274658203125, 5.9580078125, 6.641357421875, 7.32470703125, 8.008056640625, 8.69140625, 9.374755859375, 10.05810546875, 10.741455078125, 11.4248046875, 12.108154296875, 12.79150390625, 13.474853515625, 14.158203125, 14.841552734375, 15.52490234375, 16.208251953125, 16.8916015625, 17.574951171875, 18.25830078125, 18.941650390625, 19.625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 9.0, 8.0, 14.0, 20.0, 25.0, 32.0, 92.0, 127.0, 297.0, 816.0, 3150.0, 40405.0, 979876.0, 20156.0, 2265.0, 657.0, 257.0, 147.0, 68.0, 41.0, 20.0, 17.0, 13.0, 12.0, 4.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.5, -17.9918212890625, -17.483642578125, -16.9754638671875, -16.46728515625, -15.9591064453125, -15.450927734375, -14.9427490234375, -14.4345703125, -13.9263916015625, -13.418212890625, -12.9100341796875, -12.40185546875, -11.8936767578125, -11.385498046875, -10.8773193359375, -10.369140625, -9.8609619140625, -9.352783203125, -8.8446044921875, -8.33642578125, -7.8282470703125, -7.320068359375, -6.8118896484375, -6.3037109375, -5.7955322265625, -5.287353515625, -4.7791748046875, -4.27099609375, -3.7628173828125, -3.254638671875, -2.7464599609375, -2.23828125, -1.7301025390625, -1.221923828125, -0.7137451171875, -0.20556640625, 0.3026123046875, 0.810791015625, 1.3189697265625, 1.8271484375, 2.3353271484375, 2.843505859375, 3.3516845703125, 3.85986328125, 4.3680419921875, 4.876220703125, 5.3843994140625, 5.892578125, 6.4007568359375, 6.908935546875, 7.4171142578125, 7.92529296875, 8.4334716796875, 8.941650390625, 9.4498291015625, 9.9580078125, 10.4661865234375, 10.974365234375, 11.4825439453125, 11.99072265625, 12.4989013671875, 13.007080078125, 13.5152587890625, 14.0234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 5.0, 6.0, 15.0, 13.0, 21.0, 20.0, 34.0, 25.0, 54.0, 80.0, 123.0, 157.0, 145.0, 80.0, 64.0, 37.0, 27.0, 22.0, 17.0, 13.0, 3.0, 4.0, 3.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0012674331665039062, -0.001233808696269989, -0.0012001842260360718, -0.0011665597558021545, -0.0011329352855682373, -0.00109931081533432, -0.0010656863451004028, -0.0010320618748664856, -0.0009984374046325684, -0.0009648129343986511, -0.0009311884641647339, -0.0008975639939308167, -0.0008639395236968994, -0.0008303150534629822, -0.0007966905832290649, -0.0007630661129951477, -0.0007294416427612305, -0.0006958171725273132, -0.000662192702293396, -0.0006285682320594788, -0.0005949437618255615, -0.0005613192915916443, -0.000527694821357727, -0.0004940703511238098, -0.0004604458808898926, -0.00042682141065597534, -0.0003931969404220581, -0.00035957247018814087, -0.00032594799995422363, -0.0002923235297203064, -0.00025869905948638916, -0.00022507458925247192, -0.0001914501190185547, -0.00015782564878463745, -0.00012420117855072021, -9.057670831680298e-05, -5.695223808288574e-05, -2.3327767848968506e-05, 1.029670238494873e-05, 4.392117261886597e-05, 7.75456428527832e-05, 0.00011117011308670044, 0.00014479458332061768, 0.0001784190535545349, 0.00021204352378845215, 0.0002456679940223694, 0.0002792924642562866, 0.00031291693449020386, 0.0003465414047241211, 0.00038016587495803833, 0.00041379034519195557, 0.0004474148154258728, 0.00048103928565979004, 0.0005146637558937073, 0.0005482882261276245, 0.0005819126963615417, 0.000615537166595459, 0.0006491616368293762, 0.0006827861070632935, 0.0007164105772972107, 0.0007500350475311279, 0.0007836595177650452, 0.0008172839879989624, 0.0008509084582328796, 0.0008845329284667969]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 5.0, 7.0, 9.0, 14.0, 20.0, 28.0, 34.0, 63.0, 94.0, 136.0, 300.0, 558.0, 1302.0, 3815.0, 12171.0, 81755.0, 854895.0, 75364.0, 11866.0, 3566.0, 1271.0, 552.0, 271.0, 148.0, 95.0, 64.0, 46.0, 25.0, 18.0, 19.0, 11.0, 7.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.64453125, -6.40277099609375, -6.1610107421875, -5.91925048828125, -5.677490234375, -5.43572998046875, -5.1939697265625, -4.95220947265625, -4.71044921875, -4.46868896484375, -4.2269287109375, -3.98516845703125, -3.743408203125, -3.50164794921875, -3.2598876953125, -3.01812744140625, -2.7763671875, -2.53460693359375, -2.2928466796875, -2.05108642578125, -1.809326171875, -1.56756591796875, -1.3258056640625, -1.08404541015625, -0.84228515625, -0.60052490234375, -0.3587646484375, -0.11700439453125, 0.124755859375, 0.36651611328125, 0.6082763671875, 0.85003662109375, 1.091796875, 1.33355712890625, 1.5753173828125, 1.81707763671875, 2.058837890625, 2.30059814453125, 2.5423583984375, 2.78411865234375, 3.02587890625, 3.26763916015625, 3.5093994140625, 3.75115966796875, 3.992919921875, 4.23468017578125, 4.4764404296875, 4.71820068359375, 4.9599609375, 5.20172119140625, 5.4434814453125, 5.68524169921875, 5.927001953125, 6.16876220703125, 6.4105224609375, 6.65228271484375, 6.89404296875, 7.13580322265625, 7.3775634765625, 7.61932373046875, 7.861083984375, 8.10284423828125, 8.3446044921875, 8.58636474609375, 8.828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 8.0, 1.0, 1.0, 6.0, 9.0, 11.0, 16.0, 28.0, 35.0, 69.0, 88.0, 129.0, 149.0, 129.0, 105.0, 78.0, 45.0, 30.0, 15.0, 6.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9609375, -5.75848388671875, -5.5560302734375, -5.35357666015625, -5.151123046875, -4.94866943359375, -4.7462158203125, -4.54376220703125, -4.34130859375, -4.13885498046875, -3.9364013671875, -3.73394775390625, -3.531494140625, -3.32904052734375, -3.1265869140625, -2.92413330078125, -2.7216796875, -2.51922607421875, -2.3167724609375, -2.11431884765625, -1.911865234375, -1.70941162109375, -1.5069580078125, -1.30450439453125, -1.10205078125, -0.89959716796875, -0.6971435546875, -0.49468994140625, -0.292236328125, -0.08978271484375, 0.1126708984375, 0.31512451171875, 0.517578125, 0.72003173828125, 0.9224853515625, 1.12493896484375, 1.327392578125, 1.52984619140625, 1.7322998046875, 1.93475341796875, 2.13720703125, 2.33966064453125, 2.5421142578125, 2.74456787109375, 2.947021484375, 3.14947509765625, 3.3519287109375, 3.55438232421875, 3.7568359375, 3.95928955078125, 4.1617431640625, 4.36419677734375, 4.566650390625, 4.76910400390625, 4.9715576171875, 5.17401123046875, 5.37646484375, 5.57891845703125, 5.7813720703125, 5.98382568359375, 6.186279296875, 6.38873291015625, 6.5911865234375, 6.79364013671875, 6.99609375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 11.0, 23.0, 85.0, 240.0, 346.0, 191.0, 56.0, 15.0, 12.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-170.98623657226562, -166.50924682617188, -162.03225708007812, -157.55528259277344, -153.0782928466797, -148.60130310058594, -144.1243133544922, -139.64732360839844, -135.17034912109375, -130.693359375, -126.21637725830078, -121.73938751220703, -117.26240539550781, -112.78541564941406, -108.30842590332031, -103.83143615722656, -99.35444641113281, -94.87745666503906, -90.40047454833984, -85.9234848022461, -81.44650268554688, -76.96951293945312, -72.49252319335938, -68.01553344726562, -63.538551330566406, -59.06156539916992, -54.58457946777344, -50.10758972167969, -45.6306037902832, -41.15361785888672, -36.67662811279297, -32.199642181396484, -27.72266387939453, -23.245677947998047, -18.76869010925293, -14.291703224182129, -9.814716339111328, -5.337730407714844, -0.8607425689697266, 3.6162452697753906, 8.093231201171875, 12.570218086242676, 17.047204971313477, 21.524192810058594, 26.001178741455078, 30.478164672851562, 34.95515441894531, 39.4321403503418, 43.90912628173828, 48.386112213134766, 52.86309814453125, 57.340087890625, 61.817073822021484, 66.29405975341797, 70.77104949951172, 75.24803161621094, 79.72502136230469, 84.20201110839844, 88.67899322509766, 93.1559829711914, 97.63296508789062, 102.10995483398438, 106.58694458007812, 111.06393432617188, 115.5409164428711]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 6.0, 6.0, 8.0, 11.0, 11.0, 24.0, 20.0, 30.0, 29.0, 38.0, 43.0, 44.0, 63.0, 72.0, 71.0, 69.0, 77.0, 64.0, 51.0, 48.0, 49.0, 32.0, 26.0, 21.0, 26.0, 10.0, 24.0, 10.0, 3.0, 4.0, 6.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.24105072021484, -68.01504516601562, -65.7890396118164, -63.56303024291992, -61.3370246887207, -59.111019134521484, -56.885009765625, -54.65900421142578, -52.43299865722656, -50.206993103027344, -47.980987548828125, -45.75497817993164, -43.52897262573242, -41.3029670715332, -39.07695770263672, -36.8509521484375, -34.62494659423828, -32.39894104003906, -30.17293357849121, -27.94692611694336, -25.72092056274414, -23.494915008544922, -21.26890754699707, -19.04290008544922, -16.81689453125, -14.590888023376465, -12.36488151550293, -10.138875007629395, -7.912868499755859, -5.686861991882324, -3.460855484008789, -1.234848976135254, 0.99114990234375, 3.217156410217285, 5.44316291809082, 7.6691694259643555, 9.89517593383789, 12.121182441711426, 14.347188949584961, 16.573196411132812, 18.79920196533203, 21.02520751953125, 23.2512149810791, 25.477222442626953, 27.703227996826172, 29.92923355102539, 32.155242919921875, 34.381248474121094, 36.60725402832031, 38.83325958251953, 41.05926513671875, 43.285274505615234, 45.51128005981445, 47.73728561401367, 49.963294982910156, 52.189300537109375, 54.415306091308594, 56.64131164550781, 58.86731719970703, 61.093326568603516, 63.319332122802734, 65.54534149169922, 67.77134704589844, 69.99735260009766, 72.22335815429688]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 7.0, 6.0, 13.0, 22.0, 21.0, 53.0, 97.0, 204.0, 441.0, 1146.0, 3869.0, 37867.0, 3132717.0, 995478.0, 18327.0, 2600.0, 759.0, 265.0, 140.0, 69.0, 47.0, 26.0, 26.0, 21.0, 8.0, 15.0, 3.0, 5.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.84375, -10.4400634765625, -10.036376953125, -9.6326904296875, -9.22900390625, -8.8253173828125, -8.421630859375, -8.0179443359375, -7.6142578125, -7.2105712890625, -6.806884765625, -6.4031982421875, -5.99951171875, -5.5958251953125, -5.192138671875, -4.7884521484375, -4.384765625, -3.9810791015625, -3.577392578125, -3.1737060546875, -2.77001953125, -2.3663330078125, -1.962646484375, -1.5589599609375, -1.1552734375, -0.7515869140625, -0.347900390625, 0.0557861328125, 0.45947265625, 0.8631591796875, 1.266845703125, 1.6705322265625, 2.07421875, 2.4779052734375, 2.881591796875, 3.2852783203125, 3.68896484375, 4.0926513671875, 4.496337890625, 4.9000244140625, 5.3037109375, 5.7073974609375, 6.111083984375, 6.5147705078125, 6.91845703125, 7.3221435546875, 7.725830078125, 8.1295166015625, 8.533203125, 8.9368896484375, 9.340576171875, 9.7442626953125, 10.14794921875, 10.5516357421875, 10.955322265625, 11.3590087890625, 11.7626953125, 12.1663818359375, 12.570068359375, 12.9737548828125, 13.37744140625, 13.7811279296875, 14.184814453125, 14.5885009765625, 14.9921875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 4.0, 8.0, 9.0, 11.0, 13.0, 23.0, 33.0, 45.0, 49.0, 37.0, 55.0, 64.0, 64.0, 67.0, 58.0, 56.0, 61.0, 49.0, 47.0, 41.0, 42.0, 44.0, 28.0, 18.0, 16.0, 12.0, 13.0, 8.0, 9.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.876953125, -3.7701416015625, -3.663330078125, -3.5565185546875, -3.44970703125, -3.3428955078125, -3.236083984375, -3.1292724609375, -3.0224609375, -2.9156494140625, -2.808837890625, -2.7020263671875, -2.59521484375, -2.4884033203125, -2.381591796875, -2.2747802734375, -2.16796875, -2.0611572265625, -1.954345703125, -1.8475341796875, -1.74072265625, -1.6339111328125, -1.527099609375, -1.4202880859375, -1.3134765625, -1.2066650390625, -1.099853515625, -0.9930419921875, -0.88623046875, -0.7794189453125, -0.672607421875, -0.5657958984375, -0.458984375, -0.3521728515625, -0.245361328125, -0.1385498046875, -0.03173828125, 0.0750732421875, 0.181884765625, 0.2886962890625, 0.3955078125, 0.5023193359375, 0.609130859375, 0.7159423828125, 0.82275390625, 0.9295654296875, 1.036376953125, 1.1431884765625, 1.25, 1.3568115234375, 1.463623046875, 1.5704345703125, 1.67724609375, 1.7840576171875, 1.890869140625, 1.9976806640625, 2.1044921875, 2.2113037109375, 2.318115234375, 2.4249267578125, 2.53173828125, 2.6385498046875, 2.745361328125, 2.8521728515625, 2.958984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 16.0, 20.0, 25.0, 29.0, 59.0, 101.0, 199.0, 567.0, 1914.0, 12546.0, 214492.0, 3755646.0, 195373.0, 10789.0, 1631.0, 496.0, 170.0, 76.0, 47.0, 29.0, 16.0, 8.0, 9.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.71875, -14.326171875, -13.93359375, -13.541015625, -13.1484375, -12.755859375, -12.36328125, -11.970703125, -11.578125, -11.185546875, -10.79296875, -10.400390625, -10.0078125, -9.615234375, -9.22265625, -8.830078125, -8.4375, -8.044921875, -7.65234375, -7.259765625, -6.8671875, -6.474609375, -6.08203125, -5.689453125, -5.296875, -4.904296875, -4.51171875, -4.119140625, -3.7265625, -3.333984375, -2.94140625, -2.548828125, -2.15625, -1.763671875, -1.37109375, -0.978515625, -0.5859375, -0.193359375, 0.19921875, 0.591796875, 0.984375, 1.376953125, 1.76953125, 2.162109375, 2.5546875, 2.947265625, 3.33984375, 3.732421875, 4.125, 4.517578125, 4.91015625, 5.302734375, 5.6953125, 6.087890625, 6.48046875, 6.873046875, 7.265625, 7.658203125, 8.05078125, 8.443359375, 8.8359375, 9.228515625, 9.62109375, 10.013671875, 10.40625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 13.0, 5.0, 10.0, 20.0, 27.0, 46.0, 67.0, 73.0, 107.0, 151.0, 238.0, 404.0, 562.0, 638.0, 575.0, 381.0, 253.0, 162.0, 101.0, 67.0, 56.0, 34.0, 16.0, 10.0, 9.0, 13.0, 11.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4375, -8.185302734375, -7.93310546875, -7.680908203125, -7.4287109375, -7.176513671875, -6.92431640625, -6.672119140625, -6.419921875, -6.167724609375, -5.91552734375, -5.663330078125, -5.4111328125, -5.158935546875, -4.90673828125, -4.654541015625, -4.40234375, -4.150146484375, -3.89794921875, -3.645751953125, -3.3935546875, -3.141357421875, -2.88916015625, -2.636962890625, -2.384765625, -2.132568359375, -1.88037109375, -1.628173828125, -1.3759765625, -1.123779296875, -0.87158203125, -0.619384765625, -0.3671875, -0.114990234375, 0.13720703125, 0.389404296875, 0.6416015625, 0.893798828125, 1.14599609375, 1.398193359375, 1.650390625, 1.902587890625, 2.15478515625, 2.406982421875, 2.6591796875, 2.911376953125, 3.16357421875, 3.415771484375, 3.66796875, 3.920166015625, 4.17236328125, 4.424560546875, 4.6767578125, 4.928955078125, 5.18115234375, 5.433349609375, 5.685546875, 5.937744140625, 6.18994140625, 6.442138671875, 6.6943359375, 6.946533203125, 7.19873046875, 7.450927734375, 7.703125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 3.0, 5.0, 7.0, 22.0, 83.0, 270.0, 346.0, 183.0, 43.0, 25.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-170.75758361816406, -166.4038543701172, -162.05010986328125, -157.69638061523438, -153.3426513671875, -148.98892211914062, -144.63519287109375, -140.2814483642578, -135.92771911621094, -131.57398986816406, -127.22025299072266, -122.86651611328125, -118.51278686523438, -114.1590576171875, -109.8053207397461, -105.45158386230469, -101.09785461425781, -96.74412536621094, -92.39038848876953, -88.03665161132812, -83.68292236328125, -79.32919311523438, -74.97545623779297, -70.62171936035156, -66.26799011230469, -61.91425704956055, -57.560523986816406, -53.206790924072266, -48.853057861328125, -44.499324798583984, -40.145591735839844, -35.7918586730957, -31.438140869140625, -27.084407806396484, -22.730674743652344, -18.376941680908203, -14.023208618164062, -9.669475555419922, -5.315742492675781, -0.9620094299316406, 3.3917236328125, 7.745456695556641, 12.099189758300781, 16.452922821044922, 20.806655883789062, 25.160388946533203, 29.514122009277344, 33.867855072021484, 38.221588134765625, 42.575321197509766, 46.929054260253906, 51.28278732299805, 55.63652038574219, 59.99025344848633, 64.34398651123047, 68.69772338867188, 73.05145263671875, 77.40518188476562, 81.75891876220703, 86.11265563964844, 90.46638488769531, 94.82011413574219, 99.1738510131836, 103.527587890625, 107.88131713867188]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 7.0, 8.0, 9.0, 10.0, 7.0, 10.0, 16.0, 21.0, 26.0, 24.0, 38.0, 37.0, 45.0, 41.0, 44.0, 50.0, 49.0, 53.0, 46.0, 57.0, 46.0, 46.0, 33.0, 41.0, 40.0, 34.0, 32.0, 26.0, 21.0, 19.0, 20.0, 12.0, 9.0, 4.0, 2.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.55973815917969, -35.31806182861328, -34.07638168334961, -32.8347053527832, -31.593027114868164, -30.351348876953125, -29.10967254638672, -27.86799430847168, -26.62631607055664, -25.3846378326416, -24.142959594726562, -22.901283264160156, -21.659605026245117, -20.417926788330078, -19.176250457763672, -17.934572219848633, -16.692893981933594, -15.451215744018555, -14.209538459777832, -12.96786117553711, -11.72618293762207, -10.484504699707031, -9.242827415466309, -8.001150131225586, -6.759471893310547, -5.517794132232666, -4.276116371154785, -3.0344386100769043, -1.7927608489990234, -0.5510830879211426, 0.6905946731567383, 1.932271957397461, 3.1739463806152344, 4.415624141693115, 5.657301902770996, 6.898979663848877, 8.140657424926758, 9.382335662841797, 10.62401294708252, 11.865690231323242, 13.107368469238281, 14.34904670715332, 15.590723991394043, 16.832401275634766, 18.074079513549805, 19.315757751464844, 20.55743408203125, 21.79911231994629, 23.040790557861328, 24.282468795776367, 25.524147033691406, 26.765823364257812, 28.00750160217285, 29.24917984008789, 30.490856170654297, 31.732534408569336, 32.974212646484375, 34.21588897705078, 35.45756912231445, 36.69924545288086, 37.94092559814453, 39.18260192871094, 40.424278259277344, 41.66595458984375, 42.90763473510742]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 12.0, 8.0, 12.0, 19.0, 14.0, 33.0, 64.0, 91.0, 160.0, 316.0, 720.0, 1770.0, 6485.0, 42895.0, 485102.0, 460459.0, 41047.0, 6217.0, 1744.0, 668.0, 288.0, 163.0, 86.0, 59.0, 32.0, 22.0, 22.0, 8.0, 16.0, 6.0, 7.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7265625, -13.2530517578125, -12.779541015625, -12.3060302734375, -11.83251953125, -11.3590087890625, -10.885498046875, -10.4119873046875, -9.9384765625, -9.4649658203125, -8.991455078125, -8.5179443359375, -8.04443359375, -7.5709228515625, -7.097412109375, -6.6239013671875, -6.150390625, -5.6768798828125, -5.203369140625, -4.7298583984375, -4.25634765625, -3.7828369140625, -3.309326171875, -2.8358154296875, -2.3623046875, -1.8887939453125, -1.415283203125, -0.9417724609375, -0.46826171875, 0.0052490234375, 0.478759765625, 0.9522705078125, 1.42578125, 1.8992919921875, 2.372802734375, 2.8463134765625, 3.31982421875, 3.7933349609375, 4.266845703125, 4.7403564453125, 5.2138671875, 5.6873779296875, 6.160888671875, 6.6343994140625, 7.10791015625, 7.5814208984375, 8.054931640625, 8.5284423828125, 9.001953125, 9.4754638671875, 9.948974609375, 10.4224853515625, 10.89599609375, 11.3695068359375, 11.843017578125, 12.3165283203125, 12.7900390625, 13.2635498046875, 13.737060546875, 14.2105712890625, 14.68408203125, 15.1575927734375, 15.631103515625, 16.1046142578125, 16.578125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 6.0, 8.0, 9.0, 11.0, 4.0, 19.0, 15.0, 24.0, 27.0, 33.0, 40.0, 65.0, 57.0, 56.0, 60.0, 55.0, 61.0, 57.0, 58.0, 46.0, 48.0, 50.0, 41.0, 33.0, 14.0, 27.0, 22.0, 11.0, 13.0, 14.0, 7.0, 9.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.34375, -4.23577880859375, -4.1278076171875, -4.01983642578125, -3.911865234375, -3.80389404296875, -3.6959228515625, -3.58795166015625, -3.47998046875, -3.37200927734375, -3.2640380859375, -3.15606689453125, -3.048095703125, -2.94012451171875, -2.8321533203125, -2.72418212890625, -2.6162109375, -2.50823974609375, -2.4002685546875, -2.29229736328125, -2.184326171875, -2.07635498046875, -1.9683837890625, -1.86041259765625, -1.75244140625, -1.64447021484375, -1.5364990234375, -1.42852783203125, -1.320556640625, -1.21258544921875, -1.1046142578125, -0.99664306640625, -0.888671875, -0.78070068359375, -0.6727294921875, -0.56475830078125, -0.456787109375, -0.34881591796875, -0.2408447265625, -0.13287353515625, -0.02490234375, 0.08306884765625, 0.1910400390625, 0.29901123046875, 0.406982421875, 0.51495361328125, 0.6229248046875, 0.73089599609375, 0.8388671875, 0.94683837890625, 1.0548095703125, 1.16278076171875, 1.270751953125, 1.37872314453125, 1.4866943359375, 1.59466552734375, 1.70263671875, 1.81060791015625, 1.9185791015625, 2.02655029296875, 2.134521484375, 2.24249267578125, 2.3504638671875, 2.45843505859375, 2.56640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 18.0, 17.0, 23.0, 17.0, 25.0, 39.0, 67.0, 112.0, 185.0, 329.0, 580.0, 1226.0, 3168.0, 12275.0, 197893.0, 800229.0, 24099.0, 4774.0, 1682.0, 736.0, 407.0, 232.0, 132.0, 90.0, 60.0, 31.0, 28.0, 21.0, 14.0, 8.0, 11.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-30.046875, -29.16748046875, -28.2880859375, -27.40869140625, -26.529296875, -25.64990234375, -24.7705078125, -23.89111328125, -23.01171875, -22.13232421875, -21.2529296875, -20.37353515625, -19.494140625, -18.61474609375, -17.7353515625, -16.85595703125, -15.9765625, -15.09716796875, -14.2177734375, -13.33837890625, -12.458984375, -11.57958984375, -10.7001953125, -9.82080078125, -8.94140625, -8.06201171875, -7.1826171875, -6.30322265625, -5.423828125, -4.54443359375, -3.6650390625, -2.78564453125, -1.90625, -1.02685546875, -0.1474609375, 0.73193359375, 1.611328125, 2.49072265625, 3.3701171875, 4.24951171875, 5.12890625, 6.00830078125, 6.8876953125, 7.76708984375, 8.646484375, 9.52587890625, 10.4052734375, 11.28466796875, 12.1640625, 13.04345703125, 13.9228515625, 14.80224609375, 15.681640625, 16.56103515625, 17.4404296875, 18.31982421875, 19.19921875, 20.07861328125, 20.9580078125, 21.83740234375, 22.716796875, 23.59619140625, 24.4755859375, 25.35498046875, 26.234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 9.0, 5.0, 4.0, 6.0, 12.0, 13.0, 18.0, 22.0, 26.0, 35.0, 37.0, 45.0, 47.0, 56.0, 66.0, 91.0, 63.0, 69.0, 64.0, 70.0, 55.0, 43.0, 33.0, 28.0, 23.0, 18.0, 14.0, 11.0, 2.0, 7.0, 1.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.671875, -23.046875, -22.421875, -21.796875, -21.171875, -20.546875, -19.921875, -19.296875, -18.671875, -18.046875, -17.421875, -16.796875, -16.171875, -15.546875, -14.921875, -14.296875, -13.671875, -13.046875, -12.421875, -11.796875, -11.171875, -10.546875, -9.921875, -9.296875, -8.671875, -8.046875, -7.421875, -6.796875, -6.171875, -5.546875, -4.921875, -4.296875, -3.671875, -3.046875, -2.421875, -1.796875, -1.171875, -0.546875, 0.078125, 0.703125, 1.328125, 1.953125, 2.578125, 3.203125, 3.828125, 4.453125, 5.078125, 5.703125, 6.328125, 6.953125, 7.578125, 8.203125, 8.828125, 9.453125, 10.078125, 10.703125, 11.328125, 11.953125, 12.578125, 13.203125, 13.828125, 14.453125, 15.078125, 15.703125, 16.328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 9.0, 26.0, 26.0, 22.0, 33.0, 50.0, 105.0, 172.0, 345.0, 717.0, 2232.0, 11799.0, 141572.0, 837640.0, 45473.0, 5737.0, 1417.0, 512.0, 257.0, 156.0, 82.0, 55.0, 25.0, 17.0, 19.0, 9.0, 8.0, 4.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.96484375, -7.68341064453125, -7.4019775390625, -7.12054443359375, -6.839111328125, -6.55767822265625, -6.2762451171875, -5.99481201171875, -5.71337890625, -5.43194580078125, -5.1505126953125, -4.86907958984375, -4.587646484375, -4.30621337890625, -4.0247802734375, -3.74334716796875, -3.4619140625, -3.18048095703125, -2.8990478515625, -2.61761474609375, -2.336181640625, -2.05474853515625, -1.7733154296875, -1.49188232421875, -1.21044921875, -0.92901611328125, -0.6475830078125, -0.36614990234375, -0.084716796875, 0.19671630859375, 0.4781494140625, 0.75958251953125, 1.041015625, 1.32244873046875, 1.6038818359375, 1.88531494140625, 2.166748046875, 2.44818115234375, 2.7296142578125, 3.01104736328125, 3.29248046875, 3.57391357421875, 3.8553466796875, 4.13677978515625, 4.418212890625, 4.69964599609375, 4.9810791015625, 5.26251220703125, 5.5439453125, 5.82537841796875, 6.1068115234375, 6.38824462890625, 6.669677734375, 6.95111083984375, 7.2325439453125, 7.51397705078125, 7.79541015625, 8.07684326171875, 8.3582763671875, 8.63970947265625, 8.921142578125, 9.20257568359375, 9.4840087890625, 9.76544189453125, 10.046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 2.0, 5.0, 2.0, 5.0, 9.0, 9.0, 10.0, 23.0, 26.0, 25.0, 33.0, 40.0, 64.0, 81.0, 162.0, 180.0, 73.0, 49.0, 44.0, 33.0, 27.0, 24.0, 15.0, 9.0, 12.0, 8.0, 14.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0015125274658203125, -0.0014680325984954834, -0.0014235377311706543, -0.0013790428638458252, -0.001334547996520996, -0.001290053129196167, -0.0012455582618713379, -0.0012010633945465088, -0.0011565685272216797, -0.0011120736598968506, -0.0010675787925720215, -0.0010230839252471924, -0.0009785890579223633, -0.0009340941905975342, -0.0008895993232727051, -0.000845104455947876, -0.0008006095886230469, -0.0007561147212982178, -0.0007116198539733887, -0.0006671249866485596, -0.0006226301193237305, -0.0005781352519989014, -0.0005336403846740723, -0.0004891455173492432, -0.00044465065002441406, -0.00040015578269958496, -0.00035566091537475586, -0.00031116604804992676, -0.00026667118072509766, -0.00022217631340026855, -0.00017768144607543945, -0.00013318657875061035, -8.869171142578125e-05, -4.419684410095215e-05, 2.980232238769531e-07, 4.4792890548706055e-05, 8.928775787353516e-05, 0.00013378262519836426, 0.00017827749252319336, 0.00022277235984802246, 0.00026726722717285156, 0.00031176209449768066, 0.00035625696182250977, 0.00040075182914733887, 0.00044524669647216797, 0.0004897415637969971, 0.0005342364311218262, 0.0005787312984466553, 0.0006232261657714844, 0.0006677210330963135, 0.0007122159004211426, 0.0007567107677459717, 0.0008012056350708008, 0.0008457005023956299, 0.000890195369720459, 0.0009346902370452881, 0.0009791851043701172, 0.0010236799716949463, 0.0010681748390197754, 0.0011126697063446045, 0.0011571645736694336, 0.0012016594409942627, 0.0012461543083190918, 0.001290649175643921, 0.00133514404296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 7.0, 5.0, 6.0, 7.0, 8.0, 20.0, 21.0, 27.0, 35.0, 58.0, 65.0, 99.0, 151.0, 237.0, 429.0, 783.0, 1798.0, 4907.0, 18791.0, 151134.0, 799291.0, 54384.0, 10428.0, 3150.0, 1183.0, 581.0, 341.0, 193.0, 134.0, 92.0, 70.0, 29.0, 19.0, 15.0, 17.0, 16.0, 11.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-9.4765625, -9.23541259765625, -8.9942626953125, -8.75311279296875, -8.511962890625, -8.27081298828125, -8.0296630859375, -7.78851318359375, -7.54736328125, -7.30621337890625, -7.0650634765625, -6.82391357421875, -6.582763671875, -6.34161376953125, -6.1004638671875, -5.85931396484375, -5.6181640625, -5.37701416015625, -5.1358642578125, -4.89471435546875, -4.653564453125, -4.41241455078125, -4.1712646484375, -3.93011474609375, -3.68896484375, -3.44781494140625, -3.2066650390625, -2.96551513671875, -2.724365234375, -2.48321533203125, -2.2420654296875, -2.00091552734375, -1.759765625, -1.51861572265625, -1.2774658203125, -1.03631591796875, -0.795166015625, -0.55401611328125, -0.3128662109375, -0.07171630859375, 0.16943359375, 0.41058349609375, 0.6517333984375, 0.89288330078125, 1.134033203125, 1.37518310546875, 1.6163330078125, 1.85748291015625, 2.0986328125, 2.33978271484375, 2.5809326171875, 2.82208251953125, 3.063232421875, 3.30438232421875, 3.5455322265625, 3.78668212890625, 4.02783203125, 4.26898193359375, 4.5101318359375, 4.75128173828125, 4.992431640625, 5.23358154296875, 5.4747314453125, 5.71588134765625, 5.95703125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 4.0, 8.0, 9.0, 9.0, 10.0, 17.0, 11.0, 22.0, 44.0, 41.0, 63.0, 93.0, 145.0, 128.0, 98.0, 65.0, 42.0, 48.0, 33.0, 22.0, 17.0, 12.0, 10.0, 13.0, 11.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3046875, -7.0926513671875, -6.880615234375, -6.6685791015625, -6.45654296875, -6.2445068359375, -6.032470703125, -5.8204345703125, -5.6083984375, -5.3963623046875, -5.184326171875, -4.9722900390625, -4.76025390625, -4.5482177734375, -4.336181640625, -4.1241455078125, -3.912109375, -3.7000732421875, -3.488037109375, -3.2760009765625, -3.06396484375, -2.8519287109375, -2.639892578125, -2.4278564453125, -2.2158203125, -2.0037841796875, -1.791748046875, -1.5797119140625, -1.36767578125, -1.1556396484375, -0.943603515625, -0.7315673828125, -0.51953125, -0.3074951171875, -0.095458984375, 0.1165771484375, 0.32861328125, 0.5406494140625, 0.752685546875, 0.9647216796875, 1.1767578125, 1.3887939453125, 1.600830078125, 1.8128662109375, 2.02490234375, 2.2369384765625, 2.448974609375, 2.6610107421875, 2.873046875, 3.0850830078125, 3.297119140625, 3.5091552734375, 3.72119140625, 3.9332275390625, 4.145263671875, 4.3572998046875, 4.5693359375, 4.7813720703125, 4.993408203125, 5.2054443359375, 5.41748046875, 5.6295166015625, 5.841552734375, 6.0535888671875, 6.265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 8.0, 30.0, 73.0, 163.0, 322.0, 215.0, 104.0, 47.0, 8.0, 3.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.19256591796875, -138.37570190429688, -133.558837890625, -128.74197387695312, -123.92511749267578, -119.1082534790039, -114.29139709472656, -109.47453308105469, -104.65766906738281, -99.84080505371094, -95.02394104003906, -90.20708465576172, -85.39022064208984, -80.57335662841797, -75.75650024414062, -70.93963623046875, -66.12277221679688, -61.305908203125, -56.48904800415039, -51.67218780517578, -46.855323791503906, -42.03845977783203, -37.22159957885742, -32.40473937988281, -27.587875366210938, -22.771013259887695, -17.954151153564453, -13.137289047241211, -8.320426940917969, -3.5035648345947266, 1.3132972717285156, 6.130157470703125, 10.947021484375, 15.763883590698242, 20.580745697021484, 25.397607803344727, 30.21446990966797, 35.031333923339844, 39.84819412231445, 44.66505432128906, 49.48191833496094, 54.29878234863281, 59.11564254760742, 63.93250274658203, 68.7493667602539, 73.56623077392578, 78.38308715820312, 83.199951171875, 88.01681518554688, 92.83367919921875, 97.65054321289062, 102.46739959716797, 107.28426361083984, 112.10112762451172, 116.91798400878906, 121.73484802246094, 126.55171203613281, 131.3685760498047, 136.18544006347656, 141.00230407714844, 145.81915283203125, 150.63601684570312, 155.452880859375, 160.26974487304688, 165.08660888671875]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 6.0, 10.0, 6.0, 3.0, 8.0, 9.0, 15.0, 13.0, 27.0, 22.0, 21.0, 32.0, 29.0, 23.0, 35.0, 41.0, 34.0, 38.0, 59.0, 70.0, 64.0, 70.0, 40.0, 40.0, 28.0, 37.0, 33.0, 25.0, 23.0, 19.0, 18.0, 26.0, 9.0, 12.0, 8.0, 10.0, 6.0, 5.0, 3.0, 6.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.53842544555664, -47.97980880737305, -46.42118835449219, -44.862571716308594, -43.303951263427734, -41.74533462524414, -40.18671417236328, -38.62809753417969, -37.069480895996094, -35.5108642578125, -33.95224380493164, -32.39362716674805, -30.835006713867188, -29.276390075683594, -27.717771530151367, -26.15915298461914, -24.60053253173828, -23.041913986206055, -21.483295440673828, -19.924678802490234, -18.366058349609375, -16.80744171142578, -15.248823165893555, -13.690204620361328, -12.131586074829102, -10.572967529296875, -9.014348983764648, -7.455731391906738, -5.897112846374512, -4.338494300842285, -2.779876708984375, -1.2212581634521484, 0.3373565673828125, 1.89597487449646, 3.4545931816101074, 5.013211250305176, 6.571829795837402, 8.130448341369629, 9.689065933227539, 11.247684478759766, 12.806303024291992, 14.364921569824219, 15.923540115356445, 17.482158660888672, 19.040775299072266, 20.599395751953125, 22.15801239013672, 23.716630935668945, 25.275249481201172, 26.8338680267334, 28.392486572265625, 29.95110321044922, 31.509723663330078, 33.06834030151367, 34.62696075439453, 36.185577392578125, 37.74419403076172, 39.30281066894531, 40.86143112182617, 42.420047760009766, 43.978668212890625, 45.53728485107422, 47.09590148925781, 48.65452194213867, 50.21314239501953]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 15.0, 11.0, 20.0, 21.0, 27.0, 59.0, 84.0, 130.0, 273.0, 519.0, 1311.0, 4830.0, 44206.0, 2963287.0, 1148282.0, 25295.0, 3788.0, 1137.0, 470.0, 199.0, 97.0, 91.0, 43.0, 14.0, 18.0, 10.0, 8.0, 9.0, 2.0, 6.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6875, -9.313232421875, -8.93896484375, -8.564697265625, -8.1904296875, -7.816162109375, -7.44189453125, -7.067626953125, -6.693359375, -6.319091796875, -5.94482421875, -5.570556640625, -5.1962890625, -4.822021484375, -4.44775390625, -4.073486328125, -3.69921875, -3.324951171875, -2.95068359375, -2.576416015625, -2.2021484375, -1.827880859375, -1.45361328125, -1.079345703125, -0.705078125, -0.330810546875, 0.04345703125, 0.417724609375, 0.7919921875, 1.166259765625, 1.54052734375, 1.914794921875, 2.2890625, 2.663330078125, 3.03759765625, 3.411865234375, 3.7861328125, 4.160400390625, 4.53466796875, 4.908935546875, 5.283203125, 5.657470703125, 6.03173828125, 6.406005859375, 6.7802734375, 7.154541015625, 7.52880859375, 7.903076171875, 8.27734375, 8.651611328125, 9.02587890625, 9.400146484375, 9.7744140625, 10.148681640625, 10.52294921875, 10.897216796875, 11.271484375, 11.645751953125, 12.02001953125, 12.394287109375, 12.7685546875, 13.142822265625, 13.51708984375, 13.891357421875, 14.265625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 12.0, 11.0, 27.0, 22.0, 49.0, 46.0, 67.0, 71.0, 92.0, 83.0, 88.0, 88.0, 90.0, 65.0, 58.0, 34.0, 23.0, 28.0, 25.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.50390625, -6.34521484375, -6.1865234375, -6.02783203125, -5.869140625, -5.71044921875, -5.5517578125, -5.39306640625, -5.234375, -5.07568359375, -4.9169921875, -4.75830078125, -4.599609375, -4.44091796875, -4.2822265625, -4.12353515625, -3.96484375, -3.80615234375, -3.6474609375, -3.48876953125, -3.330078125, -3.17138671875, -3.0126953125, -2.85400390625, -2.6953125, -2.53662109375, -2.3779296875, -2.21923828125, -2.060546875, -1.90185546875, -1.7431640625, -1.58447265625, -1.42578125, -1.26708984375, -1.1083984375, -0.94970703125, -0.791015625, -0.63232421875, -0.4736328125, -0.31494140625, -0.15625, 0.00244140625, 0.1611328125, 0.31982421875, 0.478515625, 0.63720703125, 0.7958984375, 0.95458984375, 1.11328125, 1.27197265625, 1.4306640625, 1.58935546875, 1.748046875, 1.90673828125, 2.0654296875, 2.22412109375, 2.3828125, 2.54150390625, 2.7001953125, 2.85888671875, 3.017578125, 3.17626953125, 3.3349609375, 3.49365234375, 3.65234375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 9.0, 20.0, 26.0, 41.0, 64.0, 95.0, 161.0, 289.0, 608.0, 1274.0, 3689.0, 17944.0, 194957.0, 3630733.0, 316006.0, 21202.0, 4169.0, 1438.0, 686.0, 341.0, 186.0, 122.0, 73.0, 46.0, 23.0, 15.0, 14.0, 6.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.125, -10.7611083984375, -10.397216796875, -10.0333251953125, -9.66943359375, -9.3055419921875, -8.941650390625, -8.5777587890625, -8.2138671875, -7.8499755859375, -7.486083984375, -7.1221923828125, -6.75830078125, -6.3944091796875, -6.030517578125, -5.6666259765625, -5.302734375, -4.9388427734375, -4.574951171875, -4.2110595703125, -3.84716796875, -3.4832763671875, -3.119384765625, -2.7554931640625, -2.3916015625, -2.0277099609375, -1.663818359375, -1.2999267578125, -0.93603515625, -0.5721435546875, -0.208251953125, 0.1556396484375, 0.51953125, 0.8834228515625, 1.247314453125, 1.6112060546875, 1.97509765625, 2.3389892578125, 2.702880859375, 3.0667724609375, 3.4306640625, 3.7945556640625, 4.158447265625, 4.5223388671875, 4.88623046875, 5.2501220703125, 5.614013671875, 5.9779052734375, 6.341796875, 6.7056884765625, 7.069580078125, 7.4334716796875, 7.79736328125, 8.1612548828125, 8.525146484375, 8.8890380859375, 9.2529296875, 9.6168212890625, 9.980712890625, 10.3446044921875, 10.70849609375, 11.0723876953125, 11.436279296875, 11.8001708984375, 12.1640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 10.0, 10.0, 23.0, 23.0, 44.0, 63.0, 100.0, 211.0, 448.0, 883.0, 1012.0, 642.0, 306.0, 143.0, 69.0, 25.0, 23.0, 14.0, 4.0, 8.0, 8.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.484375, -13.0653076171875, -12.646240234375, -12.2271728515625, -11.80810546875, -11.3890380859375, -10.969970703125, -10.5509033203125, -10.1318359375, -9.7127685546875, -9.293701171875, -8.8746337890625, -8.45556640625, -8.0364990234375, -7.617431640625, -7.1983642578125, -6.779296875, -6.3602294921875, -5.941162109375, -5.5220947265625, -5.10302734375, -4.6839599609375, -4.264892578125, -3.8458251953125, -3.4267578125, -3.0076904296875, -2.588623046875, -2.1695556640625, -1.75048828125, -1.3314208984375, -0.912353515625, -0.4932861328125, -0.07421875, 0.3448486328125, 0.763916015625, 1.1829833984375, 1.60205078125, 2.0211181640625, 2.440185546875, 2.8592529296875, 3.2783203125, 3.6973876953125, 4.116455078125, 4.5355224609375, 4.95458984375, 5.3736572265625, 5.792724609375, 6.2117919921875, 6.630859375, 7.0499267578125, 7.468994140625, 7.8880615234375, 8.30712890625, 8.7261962890625, 9.145263671875, 9.5643310546875, 9.9833984375, 10.4024658203125, 10.821533203125, 11.2406005859375, 11.65966796875, 12.0787353515625, 12.497802734375, 12.9168701171875, 13.3359375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 11.0, 15.0, 34.0, 66.0, 115.0, 197.0, 229.0, 152.0, 75.0, 40.0, 26.0, 6.0, 9.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.24626922607422, -101.27145385742188, -98.29664611816406, -95.32183074951172, -92.34701538085938, -89.37220764160156, -86.39739227294922, -83.42257690429688, -80.44776916503906, -77.47295379638672, -74.4981460571289, -71.52333068847656, -68.54852294921875, -65.5737075805664, -62.59889221191406, -59.624080657958984, -56.649269104003906, -53.67445755004883, -50.69964599609375, -47.724830627441406, -44.75001907348633, -41.77520751953125, -38.800392150878906, -35.82558059692383, -32.85076904296875, -29.875957489013672, -26.90114402770996, -23.92633056640625, -20.951519012451172, -17.976707458496094, -15.001893997192383, -12.027080535888672, -9.052268981933594, -6.077456474304199, -3.1026439666748047, -0.12783145904541016, 2.8469810485839844, 5.821793556213379, 8.796606063842773, 11.771419525146484, 14.746231079101562, 17.72104263305664, 20.69585609436035, 23.670669555664062, 26.64548110961914, 29.62029266357422, 32.59510803222656, 35.56991958618164, 38.54473114013672, 41.5195426940918, 44.494354248046875, 47.46916961669922, 50.4439811706543, 53.418792724609375, 56.39360809326172, 59.3684196472168, 62.343231201171875, 65.31804656982422, 68.29285430908203, 71.26766967773438, 74.24247741699219, 77.21729278564453, 80.19210815429688, 83.16691589355469, 86.14173126220703]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 6.0, 4.0, 14.0, 20.0, 17.0, 18.0, 19.0, 34.0, 22.0, 42.0, 54.0, 43.0, 41.0, 49.0, 69.0, 75.0, 52.0, 55.0, 49.0, 36.0, 42.0, 42.0, 30.0, 24.0, 24.0, 29.0, 11.0, 14.0, 7.0, 15.0, 8.0, 12.0, 5.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-50.59830093383789, -49.202613830566406, -47.80692672729492, -46.41123962402344, -45.01555633544922, -43.619869232177734, -42.22418212890625, -40.828495025634766, -39.43280792236328, -38.0371208190918, -36.64143371582031, -35.24574661254883, -33.850059509277344, -32.454376220703125, -31.05868911743164, -29.663002014160156, -28.267314910888672, -26.871627807617188, -25.475940704345703, -24.08025550842285, -22.684568405151367, -21.288881301879883, -19.89319610595703, -18.497509002685547, -17.101821899414062, -15.706134796142578, -14.31044864654541, -12.914762496948242, -11.519075393676758, -10.123388290405273, -8.727702140808105, -7.3320159912109375, -5.9363250732421875, -4.540638446807861, -3.144951820373535, -1.749265193939209, -0.3535785675048828, 1.0421080589294434, 2.4377946853637695, 3.8334808349609375, 5.229167938232422, 6.624854564666748, 8.020541191101074, 9.416227340698242, 10.811914443969727, 12.207601547241211, 13.603287696838379, 14.998973846435547, 16.39466094970703, 17.790348052978516, 19.18603515625, 20.58172035217285, 21.977407455444336, 23.37309455871582, 24.768779754638672, 26.164466857910156, 27.56015396118164, 28.955841064453125, 30.35152816772461, 31.74721336364746, 33.14289855957031, 34.5385856628418, 35.93427276611328, 37.329959869384766, 38.72564697265625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 6.0, 7.0, 6.0, 13.0, 17.0, 29.0, 37.0, 56.0, 82.0, 163.0, 283.0, 589.0, 1658.0, 6508.0, 46912.0, 726023.0, 242877.0, 17926.0, 3388.0, 1023.0, 438.0, 180.0, 112.0, 59.0, 57.0, 34.0, 21.0, 12.0, 10.0, 6.0, 7.0, 3.0, 4.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.015625, -15.459228515625, -14.90283203125, -14.346435546875, -13.7900390625, -13.233642578125, -12.67724609375, -12.120849609375, -11.564453125, -11.008056640625, -10.45166015625, -9.895263671875, -9.3388671875, -8.782470703125, -8.22607421875, -7.669677734375, -7.11328125, -6.556884765625, -6.00048828125, -5.444091796875, -4.8876953125, -4.331298828125, -3.77490234375, -3.218505859375, -2.662109375, -2.105712890625, -1.54931640625, -0.992919921875, -0.4365234375, 0.119873046875, 0.67626953125, 1.232666015625, 1.7890625, 2.345458984375, 2.90185546875, 3.458251953125, 4.0146484375, 4.571044921875, 5.12744140625, 5.683837890625, 6.240234375, 6.796630859375, 7.35302734375, 7.909423828125, 8.4658203125, 9.022216796875, 9.57861328125, 10.135009765625, 10.69140625, 11.247802734375, 11.80419921875, 12.360595703125, 12.9169921875, 13.473388671875, 14.02978515625, 14.586181640625, 15.142578125, 15.698974609375, 16.25537109375, 16.811767578125, 17.3681640625, 17.924560546875, 18.48095703125, 19.037353515625, 19.59375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 11.0, 6.0, 14.0, 19.0, 28.0, 37.0, 33.0, 62.0, 64.0, 72.0, 77.0, 74.0, 95.0, 65.0, 81.0, 73.0, 38.0, 45.0, 34.0, 22.0, 16.0, 15.0, 8.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2734375, -6.11578369140625, -5.9581298828125, -5.80047607421875, -5.642822265625, -5.48516845703125, -5.3275146484375, -5.16986083984375, -5.01220703125, -4.85455322265625, -4.6968994140625, -4.53924560546875, -4.381591796875, -4.22393798828125, -4.0662841796875, -3.90863037109375, -3.7509765625, -3.59332275390625, -3.4356689453125, -3.27801513671875, -3.120361328125, -2.96270751953125, -2.8050537109375, -2.64739990234375, -2.48974609375, -2.33209228515625, -2.1744384765625, -2.01678466796875, -1.859130859375, -1.70147705078125, -1.5438232421875, -1.38616943359375, -1.228515625, -1.07086181640625, -0.9132080078125, -0.75555419921875, -0.597900390625, -0.44024658203125, -0.2825927734375, -0.12493896484375, 0.03271484375, 0.19036865234375, 0.3480224609375, 0.50567626953125, 0.663330078125, 0.82098388671875, 0.9786376953125, 1.13629150390625, 1.2939453125, 1.45159912109375, 1.6092529296875, 1.76690673828125, 1.924560546875, 2.08221435546875, 2.2398681640625, 2.39752197265625, 2.55517578125, 2.71282958984375, 2.8704833984375, 3.02813720703125, 3.185791015625, 3.34344482421875, 3.5010986328125, 3.65875244140625, 3.81640625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 15.0, 17.0, 29.0, 46.0, 106.0, 204.0, 499.0, 1652.0, 9763.0, 920773.0, 109273.0, 4514.0, 980.0, 355.0, 143.0, 66.0, 36.0, 34.0, 14.0, 12.0, 11.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-50.59375, -49.140625, -47.6875, -46.234375, -44.78125, -43.328125, -41.875, -40.421875, -38.96875, -37.515625, -36.0625, -34.609375, -33.15625, -31.703125, -30.25, -28.796875, -27.34375, -25.890625, -24.4375, -22.984375, -21.53125, -20.078125, -18.625, -17.171875, -15.71875, -14.265625, -12.8125, -11.359375, -9.90625, -8.453125, -7.0, -5.546875, -4.09375, -2.640625, -1.1875, 0.265625, 1.71875, 3.171875, 4.625, 6.078125, 7.53125, 8.984375, 10.4375, 11.890625, 13.34375, 14.796875, 16.25, 17.703125, 19.15625, 20.609375, 22.0625, 23.515625, 24.96875, 26.421875, 27.875, 29.328125, 30.78125, 32.234375, 33.6875, 35.140625, 36.59375, 38.046875, 39.5, 40.953125, 42.40625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 8.0, 4.0, 10.0, 25.0, 17.0, 31.0, 45.0, 60.0, 91.0, 92.0, 88.0, 108.0, 113.0, 82.0, 74.0, 46.0, 28.0, 29.0, 17.0, 14.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.25, -30.38330078125, -29.5166015625, -28.64990234375, -27.783203125, -26.91650390625, -26.0498046875, -25.18310546875, -24.31640625, -23.44970703125, -22.5830078125, -21.71630859375, -20.849609375, -19.98291015625, -19.1162109375, -18.24951171875, -17.3828125, -16.51611328125, -15.6494140625, -14.78271484375, -13.916015625, -13.04931640625, -12.1826171875, -11.31591796875, -10.44921875, -9.58251953125, -8.7158203125, -7.84912109375, -6.982421875, -6.11572265625, -5.2490234375, -4.38232421875, -3.515625, -2.64892578125, -1.7822265625, -0.91552734375, -0.048828125, 0.81787109375, 1.6845703125, 2.55126953125, 3.41796875, 4.28466796875, 5.1513671875, 6.01806640625, 6.884765625, 7.75146484375, 8.6181640625, 9.48486328125, 10.3515625, 11.21826171875, 12.0849609375, 12.95166015625, 13.818359375, 14.68505859375, 15.5517578125, 16.41845703125, 17.28515625, 18.15185546875, 19.0185546875, 19.88525390625, 20.751953125, 21.61865234375, 22.4853515625, 23.35205078125, 24.21875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 3.0, 8.0, 1.0, 6.0, 5.0, 10.0, 19.0, 25.0, 24.0, 55.0, 104.0, 163.0, 292.0, 906.0, 3776.0, 32341.0, 933851.0, 68944.0, 5913.0, 1284.0, 394.0, 185.0, 85.0, 65.0, 23.0, 15.0, 13.0, 12.0, 10.0, 6.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8515625, -9.467041015625, -9.08251953125, -8.697998046875, -8.3134765625, -7.928955078125, -7.54443359375, -7.159912109375, -6.775390625, -6.390869140625, -6.00634765625, -5.621826171875, -5.2373046875, -4.852783203125, -4.46826171875, -4.083740234375, -3.69921875, -3.314697265625, -2.93017578125, -2.545654296875, -2.1611328125, -1.776611328125, -1.39208984375, -1.007568359375, -0.623046875, -0.238525390625, 0.14599609375, 0.530517578125, 0.9150390625, 1.299560546875, 1.68408203125, 2.068603515625, 2.453125, 2.837646484375, 3.22216796875, 3.606689453125, 3.9912109375, 4.375732421875, 4.76025390625, 5.144775390625, 5.529296875, 5.913818359375, 6.29833984375, 6.682861328125, 7.0673828125, 7.451904296875, 7.83642578125, 8.220947265625, 8.60546875, 8.989990234375, 9.37451171875, 9.759033203125, 10.1435546875, 10.528076171875, 10.91259765625, 11.297119140625, 11.681640625, 12.066162109375, 12.45068359375, 12.835205078125, 13.2197265625, 13.604248046875, 13.98876953125, 14.373291015625, 14.7578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 1.0, 5.0, 8.0, 13.0, 12.0, 12.0, 24.0, 27.0, 31.0, 72.0, 144.0, 254.0, 158.0, 77.0, 42.0, 26.0, 24.0, 11.0, 16.0, 11.0, 4.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002162933349609375, -0.0021020472049713135, -0.002041161060333252, -0.0019802749156951904, -0.001919388771057129, -0.0018585026264190674, -0.0017976164817810059, -0.0017367303371429443, -0.0016758441925048828, -0.0016149580478668213, -0.0015540719032287598, -0.0014931857585906982, -0.0014322996139526367, -0.0013714134693145752, -0.0013105273246765137, -0.0012496411800384521, -0.0011887550354003906, -0.001127868890762329, -0.0010669827461242676, -0.001006096601486206, -0.0009452104568481445, -0.000884324312210083, -0.0008234381675720215, -0.00076255202293396, -0.0007016658782958984, -0.0006407797336578369, -0.0005798935890197754, -0.0005190074443817139, -0.00045812129974365234, -0.0003972351551055908, -0.0003363490104675293, -0.0002754628658294678, -0.00021457672119140625, -0.00015369057655334473, -9.28044319152832e-05, -3.191828727722168e-05, 2.8967857360839844e-05, 8.985400199890137e-05, 0.0001507401466369629, 0.00021162629127502441, 0.00027251243591308594, 0.00033339858055114746, 0.000394284725189209, 0.0004551708698272705, 0.000516057014465332, 0.0005769431591033936, 0.0006378293037414551, 0.0006987154483795166, 0.0007596015930175781, 0.0008204877376556396, 0.0008813738822937012, 0.0009422600269317627, 0.0010031461715698242, 0.0010640323162078857, 0.0011249184608459473, 0.0011858046054840088, 0.0012466907501220703, 0.0013075768947601318, 0.0013684630393981934, 0.0014293491840362549, 0.0014902353286743164, 0.001551121473312378, 0.0016120076179504395, 0.001672893762588501, 0.0017337799072265625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 9.0, 2.0, 7.0, 7.0, 29.0, 26.0, 31.0, 28.0, 46.0, 73.0, 99.0, 134.0, 196.0, 308.0, 459.0, 847.0, 1641.0, 3896.0, 10797.0, 39327.0, 357377.0, 569921.0, 43502.0, 11671.0, 4043.0, 1708.0, 877.0, 473.0, 288.0, 222.0, 140.0, 117.0, 58.0, 45.0, 37.0, 33.0, 28.0, 17.0, 10.0, 7.0, 9.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-5.77734375, -5.60760498046875, -5.4378662109375, -5.26812744140625, -5.098388671875, -4.92864990234375, -4.7589111328125, -4.58917236328125, -4.41943359375, -4.24969482421875, -4.0799560546875, -3.91021728515625, -3.740478515625, -3.57073974609375, -3.4010009765625, -3.23126220703125, -3.0615234375, -2.89178466796875, -2.7220458984375, -2.55230712890625, -2.382568359375, -2.21282958984375, -2.0430908203125, -1.87335205078125, -1.70361328125, -1.53387451171875, -1.3641357421875, -1.19439697265625, -1.024658203125, -0.85491943359375, -0.6851806640625, -0.51544189453125, -0.345703125, -0.17596435546875, -0.0062255859375, 0.16351318359375, 0.333251953125, 0.50299072265625, 0.6727294921875, 0.84246826171875, 1.01220703125, 1.18194580078125, 1.3516845703125, 1.52142333984375, 1.691162109375, 1.86090087890625, 2.0306396484375, 2.20037841796875, 2.3701171875, 2.53985595703125, 2.7095947265625, 2.87933349609375, 3.049072265625, 3.21881103515625, 3.3885498046875, 3.55828857421875, 3.72802734375, 3.89776611328125, 4.0675048828125, 4.23724365234375, 4.406982421875, 4.57672119140625, 4.7464599609375, 4.91619873046875, 5.0859375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 8.0, 3.0, 3.0, 12.0, 8.0, 15.0, 20.0, 17.0, 37.0, 59.0, 97.0, 143.0, 153.0, 139.0, 93.0, 55.0, 41.0, 23.0, 19.0, 14.0, 10.0, 9.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-6.84765625, -6.66571044921875, -6.4837646484375, -6.30181884765625, -6.119873046875, -5.93792724609375, -5.7559814453125, -5.57403564453125, -5.39208984375, -5.21014404296875, -5.0281982421875, -4.84625244140625, -4.664306640625, -4.48236083984375, -4.3004150390625, -4.11846923828125, -3.9365234375, -3.75457763671875, -3.5726318359375, -3.39068603515625, -3.208740234375, -3.02679443359375, -2.8448486328125, -2.66290283203125, -2.48095703125, -2.29901123046875, -2.1170654296875, -1.93511962890625, -1.753173828125, -1.57122802734375, -1.3892822265625, -1.20733642578125, -1.025390625, -0.84344482421875, -0.6614990234375, -0.47955322265625, -0.297607421875, -0.11566162109375, 0.0662841796875, 0.24822998046875, 0.43017578125, 0.61212158203125, 0.7940673828125, 0.97601318359375, 1.157958984375, 1.33990478515625, 1.5218505859375, 1.70379638671875, 1.8857421875, 2.06768798828125, 2.2496337890625, 2.43157958984375, 2.613525390625, 2.79547119140625, 2.9774169921875, 3.15936279296875, 3.34130859375, 3.52325439453125, 3.7052001953125, 3.88714599609375, 4.069091796875, 4.25103759765625, 4.4329833984375, 4.61492919921875, 4.796875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 7.0, 3.0, 6.0, 7.0, 7.0, 12.0, 15.0, 30.0, 58.0, 98.0, 184.0, 232.0, 125.0, 100.0, 42.0, 30.0, 13.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-104.38017272949219, -101.65333557128906, -98.92649841308594, -96.19966125488281, -93.47282409667969, -90.74598693847656, -88.01914978027344, -85.29231262207031, -82.56547546386719, -79.83863830566406, -77.11180114746094, -74.38496398925781, -71.65812683105469, -68.93128967285156, -66.20445251464844, -63.47761535644531, -60.75078201293945, -58.02394485473633, -55.2971076965332, -52.57027053833008, -49.84343338012695, -47.11659622192383, -44.38976287841797, -41.662925720214844, -38.93608856201172, -36.209251403808594, -33.48241424560547, -30.755577087402344, -28.02873992919922, -25.301902770996094, -22.5750675201416, -19.848230361938477, -17.12139129638672, -14.394554138183594, -11.667716979980469, -8.94088077545166, -6.214043617248535, -3.48720645904541, -0.7603702545166016, 1.9664669036865234, 4.693304061889648, 7.420141220092773, 10.146978378295898, 12.873814582824707, 15.600651741027832, 18.32748794555664, 21.054325103759766, 23.78116226196289, 26.507999420166016, 29.23483657836914, 31.961673736572266, 34.68851089477539, 37.415348052978516, 40.14218521118164, 42.8690185546875, 45.595855712890625, 48.32269287109375, 51.049530029296875, 53.7763671875, 56.503204345703125, 59.23004150390625, 61.956878662109375, 64.6837158203125, 67.41055297851562, 70.13739013671875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 7.0, 9.0, 5.0, 12.0, 14.0, 15.0, 27.0, 23.0, 26.0, 45.0, 31.0, 44.0, 46.0, 49.0, 86.0, 69.0, 81.0, 67.0, 53.0, 36.0, 42.0, 29.0, 32.0, 29.0, 24.0, 21.0, 23.0, 25.0, 10.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.79753494262695, -56.685508728027344, -54.573486328125, -52.46146011352539, -50.34943389892578, -48.23740768432617, -46.12538146972656, -44.01335906982422, -41.90133285522461, -39.789306640625, -37.677284240722656, -35.56525802612305, -33.45323181152344, -31.341205596923828, -29.22918128967285, -27.117156982421875, -25.005130767822266, -22.893104553222656, -20.78108024597168, -18.669055938720703, -16.557029724121094, -14.4450044631958, -12.332979202270508, -10.220953941345215, -8.108928680419922, -5.996903419494629, -3.884878158569336, -1.772852897644043, 0.33917236328125, 2.451197624206543, 4.563222885131836, 6.675248146057129, 8.787277221679688, 10.89930248260498, 13.011327743530273, 15.123353004455566, 17.23537826538086, 19.34740447998047, 21.459428787231445, 23.571453094482422, 25.68347930908203, 27.79550552368164, 29.907529830932617, 32.019554138183594, 34.1315803527832, 36.24360656738281, 38.355628967285156, 40.467655181884766, 42.579681396484375, 44.691707611083984, 46.803733825683594, 48.91575622558594, 51.02778244018555, 53.139808654785156, 55.2518310546875, 57.36385726928711, 59.47588348388672, 61.58790969848633, 63.69993591308594, 65.81195831298828, 67.92398071289062, 70.0360107421875, 72.14803314208984, 74.26006317138672, 76.37208557128906]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 7.0, 6.0, 12.0, 15.0, 20.0, 25.0, 35.0, 41.0, 88.0, 139.0, 255.0, 699.0, 2341.0, 13985.0, 696478.0, 3442882.0, 31230.0, 3901.0, 1120.0, 436.0, 245.0, 121.0, 64.0, 49.0, 28.0, 17.0, 13.0, 10.0, 3.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.921875, -10.450439453125, -9.97900390625, -9.507568359375, -9.0361328125, -8.564697265625, -8.09326171875, -7.621826171875, -7.150390625, -6.678955078125, -6.20751953125, -5.736083984375, -5.2646484375, -4.793212890625, -4.32177734375, -3.850341796875, -3.37890625, -2.907470703125, -2.43603515625, -1.964599609375, -1.4931640625, -1.021728515625, -0.55029296875, -0.078857421875, 0.392578125, 0.864013671875, 1.33544921875, 1.806884765625, 2.2783203125, 2.749755859375, 3.22119140625, 3.692626953125, 4.1640625, 4.635498046875, 5.10693359375, 5.578369140625, 6.0498046875, 6.521240234375, 6.99267578125, 7.464111328125, 7.935546875, 8.406982421875, 8.87841796875, 9.349853515625, 9.8212890625, 10.292724609375, 10.76416015625, 11.235595703125, 11.70703125, 12.178466796875, 12.64990234375, 13.121337890625, 13.5927734375, 14.064208984375, 14.53564453125, 15.007080078125, 15.478515625, 15.949951171875, 16.42138671875, 16.892822265625, 17.3642578125, 17.835693359375, 18.30712890625, 18.778564453125, 19.25]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 20.0, 26.0, 44.0, 65.0, 104.0, 99.0, 152.0, 128.0, 124.0, 91.0, 68.0, 41.0, 28.0, 10.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.92578125, -7.66876220703125, -7.4117431640625, -7.15472412109375, -6.897705078125, -6.64068603515625, -6.3836669921875, -6.12664794921875, -5.86962890625, -5.61260986328125, -5.3555908203125, -5.09857177734375, -4.841552734375, -4.58453369140625, -4.3275146484375, -4.07049560546875, -3.8134765625, -3.55645751953125, -3.2994384765625, -3.04241943359375, -2.785400390625, -2.52838134765625, -2.2713623046875, -2.01434326171875, -1.75732421875, -1.50030517578125, -1.2432861328125, -0.98626708984375, -0.729248046875, -0.47222900390625, -0.2152099609375, 0.04180908203125, 0.298828125, 0.55584716796875, 0.8128662109375, 1.06988525390625, 1.326904296875, 1.58392333984375, 1.8409423828125, 2.09796142578125, 2.35498046875, 2.61199951171875, 2.8690185546875, 3.12603759765625, 3.383056640625, 3.64007568359375, 3.8970947265625, 4.15411376953125, 4.4111328125, 4.66815185546875, 4.9251708984375, 5.18218994140625, 5.439208984375, 5.69622802734375, 5.9532470703125, 6.21026611328125, 6.46728515625, 6.72430419921875, 6.9813232421875, 7.23834228515625, 7.495361328125, 7.75238037109375, 8.0093994140625, 8.26641845703125, 8.5234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 6.0, 14.0, 12.0, 24.0, 55.0, 105.0, 257.0, 658.0, 1686.0, 5124.0, 63821.0, 4030088.0, 82116.0, 6382.0, 2268.0, 876.0, 400.0, 173.0, 100.0, 40.0, 19.0, 17.0, 9.0, 5.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.109375, -23.4111328125, -22.712890625, -22.0146484375, -21.31640625, -20.6181640625, -19.919921875, -19.2216796875, -18.5234375, -17.8251953125, -17.126953125, -16.4287109375, -15.73046875, -15.0322265625, -14.333984375, -13.6357421875, -12.9375, -12.2392578125, -11.541015625, -10.8427734375, -10.14453125, -9.4462890625, -8.748046875, -8.0498046875, -7.3515625, -6.6533203125, -5.955078125, -5.2568359375, -4.55859375, -3.8603515625, -3.162109375, -2.4638671875, -1.765625, -1.0673828125, -0.369140625, 0.3291015625, 1.02734375, 1.7255859375, 2.423828125, 3.1220703125, 3.8203125, 4.5185546875, 5.216796875, 5.9150390625, 6.61328125, 7.3115234375, 8.009765625, 8.7080078125, 9.40625, 10.1044921875, 10.802734375, 11.5009765625, 12.19921875, 12.8974609375, 13.595703125, 14.2939453125, 14.9921875, 15.6904296875, 16.388671875, 17.0869140625, 17.78515625, 18.4833984375, 19.181640625, 19.8798828125, 20.578125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 14.0, 33.0, 47.0, 114.0, 237.0, 658.0, 1266.0, 962.0, 429.0, 140.0, 66.0, 37.0, 16.0, 15.0, 10.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6484375, -13.1375732421875, -12.626708984375, -12.1158447265625, -11.60498046875, -11.0941162109375, -10.583251953125, -10.0723876953125, -9.5615234375, -9.0506591796875, -8.539794921875, -8.0289306640625, -7.51806640625, -7.0072021484375, -6.496337890625, -5.9854736328125, -5.474609375, -4.9637451171875, -4.452880859375, -3.9420166015625, -3.43115234375, -2.9202880859375, -2.409423828125, -1.8985595703125, -1.3876953125, -0.8768310546875, -0.365966796875, 0.1448974609375, 0.65576171875, 1.1666259765625, 1.677490234375, 2.1883544921875, 2.69921875, 3.2100830078125, 3.720947265625, 4.2318115234375, 4.74267578125, 5.2535400390625, 5.764404296875, 6.2752685546875, 6.7861328125, 7.2969970703125, 7.807861328125, 8.3187255859375, 8.82958984375, 9.3404541015625, 9.851318359375, 10.3621826171875, 10.873046875, 11.3839111328125, 11.894775390625, 12.4056396484375, 12.91650390625, 13.4273681640625, 13.938232421875, 14.4490966796875, 14.9599609375, 15.4708251953125, 15.981689453125, 16.4925537109375, 17.00341796875, 17.5142822265625, 18.025146484375, 18.5360107421875, 19.046875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 5.0, 12.0, 23.0, 99.0, 396.0, 336.0, 92.0, 20.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.88661193847656, -124.31285095214844, -117.73908996582031, -111.16532897949219, -104.59156799316406, -98.01780700683594, -91.44403839111328, -84.87027740478516, -78.29651641845703, -71.7227554321289, -65.14899444580078, -58.57522964477539, -52.001468658447266, -45.42770767211914, -38.85394287109375, -32.280181884765625, -25.7064208984375, -19.132659912109375, -12.558897018432617, -5.985134124755859, 0.5886268615722656, 7.162387847900391, 13.736152648925781, 20.309913635253906, 26.88367462158203, 33.457435607910156, 40.03119659423828, 46.60496139526367, 53.1787223815918, 59.75248336791992, 66.32624816894531, 72.90000915527344, 79.47378540039062, 86.04754638671875, 92.62130737304688, 99.195068359375, 105.76882934570312, 112.34259033203125, 118.9163589477539, 125.49011993408203, 132.06387329101562, 138.63763427734375, 145.21139526367188, 151.78515625, 158.35891723632812, 164.93267822265625, 171.50643920898438, 178.0802001953125, 184.6539764404297, 191.2277374267578, 197.80149841308594, 204.37525939941406, 210.9490203857422, 217.5227813720703, 224.0965576171875, 230.67031860351562, 237.24407958984375, 243.81784057617188, 250.3916015625, 256.9653625488281, 263.53912353515625, 270.1128845214844, 276.6866455078125, 283.2604064941406, 289.83416748046875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 9.0, 19.0, 29.0, 50.0, 63.0, 86.0, 115.0, 115.0, 143.0, 111.0, 88.0, 63.0, 49.0, 35.0, 15.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.5604019165039, -80.48870086669922, -77.41700744628906, -74.34530639648438, -71.27360534667969, -68.20191192626953, -65.13021087646484, -62.05851364135742, -58.98681640625, -55.91511917114258, -52.843421936035156, -49.77172088623047, -46.70002365112305, -43.628326416015625, -40.55662536621094, -37.484928131103516, -34.413230895996094, -31.341533660888672, -28.269834518432617, -25.198135375976562, -22.12643814086914, -19.05474090576172, -15.983041763305664, -12.91134262084961, -9.839645385742188, -6.767947196960449, -3.696249008178711, -0.6245508193969727, 2.4471473693847656, 5.518845558166504, 8.590543746948242, 11.662242889404297, 14.733932495117188, 17.80562973022461, 20.877328872680664, 23.94902801513672, 27.02072525024414, 30.092422485351562, 33.16412353515625, 36.23582077026367, 39.307518005371094, 42.379215240478516, 45.45091247558594, 48.522613525390625, 51.59431076049805, 54.66600799560547, 57.737709045410156, 60.80940628051758, 63.881103515625, 66.95280456542969, 70.02449798583984, 73.09619903564453, 76.16789245605469, 79.23959350585938, 82.31129455566406, 85.38299560546875, 88.4546890258789, 91.5263900756836, 94.59808349609375, 97.66978454589844, 100.74148559570312, 103.81317901611328, 106.88488006591797, 109.95657348632812, 113.02827453613281]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 0.0, 8.0, 10.0, 11.0, 21.0, 27.0, 25.0, 35.0, 56.0, 98.0, 156.0, 303.0, 629.0, 1452.0, 5344.0, 31965.0, 495113.0, 474632.0, 30897.0, 5013.0, 1391.0, 603.0, 284.0, 158.0, 100.0, 54.0, 48.0, 39.0, 26.0, 17.0, 13.0, 7.0, 6.0, 6.0, 3.0, 1.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.90625, -12.5028076171875, -12.099365234375, -11.6959228515625, -11.29248046875, -10.8890380859375, -10.485595703125, -10.0821533203125, -9.6787109375, -9.2752685546875, -8.871826171875, -8.4683837890625, -8.06494140625, -7.6614990234375, -7.258056640625, -6.8546142578125, -6.451171875, -6.0477294921875, -5.644287109375, -5.2408447265625, -4.83740234375, -4.4339599609375, -4.030517578125, -3.6270751953125, -3.2236328125, -2.8201904296875, -2.416748046875, -2.0133056640625, -1.60986328125, -1.2064208984375, -0.802978515625, -0.3995361328125, 0.00390625, 0.4073486328125, 0.810791015625, 1.2142333984375, 1.61767578125, 2.0211181640625, 2.424560546875, 2.8280029296875, 3.2314453125, 3.6348876953125, 4.038330078125, 4.4417724609375, 4.84521484375, 5.2486572265625, 5.652099609375, 6.0555419921875, 6.458984375, 6.8624267578125, 7.265869140625, 7.6693115234375, 8.07275390625, 8.4761962890625, 8.879638671875, 9.2830810546875, 9.6865234375, 10.0899658203125, 10.493408203125, 10.8968505859375, 11.30029296875, 11.7037353515625, 12.107177734375, 12.5106201171875, 12.9140625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 7.0, 8.0, 26.0, 28.0, 35.0, 53.0, 76.0, 93.0, 105.0, 121.0, 117.0, 97.0, 67.0, 49.0, 47.0, 41.0, 13.0, 9.0, 8.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.28125, -6.0523681640625, -5.823486328125, -5.5946044921875, -5.36572265625, -5.1368408203125, -4.907958984375, -4.6790771484375, -4.4501953125, -4.2213134765625, -3.992431640625, -3.7635498046875, -3.53466796875, -3.3057861328125, -3.076904296875, -2.8480224609375, -2.619140625, -2.3902587890625, -2.161376953125, -1.9324951171875, -1.70361328125, -1.4747314453125, -1.245849609375, -1.0169677734375, -0.7880859375, -0.5592041015625, -0.330322265625, -0.1014404296875, 0.12744140625, 0.3563232421875, 0.585205078125, 0.8140869140625, 1.04296875, 1.2718505859375, 1.500732421875, 1.7296142578125, 1.95849609375, 2.1873779296875, 2.416259765625, 2.6451416015625, 2.8740234375, 3.1029052734375, 3.331787109375, 3.5606689453125, 3.78955078125, 4.0184326171875, 4.247314453125, 4.4761962890625, 4.705078125, 4.9339599609375, 5.162841796875, 5.3917236328125, 5.62060546875, 5.8494873046875, 6.078369140625, 6.3072509765625, 6.5361328125, 6.7650146484375, 6.993896484375, 7.2227783203125, 7.45166015625, 7.6805419921875, 7.909423828125, 8.1383056640625, 8.3671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 10.0, 23.0, 29.0, 40.0, 50.0, 106.0, 197.0, 378.0, 830.0, 2086.0, 7150.0, 39280.0, 588309.0, 366967.0, 33113.0, 6342.0, 1983.0, 790.0, 364.0, 186.0, 109.0, 64.0, 55.0, 16.0, 20.0, 11.0, 6.0, 8.0, 2.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0234375, -9.6649169921875, -9.306396484375, -8.9478759765625, -8.58935546875, -8.2308349609375, -7.872314453125, -7.5137939453125, -7.1552734375, -6.7967529296875, -6.438232421875, -6.0797119140625, -5.72119140625, -5.3626708984375, -5.004150390625, -4.6456298828125, -4.287109375, -3.9285888671875, -3.570068359375, -3.2115478515625, -2.85302734375, -2.4945068359375, -2.135986328125, -1.7774658203125, -1.4189453125, -1.0604248046875, -0.701904296875, -0.3433837890625, 0.01513671875, 0.3736572265625, 0.732177734375, 1.0906982421875, 1.44921875, 1.8077392578125, 2.166259765625, 2.5247802734375, 2.88330078125, 3.2418212890625, 3.600341796875, 3.9588623046875, 4.3173828125, 4.6759033203125, 5.034423828125, 5.3929443359375, 5.75146484375, 6.1099853515625, 6.468505859375, 6.8270263671875, 7.185546875, 7.5440673828125, 7.902587890625, 8.2611083984375, 8.61962890625, 8.9781494140625, 9.336669921875, 9.6951904296875, 10.0537109375, 10.4122314453125, 10.770751953125, 11.1292724609375, 11.48779296875, 11.8463134765625, 12.204833984375, 12.5633544921875, 12.921875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 10.0, 10.0, 17.0, 19.0, 33.0, 41.0, 54.0, 55.0, 55.0, 62.0, 77.0, 71.0, 68.0, 76.0, 60.0, 44.0, 33.0, 48.0, 34.0, 25.0, 29.0, 22.0, 6.0, 10.0, 7.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.59375, -16.0322265625, -15.470703125, -14.9091796875, -14.34765625, -13.7861328125, -13.224609375, -12.6630859375, -12.1015625, -11.5400390625, -10.978515625, -10.4169921875, -9.85546875, -9.2939453125, -8.732421875, -8.1708984375, -7.609375, -7.0478515625, -6.486328125, -5.9248046875, -5.36328125, -4.8017578125, -4.240234375, -3.6787109375, -3.1171875, -2.5556640625, -1.994140625, -1.4326171875, -0.87109375, -0.3095703125, 0.251953125, 0.8134765625, 1.375, 1.9365234375, 2.498046875, 3.0595703125, 3.62109375, 4.1826171875, 4.744140625, 5.3056640625, 5.8671875, 6.4287109375, 6.990234375, 7.5517578125, 8.11328125, 8.6748046875, 9.236328125, 9.7978515625, 10.359375, 10.9208984375, 11.482421875, 12.0439453125, 12.60546875, 13.1669921875, 13.728515625, 14.2900390625, 14.8515625, 15.4130859375, 15.974609375, 16.5361328125, 17.09765625, 17.6591796875, 18.220703125, 18.7822265625, 19.34375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 10.0, 27.0, 36.0, 112.0, 295.0, 1173.0, 6891.0, 83251.0, 887615.0, 62108.0, 5647.0, 958.0, 253.0, 86.0, 35.0, 19.0, 8.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.39453125, -6.203369140625, -6.01220703125, -5.821044921875, -5.6298828125, -5.438720703125, -5.24755859375, -5.056396484375, -4.865234375, -4.674072265625, -4.48291015625, -4.291748046875, -4.1005859375, -3.909423828125, -3.71826171875, -3.527099609375, -3.3359375, -3.144775390625, -2.95361328125, -2.762451171875, -2.5712890625, -2.380126953125, -2.18896484375, -1.997802734375, -1.806640625, -1.615478515625, -1.42431640625, -1.233154296875, -1.0419921875, -0.850830078125, -0.65966796875, -0.468505859375, -0.27734375, -0.086181640625, 0.10498046875, 0.296142578125, 0.4873046875, 0.678466796875, 0.86962890625, 1.060791015625, 1.251953125, 1.443115234375, 1.63427734375, 1.825439453125, 2.0166015625, 2.207763671875, 2.39892578125, 2.590087890625, 2.78125, 2.972412109375, 3.16357421875, 3.354736328125, 3.5458984375, 3.737060546875, 3.92822265625, 4.119384765625, 4.310546875, 4.501708984375, 4.69287109375, 4.884033203125, 5.0751953125, 5.266357421875, 5.45751953125, 5.648681640625, 5.83984375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 3.0, 10.0, 9.0, 15.0, 27.0, 36.0, 51.0, 69.0, 85.0, 113.0, 109.0, 128.0, 84.0, 61.0, 49.0, 29.0, 13.0, 24.0, 20.0, 14.0, 4.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006747245788574219, -0.0006526336073875427, -0.0006305426359176636, -0.0006084516644477844, -0.0005863606929779053, -0.0005642697215080261, -0.000542178750038147, -0.0005200877785682678, -0.0004979968070983887, -0.0004759058356285095, -0.00045381486415863037, -0.0004317238926887512, -0.00040963292121887207, -0.0003875419497489929, -0.00036545097827911377, -0.0003433600068092346, -0.00032126903533935547, -0.0002991780638694763, -0.00027708709239959717, -0.000254996120929718, -0.00023290514945983887, -0.00021081417798995972, -0.00018872320652008057, -0.00016663223505020142, -0.00014454126358032227, -0.00012245029211044312, -0.00010035932064056396, -7.826834917068481e-05, -5.6177377700805664e-05, -3.4086406230926514e-05, -1.1995434761047363e-05, 1.0095536708831787e-05, 3.218650817871094e-05, 5.427747964859009e-05, 7.636845111846924e-05, 9.845942258834839e-05, 0.00012055039405822754, 0.0001426413655281067, 0.00016473233699798584, 0.000186823308467865, 0.00020891427993774414, 0.0002310052514076233, 0.00025309622287750244, 0.0002751871943473816, 0.00029727816581726074, 0.0003193691372871399, 0.00034146010875701904, 0.0003635510802268982, 0.00038564205169677734, 0.0004077330231666565, 0.00042982399463653564, 0.0004519149661064148, 0.00047400593757629395, 0.0004960969090461731, 0.0005181878805160522, 0.0005402788519859314, 0.0005623698234558105, 0.0005844607949256897, 0.0006065517663955688, 0.000628642737865448, 0.0006507337093353271, 0.0006728246808052063, 0.0006949156522750854, 0.0007170066237449646, 0.0007390975952148438]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 7.0, 11.0, 15.0, 26.0, 16.0, 37.0, 72.0, 122.0, 188.0, 396.0, 803.0, 1736.0, 4096.0, 11167.0, 39672.0, 216333.0, 644211.0, 95866.0, 21794.0, 6800.0, 2669.0, 1205.0, 590.0, 310.0, 152.0, 91.0, 73.0, 33.0, 18.0, 12.0, 9.0, 11.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.3671875, -3.268951416015625, -3.17071533203125, -3.072479248046875, -2.9742431640625, -2.876007080078125, -2.77777099609375, -2.679534912109375, -2.581298828125, -2.483062744140625, -2.38482666015625, -2.286590576171875, -2.1883544921875, -2.090118408203125, -1.99188232421875, -1.893646240234375, -1.79541015625, -1.697174072265625, -1.59893798828125, -1.500701904296875, -1.4024658203125, -1.304229736328125, -1.20599365234375, -1.107757568359375, -1.009521484375, -0.911285400390625, -0.81304931640625, -0.714813232421875, -0.6165771484375, -0.518341064453125, -0.42010498046875, -0.321868896484375, -0.2236328125, -0.125396728515625, -0.02716064453125, 0.071075439453125, 0.1693115234375, 0.267547607421875, 0.36578369140625, 0.464019775390625, 0.562255859375, 0.660491943359375, 0.75872802734375, 0.856964111328125, 0.9552001953125, 1.053436279296875, 1.15167236328125, 1.249908447265625, 1.34814453125, 1.446380615234375, 1.54461669921875, 1.642852783203125, 1.7410888671875, 1.839324951171875, 1.93756103515625, 2.035797119140625, 2.134033203125, 2.232269287109375, 2.33050537109375, 2.428741455078125, 2.5269775390625, 2.625213623046875, 2.72344970703125, 2.821685791015625, 2.919921875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 6.0, 5.0, 8.0, 19.0, 16.0, 18.0, 31.0, 36.0, 30.0, 72.0, 81.0, 102.0, 118.0, 88.0, 102.0, 64.0, 53.0, 39.0, 25.0, 15.0, 13.0, 6.0, 11.0, 8.0, 3.0, 5.0, 8.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11328125, -3.01092529296875, -2.9085693359375, -2.80621337890625, -2.703857421875, -2.60150146484375, -2.4991455078125, -2.39678955078125, -2.29443359375, -2.19207763671875, -2.0897216796875, -1.98736572265625, -1.885009765625, -1.78265380859375, -1.6802978515625, -1.57794189453125, -1.4755859375, -1.37322998046875, -1.2708740234375, -1.16851806640625, -1.066162109375, -0.96380615234375, -0.8614501953125, -0.75909423828125, -0.65673828125, -0.55438232421875, -0.4520263671875, -0.34967041015625, -0.247314453125, -0.14495849609375, -0.0426025390625, 0.05975341796875, 0.162109375, 0.26446533203125, 0.3668212890625, 0.46917724609375, 0.571533203125, 0.67388916015625, 0.7762451171875, 0.87860107421875, 0.98095703125, 1.08331298828125, 1.1856689453125, 1.28802490234375, 1.390380859375, 1.49273681640625, 1.5950927734375, 1.69744873046875, 1.7998046875, 1.90216064453125, 2.0045166015625, 2.10687255859375, 2.209228515625, 2.31158447265625, 2.4139404296875, 2.51629638671875, 2.61865234375, 2.72100830078125, 2.8233642578125, 2.92572021484375, 3.028076171875, 3.13043212890625, 3.2327880859375, 3.33514404296875, 3.4375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 8.0, 15.0, 38.0, 84.0, 217.0, 344.0, 146.0, 72.0, 33.0, 10.0, 5.0, 7.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.04656219482422, -104.08979034423828, -101.13301849365234, -98.1762466430664, -95.21947479248047, -92.26270294189453, -89.30592346191406, -86.34915161132812, -83.39237976074219, -80.43560791015625, -77.47883605957031, -74.52206420898438, -71.56529235839844, -68.6085205078125, -65.65174865722656, -62.69497299194336, -59.73820495605469, -56.78143310546875, -53.82466125488281, -50.867889404296875, -47.91111755371094, -44.954345703125, -41.9975700378418, -39.04079818725586, -36.08402633666992, -33.127254486083984, -30.170482635498047, -27.213708877563477, -24.25693702697754, -21.3001651763916, -18.34339141845703, -15.386619567871094, -12.429855346679688, -9.47308349609375, -6.516310691833496, -3.559537887573242, -0.6027660369873047, 2.354005813598633, 5.310779571533203, 8.26755142211914, 11.224323272705078, 14.181095123291016, 17.137866973876953, 20.094640731811523, 23.05141258239746, 26.0081844329834, 28.96495819091797, 31.921730041503906, 34.878501892089844, 37.83527374267578, 40.79204559326172, 43.748817443847656, 46.705589294433594, 49.66236114501953, 52.619136810302734, 55.57590866088867, 58.53268051147461, 61.48945236206055, 64.44622802734375, 67.40299987792969, 70.35977172851562, 73.31654357910156, 76.2733154296875, 79.23008728027344, 82.18685913085938]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 7.0, 5.0, 16.0, 25.0, 43.0, 51.0, 68.0, 74.0, 115.0, 150.0, 149.0, 75.0, 62.0, 52.0, 32.0, 28.0, 17.0, 14.0, 13.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.08719635009766, -107.681396484375, -104.27558898925781, -100.86978912353516, -97.46398162841797, -94.05818176269531, -90.65237426757812, -87.24657440185547, -83.84077453613281, -80.43497467041016, -77.02916717529297, -73.62336730957031, -70.21755981445312, -66.81175994873047, -63.40595626831055, -60.000152587890625, -56.59434509277344, -53.188541412353516, -49.782737731933594, -46.37693786621094, -42.97113037109375, -39.565330505371094, -36.15952682495117, -32.75372314453125, -29.347919464111328, -25.942115783691406, -22.536312103271484, -19.130510330200195, -15.724706649780273, -12.318902969360352, -8.913101196289062, -5.507297515869141, -2.1014862060546875, 1.3043169975280762, 4.71012020111084, 8.115922927856445, 11.521726608276367, 14.927530288696289, 18.333332061767578, 21.7391357421875, 25.144939422607422, 28.550743103027344, 31.956546783447266, 35.36235046386719, 38.768150329589844, 42.17395782470703, 45.57975769042969, 48.98556137084961, 52.39136505126953, 55.79716873168945, 59.202972412109375, 62.60877227783203, 66.01457977294922, 69.42037963867188, 72.82618713378906, 76.23198699951172, 79.63778686523438, 83.04358673095703, 86.44939422607422, 89.85519409179688, 93.26100158691406, 96.66680145263672, 100.07260131835938, 103.47840881347656, 106.88421630859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 3.0, 8.0, 1.0, 8.0, 4.0, 13.0, 17.0, 24.0, 54.0, 62.0, 113.0, 190.0, 399.0, 942.0, 3357.0, 18943.0, 797485.0, 3316752.0, 48150.0, 5417.0, 1341.0, 494.0, 201.0, 111.0, 64.0, 39.0, 29.0, 23.0, 17.0, 5.0, 2.0, 0.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.984375, -10.6204833984375, -10.256591796875, -9.8927001953125, -9.52880859375, -9.1649169921875, -8.801025390625, -8.4371337890625, -8.0732421875, -7.7093505859375, -7.345458984375, -6.9815673828125, -6.61767578125, -6.2537841796875, -5.889892578125, -5.5260009765625, -5.162109375, -4.7982177734375, -4.434326171875, -4.0704345703125, -3.70654296875, -3.3426513671875, -2.978759765625, -2.6148681640625, -2.2509765625, -1.8870849609375, -1.523193359375, -1.1593017578125, -0.79541015625, -0.4315185546875, -0.067626953125, 0.2962646484375, 0.66015625, 1.0240478515625, 1.387939453125, 1.7518310546875, 2.11572265625, 2.4796142578125, 2.843505859375, 3.2073974609375, 3.5712890625, 3.9351806640625, 4.299072265625, 4.6629638671875, 5.02685546875, 5.3907470703125, 5.754638671875, 6.1185302734375, 6.482421875, 6.8463134765625, 7.210205078125, 7.5740966796875, 7.93798828125, 8.3018798828125, 8.665771484375, 9.0296630859375, 9.3935546875, 9.7574462890625, 10.121337890625, 10.4852294921875, 10.84912109375, 11.2130126953125, 11.576904296875, 11.9407958984375, 12.3046875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 8.0, 7.0, 12.0, 22.0, 19.0, 26.0, 41.0, 28.0, 42.0, 67.0, 65.0, 64.0, 71.0, 63.0, 78.0, 72.0, 72.0, 49.0, 36.0, 40.0, 28.0, 21.0, 17.0, 20.0, 13.0, 7.0, 9.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.484375, -5.337371826171875, -5.19036865234375, -5.043365478515625, -4.8963623046875, -4.749359130859375, -4.60235595703125, -4.455352783203125, -4.308349609375, -4.161346435546875, -4.01434326171875, -3.867340087890625, -3.7203369140625, -3.573333740234375, -3.42633056640625, -3.279327392578125, -3.13232421875, -2.985321044921875, -2.83831787109375, -2.691314697265625, -2.5443115234375, -2.397308349609375, -2.25030517578125, -2.103302001953125, -1.956298828125, -1.809295654296875, -1.66229248046875, -1.515289306640625, -1.3682861328125, -1.221282958984375, -1.07427978515625, -0.927276611328125, -0.7802734375, -0.633270263671875, -0.48626708984375, -0.339263916015625, -0.1922607421875, -0.045257568359375, 0.10174560546875, 0.248748779296875, 0.395751953125, 0.542755126953125, 0.68975830078125, 0.836761474609375, 0.9837646484375, 1.130767822265625, 1.27777099609375, 1.424774169921875, 1.57177734375, 1.718780517578125, 1.86578369140625, 2.012786865234375, 2.1597900390625, 2.306793212890625, 2.45379638671875, 2.600799560546875, 2.747802734375, 2.894805908203125, 3.04180908203125, 3.188812255859375, 3.3358154296875, 3.482818603515625, 3.62982177734375, 3.776824951171875, 3.923828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 5.0, 2.0, 5.0, 10.0, 6.0, 8.0, 16.0, 26.0, 31.0, 44.0, 122.0, 262.0, 738.0, 3479.0, 35294.0, 3529818.0, 609016.0, 12762.0, 1798.0, 475.0, 165.0, 72.0, 46.0, 31.0, 15.0, 15.0, 7.0, 3.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.984375, -13.515380859375, -13.04638671875, -12.577392578125, -12.1083984375, -11.639404296875, -11.17041015625, -10.701416015625, -10.232421875, -9.763427734375, -9.29443359375, -8.825439453125, -8.3564453125, -7.887451171875, -7.41845703125, -6.949462890625, -6.48046875, -6.011474609375, -5.54248046875, -5.073486328125, -4.6044921875, -4.135498046875, -3.66650390625, -3.197509765625, -2.728515625, -2.259521484375, -1.79052734375, -1.321533203125, -0.8525390625, -0.383544921875, 0.08544921875, 0.554443359375, 1.0234375, 1.492431640625, 1.96142578125, 2.430419921875, 2.8994140625, 3.368408203125, 3.83740234375, 4.306396484375, 4.775390625, 5.244384765625, 5.71337890625, 6.182373046875, 6.6513671875, 7.120361328125, 7.58935546875, 8.058349609375, 8.52734375, 8.996337890625, 9.46533203125, 9.934326171875, 10.4033203125, 10.872314453125, 11.34130859375, 11.810302734375, 12.279296875, 12.748291015625, 13.21728515625, 13.686279296875, 14.1552734375, 14.624267578125, 15.09326171875, 15.562255859375, 16.03125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 12.0, 11.0, 17.0, 15.0, 31.0, 39.0, 63.0, 111.0, 193.0, 302.0, 490.0, 703.0, 687.0, 564.0, 312.0, 181.0, 116.0, 69.0, 50.0, 36.0, 18.0, 11.0, 11.0, 8.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.0234375, -7.7811279296875, -7.538818359375, -7.2965087890625, -7.05419921875, -6.8118896484375, -6.569580078125, -6.3272705078125, -6.0849609375, -5.8426513671875, -5.600341796875, -5.3580322265625, -5.11572265625, -4.8734130859375, -4.631103515625, -4.3887939453125, -4.146484375, -3.9041748046875, -3.661865234375, -3.4195556640625, -3.17724609375, -2.9349365234375, -2.692626953125, -2.4503173828125, -2.2080078125, -1.9656982421875, -1.723388671875, -1.4810791015625, -1.23876953125, -0.9964599609375, -0.754150390625, -0.5118408203125, -0.26953125, -0.0272216796875, 0.215087890625, 0.4573974609375, 0.69970703125, 0.9420166015625, 1.184326171875, 1.4266357421875, 1.6689453125, 1.9112548828125, 2.153564453125, 2.3958740234375, 2.63818359375, 2.8804931640625, 3.122802734375, 3.3651123046875, 3.607421875, 3.8497314453125, 4.092041015625, 4.3343505859375, 4.57666015625, 4.8189697265625, 5.061279296875, 5.3035888671875, 5.5458984375, 5.7882080078125, 6.030517578125, 6.2728271484375, 6.51513671875, 6.7574462890625, 6.999755859375, 7.2420654296875, 7.484375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 16.0, 28.0, 51.0, 90.0, 178.0, 202.0, 191.0, 116.0, 63.0, 31.0, 13.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-118.08943176269531, -115.71792602539062, -113.34642028808594, -110.97492218017578, -108.6034164428711, -106.2319107055664, -103.86040496826172, -101.48889923095703, -99.11740112304688, -96.74589538574219, -94.3743896484375, -92.00289154052734, -89.63138580322266, -87.25988006591797, -84.88837432861328, -82.5168685913086, -80.1453628540039, -77.77385711669922, -75.40235137939453, -73.03085327148438, -70.65934753417969, -68.287841796875, -65.91633605957031, -63.544830322265625, -61.1733283996582, -58.801822662353516, -56.430320739746094, -54.058815002441406, -51.68730926513672, -49.3158073425293, -46.94430160522461, -44.57279968261719, -42.20128631591797, -39.82978057861328, -37.45827865600586, -35.08677291870117, -32.71527099609375, -30.343765258789062, -27.972259521484375, -25.60075569152832, -23.229251861572266, -20.85774803161621, -18.486244201660156, -16.11473846435547, -13.743234634399414, -11.37173080444336, -9.000226020812988, -6.628721237182617, -4.2572174072265625, -1.8857131004333496, 0.4857912063598633, 2.857295513153076, 5.228799819946289, 7.600303649902344, 9.971808433532715, 12.343313217163086, 14.71481704711914, 17.086320877075195, 19.45782470703125, 21.829330444335938, 24.200834274291992, 26.572338104248047, 28.943843841552734, 31.31534767150879, 33.686851501464844]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 7.0, 8.0, 7.0, 6.0, 6.0, 12.0, 12.0, 16.0, 13.0, 26.0, 30.0, 21.0, 34.0, 26.0, 28.0, 47.0, 34.0, 36.0, 47.0, 34.0, 49.0, 52.0, 43.0, 52.0, 43.0, 24.0, 39.0, 41.0, 24.0, 32.0, 23.0, 21.0, 14.0, 13.0, 8.0, 18.0, 10.0, 12.0, 7.0, 8.0, 3.0, 3.0, 0.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-22.146305084228516, -21.35926628112793, -20.572229385375977, -19.78519058227539, -18.998153686523438, -18.21111488342285, -17.4240779876709, -16.637039184570312, -15.85000228881836, -15.06296443939209, -14.27592658996582, -13.48888874053955, -12.701850891113281, -11.914813041687012, -11.127775192260742, -10.340736389160156, -9.553698539733887, -8.766660690307617, -7.979622840881348, -7.192584991455078, -6.405547142028809, -5.618509292602539, -4.831470966339111, -4.044433116912842, -3.2573952674865723, -2.4703574180603027, -1.6833194494247437, -0.8962814807891846, -0.10924363136291504, 0.6777942180633545, 1.4648323059082031, 2.2518701553344727, 3.038908004760742, 3.8259458541870117, 4.612983703613281, 5.400021553039551, 6.18705940246582, 6.97409725189209, 7.761135578155518, 8.548173904418945, 9.335210800170898, 10.122248649597168, 10.909286499023438, 11.696324348449707, 12.483362197875977, 13.270400047302246, 14.057437896728516, 14.844476699829102, 15.631514549255371, 16.41855239868164, 17.205591201782227, 17.99262809753418, 18.779666900634766, 19.56670379638672, 20.353742599487305, 21.140779495239258, 21.927818298339844, 22.71485710144043, 23.501893997192383, 24.28893280029297, 25.075969696044922, 25.863008499145508, 26.65004539489746, 27.437084197998047, 28.22412109375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 13.0, 12.0, 24.0, 44.0, 72.0, 170.0, 485.0, 2014.0, 20448.0, 757071.0, 258026.0, 8367.0, 1205.0, 315.0, 134.0, 60.0, 41.0, 17.0, 16.0, 6.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.28125, -19.7452392578125, -19.209228515625, -18.6732177734375, -18.13720703125, -17.6011962890625, -17.065185546875, -16.5291748046875, -15.9931640625, -15.4571533203125, -14.921142578125, -14.3851318359375, -13.84912109375, -13.3131103515625, -12.777099609375, -12.2410888671875, -11.705078125, -11.1690673828125, -10.633056640625, -10.0970458984375, -9.56103515625, -9.0250244140625, -8.489013671875, -7.9530029296875, -7.4169921875, -6.8809814453125, -6.344970703125, -5.8089599609375, -5.27294921875, -4.7369384765625, -4.200927734375, -3.6649169921875, -3.12890625, -2.5928955078125, -2.056884765625, -1.5208740234375, -0.98486328125, -0.4488525390625, 0.087158203125, 0.6231689453125, 1.1591796875, 1.6951904296875, 2.231201171875, 2.7672119140625, 3.30322265625, 3.8392333984375, 4.375244140625, 4.9112548828125, 5.447265625, 5.9832763671875, 6.519287109375, 7.0552978515625, 7.59130859375, 8.1273193359375, 8.663330078125, 9.1993408203125, 9.7353515625, 10.2713623046875, 10.807373046875, 11.3433837890625, 11.87939453125, 12.4154052734375, 12.951416015625, 13.4874267578125, 14.0234375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 1.0, 8.0, 5.0, 11.0, 11.0, 13.0, 11.0, 10.0, 24.0, 26.0, 24.0, 30.0, 36.0, 33.0, 50.0, 47.0, 30.0, 54.0, 46.0, 40.0, 47.0, 36.0, 53.0, 42.0, 43.0, 43.0, 28.0, 29.0, 19.0, 29.0, 27.0, 17.0, 12.0, 11.0, 9.0, 9.0, 9.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.26953125, -3.166015625, -3.0625, -2.958984375, -2.85546875, -2.751953125, -2.6484375, -2.544921875, -2.44140625, -2.337890625, -2.234375, -2.130859375, -2.02734375, -1.923828125, -1.8203125, -1.716796875, -1.61328125, -1.509765625, -1.40625, -1.302734375, -1.19921875, -1.095703125, -0.9921875, -0.888671875, -0.78515625, -0.681640625, -0.578125, -0.474609375, -0.37109375, -0.267578125, -0.1640625, -0.060546875, 0.04296875, 0.146484375, 0.25, 0.353515625, 0.45703125, 0.560546875, 0.6640625, 0.767578125, 0.87109375, 0.974609375, 1.078125, 1.181640625, 1.28515625, 1.388671875, 1.4921875, 1.595703125, 1.69921875, 1.802734375, 1.90625, 2.009765625, 2.11328125, 2.216796875, 2.3203125, 2.423828125, 2.52734375, 2.630859375, 2.734375, 2.837890625, 2.94140625, 3.044921875, 3.1484375, 3.251953125, 3.35546875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 9.0, 9.0, 11.0, 10.0, 18.0, 35.0, 34.0, 61.0, 75.0, 109.0, 153.0, 293.0, 532.0, 1033.0, 2400.0, 7369.0, 32431.0, 271395.0, 663208.0, 52728.0, 10619.0, 3211.0, 1242.0, 597.0, 335.0, 197.0, 136.0, 83.0, 44.0, 42.0, 35.0, 19.0, 17.0, 14.0, 13.0, 12.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-10.0625, -9.7677001953125, -9.472900390625, -9.1781005859375, -8.88330078125, -8.5885009765625, -8.293701171875, -7.9989013671875, -7.7041015625, -7.4093017578125, -7.114501953125, -6.8197021484375, -6.52490234375, -6.2301025390625, -5.935302734375, -5.6405029296875, -5.345703125, -5.0509033203125, -4.756103515625, -4.4613037109375, -4.16650390625, -3.8717041015625, -3.576904296875, -3.2821044921875, -2.9873046875, -2.6925048828125, -2.397705078125, -2.1029052734375, -1.80810546875, -1.5133056640625, -1.218505859375, -0.9237060546875, -0.62890625, -0.3341064453125, -0.039306640625, 0.2554931640625, 0.55029296875, 0.8450927734375, 1.139892578125, 1.4346923828125, 1.7294921875, 2.0242919921875, 2.319091796875, 2.6138916015625, 2.90869140625, 3.2034912109375, 3.498291015625, 3.7930908203125, 4.087890625, 4.3826904296875, 4.677490234375, 4.9722900390625, 5.26708984375, 5.5618896484375, 5.856689453125, 6.1514892578125, 6.4462890625, 6.7410888671875, 7.035888671875, 7.3306884765625, 7.62548828125, 7.9202880859375, 8.215087890625, 8.5098876953125, 8.8046875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 6.0, 1.0, 5.0, 3.0, 9.0, 16.0, 9.0, 10.0, 13.0, 25.0, 32.0, 30.0, 37.0, 52.0, 51.0, 51.0, 53.0, 65.0, 59.0, 46.0, 51.0, 64.0, 61.0, 42.0, 33.0, 35.0, 25.0, 17.0, 20.0, 19.0, 14.0, 10.0, 7.0, 7.0, 6.0, 6.0, 4.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8125, -14.35888671875, -13.9052734375, -13.45166015625, -12.998046875, -12.54443359375, -12.0908203125, -11.63720703125, -11.18359375, -10.72998046875, -10.2763671875, -9.82275390625, -9.369140625, -8.91552734375, -8.4619140625, -8.00830078125, -7.5546875, -7.10107421875, -6.6474609375, -6.19384765625, -5.740234375, -5.28662109375, -4.8330078125, -4.37939453125, -3.92578125, -3.47216796875, -3.0185546875, -2.56494140625, -2.111328125, -1.65771484375, -1.2041015625, -0.75048828125, -0.296875, 0.15673828125, 0.6103515625, 1.06396484375, 1.517578125, 1.97119140625, 2.4248046875, 2.87841796875, 3.33203125, 3.78564453125, 4.2392578125, 4.69287109375, 5.146484375, 5.60009765625, 6.0537109375, 6.50732421875, 6.9609375, 7.41455078125, 7.8681640625, 8.32177734375, 8.775390625, 9.22900390625, 9.6826171875, 10.13623046875, 10.58984375, 11.04345703125, 11.4970703125, 11.95068359375, 12.404296875, 12.85791015625, 13.3115234375, 13.76513671875, 14.21875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 12.0, 16.0, 14.0, 21.0, 46.0, 92.0, 169.0, 386.0, 1071.0, 3548.0, 14711.0, 125439.0, 844980.0, 46521.0, 8101.0, 2124.0, 704.0, 279.0, 122.0, 71.0, 32.0, 28.0, 17.0, 7.0, 5.0, 11.0, 4.0, 0.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.5625, -5.41339111328125, -5.2642822265625, -5.11517333984375, -4.966064453125, -4.81695556640625, -4.6678466796875, -4.51873779296875, -4.36962890625, -4.22052001953125, -4.0714111328125, -3.92230224609375, -3.773193359375, -3.62408447265625, -3.4749755859375, -3.32586669921875, -3.1767578125, -3.02764892578125, -2.8785400390625, -2.72943115234375, -2.580322265625, -2.43121337890625, -2.2821044921875, -2.13299560546875, -1.98388671875, -1.83477783203125, -1.6856689453125, -1.53656005859375, -1.387451171875, -1.23834228515625, -1.0892333984375, -0.94012451171875, -0.791015625, -0.64190673828125, -0.4927978515625, -0.34368896484375, -0.194580078125, -0.04547119140625, 0.1036376953125, 0.25274658203125, 0.40185546875, 0.55096435546875, 0.7000732421875, 0.84918212890625, 0.998291015625, 1.14739990234375, 1.2965087890625, 1.44561767578125, 1.5947265625, 1.74383544921875, 1.8929443359375, 2.04205322265625, 2.191162109375, 2.34027099609375, 2.4893798828125, 2.63848876953125, 2.78759765625, 2.93670654296875, 3.0858154296875, 3.23492431640625, 3.384033203125, 3.53314208984375, 3.6822509765625, 3.83135986328125, 3.98046875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 7.0, 7.0, 13.0, 19.0, 22.0, 47.0, 58.0, 89.0, 123.0, 183.0, 142.0, 90.0, 51.0, 27.0, 23.0, 22.0, 17.0, 13.0, 6.0, 9.0, 6.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0009393692016601562, -0.000912882387638092, -0.0008863955736160278, -0.0008599087595939636, -0.0008334219455718994, -0.0008069351315498352, -0.000780448317527771, -0.0007539615035057068, -0.0007274746894836426, -0.0007009878754615784, -0.0006745010614395142, -0.00064801424741745, -0.0006215274333953857, -0.0005950406193733215, -0.0005685538053512573, -0.0005420669913291931, -0.0005155801773071289, -0.0004890933632850647, -0.0004626065492630005, -0.0004361197352409363, -0.00040963292121887207, -0.00038314610719680786, -0.00035665929317474365, -0.00033017247915267944, -0.00030368566513061523, -0.000277198851108551, -0.0002507120370864868, -0.0002242252230644226, -0.0001977384090423584, -0.0001712515950202942, -0.00014476478099822998, -0.00011827796697616577, -9.179115295410156e-05, -6.530433893203735e-05, -3.8817524909973145e-05, -1.2330710887908936e-05, 1.4156103134155273e-05, 4.064291715621948e-05, 6.712973117828369e-05, 9.36165452003479e-05, 0.00012010335922241211, 0.00014659017324447632, 0.00017307698726654053, 0.00019956380128860474, 0.00022605061531066895, 0.00025253742933273315, 0.00027902424335479736, 0.00030551105737686157, 0.0003319978713989258, 0.00035848468542099, 0.0003849714994430542, 0.0004114583134651184, 0.0004379451274871826, 0.0004644319415092468, 0.000490918755531311, 0.0005174055695533752, 0.0005438923835754395, 0.0005703791975975037, 0.0005968660116195679, 0.0006233528256416321, 0.0006498396396636963, 0.0006763264536857605, 0.0007028132677078247, 0.0007293000817298889, 0.0007557868957519531]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 3.0, 9.0, 13.0, 10.0, 26.0, 30.0, 40.0, 67.0, 118.0, 222.0, 348.0, 714.0, 1550.0, 4074.0, 12677.0, 58722.0, 755827.0, 177276.0, 25470.0, 6815.0, 2315.0, 1057.0, 448.0, 273.0, 163.0, 96.0, 63.0, 40.0, 26.0, 20.0, 13.0, 10.0, 7.0, 2.0, 6.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.671875, -3.552459716796875, -3.43304443359375, -3.313629150390625, -3.1942138671875, -3.074798583984375, -2.95538330078125, -2.835968017578125, -2.716552734375, -2.597137451171875, -2.47772216796875, -2.358306884765625, -2.2388916015625, -2.119476318359375, -2.00006103515625, -1.880645751953125, -1.76123046875, -1.641815185546875, -1.52239990234375, -1.402984619140625, -1.2835693359375, -1.164154052734375, -1.04473876953125, -0.925323486328125, -0.805908203125, -0.686492919921875, -0.56707763671875, -0.447662353515625, -0.3282470703125, -0.208831787109375, -0.08941650390625, 0.029998779296875, 0.1494140625, 0.268829345703125, 0.38824462890625, 0.507659912109375, 0.6270751953125, 0.746490478515625, 0.86590576171875, 0.985321044921875, 1.104736328125, 1.224151611328125, 1.34356689453125, 1.462982177734375, 1.5823974609375, 1.701812744140625, 1.82122802734375, 1.940643310546875, 2.06005859375, 2.179473876953125, 2.29888916015625, 2.418304443359375, 2.5377197265625, 2.657135009765625, 2.77655029296875, 2.895965576171875, 3.015380859375, 3.134796142578125, 3.25421142578125, 3.373626708984375, 3.4930419921875, 3.612457275390625, 3.73187255859375, 3.851287841796875, 3.970703125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 13.0, 6.0, 19.0, 28.0, 27.0, 48.0, 61.0, 134.0, 170.0, 185.0, 97.0, 60.0, 39.0, 28.0, 19.0, 14.0, 7.0, 12.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.76171875, -4.625274658203125, -4.48883056640625, -4.352386474609375, -4.2159423828125, -4.079498291015625, -3.94305419921875, -3.806610107421875, -3.670166015625, -3.533721923828125, -3.39727783203125, -3.260833740234375, -3.1243896484375, -2.987945556640625, -2.85150146484375, -2.715057373046875, -2.57861328125, -2.442169189453125, -2.30572509765625, -2.169281005859375, -2.0328369140625, -1.896392822265625, -1.75994873046875, -1.623504638671875, -1.487060546875, -1.350616455078125, -1.21417236328125, -1.077728271484375, -0.9412841796875, -0.804840087890625, -0.66839599609375, -0.531951904296875, -0.3955078125, -0.259063720703125, -0.12261962890625, 0.013824462890625, 0.1502685546875, 0.286712646484375, 0.42315673828125, 0.559600830078125, 0.696044921875, 0.832489013671875, 0.96893310546875, 1.105377197265625, 1.2418212890625, 1.378265380859375, 1.51470947265625, 1.651153564453125, 1.78759765625, 1.924041748046875, 2.06048583984375, 2.196929931640625, 2.3333740234375, 2.469818115234375, 2.60626220703125, 2.742706298828125, 2.879150390625, 3.015594482421875, 3.15203857421875, 3.288482666015625, 3.4249267578125, 3.561370849609375, 3.69781494140625, 3.834259033203125, 3.970703125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 6.0, 14.0, 16.0, 33.0, 93.0, 134.0, 334.0, 142.0, 95.0, 39.0, 42.0, 15.0, 6.0, 5.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-92.75296020507812, -90.52107238769531, -88.28919219970703, -86.05730438232422, -83.8254165649414, -81.59353637695312, -79.36164855957031, -77.1297607421875, -74.89788055419922, -72.6659927368164, -70.43411254882812, -68.20222473144531, -65.9703369140625, -63.73845672607422, -61.506568908691406, -59.27468490600586, -57.04279708862305, -54.8109130859375, -52.57902526855469, -50.34714126586914, -48.115257263183594, -45.88336944580078, -43.651485443115234, -41.41960144042969, -39.187713623046875, -36.95582962036133, -34.723941802978516, -32.49205780029297, -30.260173797607422, -28.028287887573242, -25.796401977539062, -23.564517974853516, -21.332630157470703, -19.100744247436523, -16.868860244750977, -14.636974334716797, -12.405089378356934, -10.17320442199707, -7.941318511962891, -5.709433555603027, -3.477548599243164, -1.2456634044647217, 0.9862217903137207, 3.218107223510742, 5.4499921798706055, 7.681877136230469, 9.913763046264648, 12.145648002624512, 14.377532958984375, 16.609418869018555, 18.8413028717041, 21.07318878173828, 23.305072784423828, 25.536958694458008, 27.768844604492188, 30.000728607177734, 32.23261260986328, 34.46449661254883, 36.69638442993164, 38.92826843261719, 41.160152435302734, 43.39203643798828, 45.623924255371094, 47.85580825805664, 50.08769607543945]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 10.0, 3.0, 7.0, 6.0, 8.0, 4.0, 10.0, 13.0, 28.0, 18.0, 16.0, 30.0, 23.0, 23.0, 36.0, 26.0, 31.0, 35.0, 64.0, 104.0, 82.0, 74.0, 41.0, 31.0, 35.0, 28.0, 38.0, 25.0, 13.0, 23.0, 12.0, 13.0, 15.0, 16.0, 17.0, 11.0, 8.0, 3.0, 7.0, 2.0, 6.0, 3.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-54.47209930419922, -52.918243408203125, -51.3643913269043, -49.81053924560547, -48.256683349609375, -46.70282745361328, -45.14897537231445, -43.595123291015625, -42.04126739501953, -40.48741149902344, -38.93355941772461, -37.37970733642578, -35.82585144042969, -34.271995544433594, -32.718143463134766, -31.164289474487305, -29.610435485839844, -28.056581497192383, -26.502727508544922, -24.94887351989746, -23.39501953125, -21.84116554260254, -20.287311553955078, -18.733457565307617, -17.179603576660156, -15.625749588012695, -14.071895599365234, -12.518041610717773, -10.964187622070312, -9.410333633422852, -7.856479644775391, -6.30262565612793, -4.748771667480469, -3.194917678833008, -1.6410636901855469, -0.08720970153808594, 1.466644287109375, 3.020498275756836, 4.574352264404297, 6.128206253051758, 7.682060241699219, 9.23591423034668, 10.78976821899414, 12.343622207641602, 13.897476196289062, 15.451330184936523, 17.005184173583984, 18.559038162231445, 20.112892150878906, 21.666746139526367, 23.220600128173828, 24.77445411682129, 26.32830810546875, 27.88216209411621, 29.436016082763672, 30.989870071411133, 32.543724060058594, 34.09757995605469, 35.651432037353516, 37.205284118652344, 38.75914001464844, 40.31299591064453, 41.86684799194336, 43.42070007324219, 44.97455596923828]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 13.0, 17.0, 26.0, 45.0, 93.0, 158.0, 293.0, 793.0, 2418.0, 11951.0, 262018.0, 3776635.0, 128598.0, 8275.0, 1776.0, 632.0, 240.0, 123.0, 65.0, 30.0, 20.0, 15.0, 8.0, 9.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.40625, -13.0479736328125, -12.689697265625, -12.3314208984375, -11.97314453125, -11.6148681640625, -11.256591796875, -10.8983154296875, -10.5400390625, -10.1817626953125, -9.823486328125, -9.4652099609375, -9.10693359375, -8.7486572265625, -8.390380859375, -8.0321044921875, -7.673828125, -7.3155517578125, -6.957275390625, -6.5989990234375, -6.24072265625, -5.8824462890625, -5.524169921875, -5.1658935546875, -4.8076171875, -4.4493408203125, -4.091064453125, -3.7327880859375, -3.37451171875, -3.0162353515625, -2.657958984375, -2.2996826171875, -1.94140625, -1.5831298828125, -1.224853515625, -0.8665771484375, -0.50830078125, -0.1500244140625, 0.208251953125, 0.5665283203125, 0.9248046875, 1.2830810546875, 1.641357421875, 1.9996337890625, 2.35791015625, 2.7161865234375, 3.074462890625, 3.4327392578125, 3.791015625, 4.1492919921875, 4.507568359375, 4.8658447265625, 5.22412109375, 5.5823974609375, 5.940673828125, 6.2989501953125, 6.6572265625, 7.0155029296875, 7.373779296875, 7.7320556640625, 8.09033203125, 8.4486083984375, 8.806884765625, 9.1651611328125, 9.5234375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 7.0, 4.0, 10.0, 16.0, 27.0, 22.0, 26.0, 28.0, 51.0, 63.0, 70.0, 80.0, 66.0, 89.0, 59.0, 83.0, 45.0, 64.0, 39.0, 41.0, 22.0, 28.0, 25.0, 16.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.59375, -3.43292236328125, -3.2720947265625, -3.11126708984375, -2.950439453125, -2.78961181640625, -2.6287841796875, -2.46795654296875, -2.30712890625, -2.14630126953125, -1.9854736328125, -1.82464599609375, -1.663818359375, -1.50299072265625, -1.3421630859375, -1.18133544921875, -1.0205078125, -0.85968017578125, -0.6988525390625, -0.53802490234375, -0.377197265625, -0.21636962890625, -0.0555419921875, 0.10528564453125, 0.26611328125, 0.42694091796875, 0.5877685546875, 0.74859619140625, 0.909423828125, 1.07025146484375, 1.2310791015625, 1.39190673828125, 1.552734375, 1.71356201171875, 1.8743896484375, 2.03521728515625, 2.196044921875, 2.35687255859375, 2.5177001953125, 2.67852783203125, 2.83935546875, 3.00018310546875, 3.1610107421875, 3.32183837890625, 3.482666015625, 3.64349365234375, 3.8043212890625, 3.96514892578125, 4.1259765625, 4.28680419921875, 4.4476318359375, 4.60845947265625, 4.769287109375, 4.93011474609375, 5.0909423828125, 5.25177001953125, 5.41259765625, 5.57342529296875, 5.7342529296875, 5.89508056640625, 6.055908203125, 6.21673583984375, 6.3775634765625, 6.53839111328125, 6.69921875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 5.0, 10.0, 13.0, 15.0, 18.0, 42.0, 75.0, 173.0, 376.0, 1432.0, 9907.0, 455607.0, 3689104.0, 33535.0, 2879.0, 623.0, 236.0, 106.0, 49.0, 28.0, 20.0, 11.0, 7.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6171875, -8.1441650390625, -7.671142578125, -7.1981201171875, -6.72509765625, -6.2520751953125, -5.779052734375, -5.3060302734375, -4.8330078125, -4.3599853515625, -3.886962890625, -3.4139404296875, -2.94091796875, -2.4678955078125, -1.994873046875, -1.5218505859375, -1.048828125, -0.5758056640625, -0.102783203125, 0.3702392578125, 0.84326171875, 1.3162841796875, 1.789306640625, 2.2623291015625, 2.7353515625, 3.2083740234375, 3.681396484375, 4.1544189453125, 4.62744140625, 5.1004638671875, 5.573486328125, 6.0465087890625, 6.51953125, 6.9925537109375, 7.465576171875, 7.9385986328125, 8.41162109375, 8.8846435546875, 9.357666015625, 9.8306884765625, 10.3037109375, 10.7767333984375, 11.249755859375, 11.7227783203125, 12.19580078125, 12.6688232421875, 13.141845703125, 13.6148681640625, 14.087890625, 14.5609130859375, 15.033935546875, 15.5069580078125, 15.97998046875, 16.4530029296875, 16.926025390625, 17.3990478515625, 17.8720703125, 18.3450927734375, 18.818115234375, 19.2911376953125, 19.76416015625, 20.2371826171875, 20.710205078125, 21.1832275390625, 21.65625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 7.0, 13.0, 16.0, 19.0, 25.0, 40.0, 61.0, 109.0, 186.0, 280.0, 458.0, 579.0, 660.0, 537.0, 366.0, 223.0, 171.0, 103.0, 63.0, 45.0, 24.0, 23.0, 17.0, 11.0, 11.0, 5.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.203125, -7.98345947265625, -7.7637939453125, -7.54412841796875, -7.324462890625, -7.10479736328125, -6.8851318359375, -6.66546630859375, -6.44580078125, -6.22613525390625, -6.0064697265625, -5.78680419921875, -5.567138671875, -5.34747314453125, -5.1278076171875, -4.90814208984375, -4.6884765625, -4.46881103515625, -4.2491455078125, -4.02947998046875, -3.809814453125, -3.59014892578125, -3.3704833984375, -3.15081787109375, -2.93115234375, -2.71148681640625, -2.4918212890625, -2.27215576171875, -2.052490234375, -1.83282470703125, -1.6131591796875, -1.39349365234375, -1.173828125, -0.95416259765625, -0.7344970703125, -0.51483154296875, -0.295166015625, -0.07550048828125, 0.1441650390625, 0.36383056640625, 0.58349609375, 0.80316162109375, 1.0228271484375, 1.24249267578125, 1.462158203125, 1.68182373046875, 1.9014892578125, 2.12115478515625, 2.3408203125, 2.56048583984375, 2.7801513671875, 2.99981689453125, 3.219482421875, 3.43914794921875, 3.6588134765625, 3.87847900390625, 4.09814453125, 4.31781005859375, 4.5374755859375, 4.75714111328125, 4.976806640625, 5.19647216796875, 5.4161376953125, 5.63580322265625, 5.85546875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 8.0, 13.0, 19.0, 42.0, 84.0, 121.0, 187.0, 181.0, 126.0, 94.0, 49.0, 32.0, 14.0, 5.0, 4.0, 6.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.7541732788086, -72.94255828857422, -71.13094329833984, -69.31932067871094, -67.50770568847656, -65.69609069824219, -63.88447570800781, -62.07286071777344, -60.26124572753906, -58.44963073730469, -56.63801193237305, -54.82639694213867, -53.0147819519043, -51.203163146972656, -49.39154815673828, -47.579933166503906, -45.768314361572266, -43.95669937133789, -42.14508056640625, -40.333465576171875, -38.5218505859375, -36.710235595703125, -34.898616790771484, -33.08700180053711, -31.2753849029541, -29.463768005371094, -27.65215301513672, -25.84053611755371, -24.028919219970703, -22.217304229736328, -20.40568733215332, -18.594070434570312, -16.782455444335938, -14.970839500427246, -13.159223556518555, -11.347606658935547, -9.535990715026855, -7.724374771118164, -5.912757873535156, -4.101141929626465, -2.2895259857177734, -0.47790980339050293, 1.3337063789367676, 3.145322799682617, 4.956938743591309, 6.7685546875, 8.580171585083008, 10.3917875289917, 12.20340347290039, 14.015019416809082, 15.826635360717773, 17.63825225830078, 19.449867248535156, 21.261484146118164, 23.073101043701172, 24.884716033935547, 26.696332931518555, 28.507949829101562, 30.319564819335938, 32.13117980957031, 33.94279861450195, 35.75441360473633, 37.56603240966797, 39.377647399902344, 41.18926239013672]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 2.0, 5.0, 3.0, 11.0, 9.0, 11.0, 9.0, 12.0, 18.0, 26.0, 16.0, 29.0, 21.0, 31.0, 39.0, 53.0, 23.0, 51.0, 58.0, 59.0, 45.0, 39.0, 52.0, 40.0, 49.0, 35.0, 41.0, 25.0, 26.0, 24.0, 22.0, 20.0, 12.0, 13.0, 10.0, 10.0, 9.0, 11.0, 8.0, 2.0, 4.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.491119384765625, -25.68136978149414, -24.87162208557129, -24.061872482299805, -23.252124786376953, -22.44237518310547, -21.632625579833984, -20.8228759765625, -20.01312828063965, -19.203378677368164, -18.393630981445312, -17.583881378173828, -16.774131774902344, -15.964384078979492, -15.154634475708008, -14.34488582611084, -13.535137176513672, -12.725388526916504, -11.915639877319336, -11.105890274047852, -10.296141624450684, -9.486392974853516, -8.676643371582031, -7.866894721984863, -7.057146072387695, -6.247397422790527, -5.437648296356201, -4.627899169921875, -3.818150520324707, -3.008401870727539, -2.198652744293213, -1.3889036178588867, -0.5791549682617188, 0.23059391975402832, 1.0403428077697754, 1.8500916957855225, 2.6598405838012695, 3.4695892333984375, 4.279338359832764, 5.08908748626709, 5.898836135864258, 6.708584785461426, 7.518333911895752, 8.328083038330078, 9.137831687927246, 9.947580337524414, 10.757329940795898, 11.567078590393066, 12.376827239990234, 13.186575889587402, 13.99632453918457, 14.806074142456055, 15.615822792053223, 16.42557144165039, 17.235321044921875, 18.04507064819336, 18.85481834411621, 19.664567947387695, 20.474315643310547, 21.28406524658203, 22.093814849853516, 22.903562545776367, 23.71331214904785, 24.523059844970703, 25.332809448242188]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 5.0, 3.0, 8.0, 5.0, 14.0, 21.0, 31.0, 49.0, 69.0, 109.0, 208.0, 392.0, 749.0, 1961.0, 6460.0, 26964.0, 158765.0, 646286.0, 167801.0, 28173.0, 6663.0, 2101.0, 787.0, 367.0, 183.0, 124.0, 74.0, 53.0, 42.0, 30.0, 11.0, 13.0, 5.0, 5.0, 8.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.625, -8.351318359375, -8.07763671875, -7.803955078125, -7.5302734375, -7.256591796875, -6.98291015625, -6.709228515625, -6.435546875, -6.161865234375, -5.88818359375, -5.614501953125, -5.3408203125, -5.067138671875, -4.79345703125, -4.519775390625, -4.24609375, -3.972412109375, -3.69873046875, -3.425048828125, -3.1513671875, -2.877685546875, -2.60400390625, -2.330322265625, -2.056640625, -1.782958984375, -1.50927734375, -1.235595703125, -0.9619140625, -0.688232421875, -0.41455078125, -0.140869140625, 0.1328125, 0.406494140625, 0.68017578125, 0.953857421875, 1.2275390625, 1.501220703125, 1.77490234375, 2.048583984375, 2.322265625, 2.595947265625, 2.86962890625, 3.143310546875, 3.4169921875, 3.690673828125, 3.96435546875, 4.238037109375, 4.51171875, 4.785400390625, 5.05908203125, 5.332763671875, 5.6064453125, 5.880126953125, 6.15380859375, 6.427490234375, 6.701171875, 6.974853515625, 7.24853515625, 7.522216796875, 7.7958984375, 8.069580078125, 8.34326171875, 8.616943359375, 8.890625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 3.0, 11.0, 5.0, 9.0, 11.0, 18.0, 17.0, 22.0, 34.0, 33.0, 34.0, 45.0, 53.0, 57.0, 55.0, 55.0, 63.0, 45.0, 64.0, 62.0, 40.0, 47.0, 28.0, 31.0, 29.0, 22.0, 20.0, 23.0, 17.0, 12.0, 7.0, 12.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.779296875, -3.652496337890625, -3.52569580078125, -3.398895263671875, -3.2720947265625, -3.145294189453125, -3.01849365234375, -2.891693115234375, -2.764892578125, -2.638092041015625, -2.51129150390625, -2.384490966796875, -2.2576904296875, -2.130889892578125, -2.00408935546875, -1.877288818359375, -1.75048828125, -1.623687744140625, -1.49688720703125, -1.370086669921875, -1.2432861328125, -1.116485595703125, -0.98968505859375, -0.862884521484375, -0.736083984375, -0.609283447265625, -0.48248291015625, -0.355682373046875, -0.2288818359375, -0.102081298828125, 0.02471923828125, 0.151519775390625, 0.2783203125, 0.405120849609375, 0.53192138671875, 0.658721923828125, 0.7855224609375, 0.912322998046875, 1.03912353515625, 1.165924072265625, 1.292724609375, 1.419525146484375, 1.54632568359375, 1.673126220703125, 1.7999267578125, 1.926727294921875, 2.05352783203125, 2.180328369140625, 2.30712890625, 2.433929443359375, 2.56072998046875, 2.687530517578125, 2.8143310546875, 2.941131591796875, 3.06793212890625, 3.194732666015625, 3.321533203125, 3.448333740234375, 3.57513427734375, 3.701934814453125, 3.8287353515625, 3.955535888671875, 4.08233642578125, 4.209136962890625, 4.3359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 8.0, 8.0, 5.0, 11.0, 24.0, 22.0, 39.0, 54.0, 82.0, 122.0, 244.0, 481.0, 863.0, 2058.0, 6408.0, 33711.0, 630184.0, 334978.0, 29728.0, 5875.0, 1847.0, 756.0, 397.0, 221.0, 144.0, 90.0, 56.0, 42.0, 25.0, 23.0, 14.0, 11.0, 11.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.2265625, -11.8665771484375, -11.506591796875, -11.1466064453125, -10.78662109375, -10.4266357421875, -10.066650390625, -9.7066650390625, -9.3466796875, -8.9866943359375, -8.626708984375, -8.2667236328125, -7.90673828125, -7.5467529296875, -7.186767578125, -6.8267822265625, -6.466796875, -6.1068115234375, -5.746826171875, -5.3868408203125, -5.02685546875, -4.6668701171875, -4.306884765625, -3.9468994140625, -3.5869140625, -3.2269287109375, -2.866943359375, -2.5069580078125, -2.14697265625, -1.7869873046875, -1.427001953125, -1.0670166015625, -0.70703125, -0.3470458984375, 0.012939453125, 0.3729248046875, 0.73291015625, 1.0928955078125, 1.452880859375, 1.8128662109375, 2.1728515625, 2.5328369140625, 2.892822265625, 3.2528076171875, 3.61279296875, 3.9727783203125, 4.332763671875, 4.6927490234375, 5.052734375, 5.4127197265625, 5.772705078125, 6.1326904296875, 6.49267578125, 6.8526611328125, 7.212646484375, 7.5726318359375, 7.9326171875, 8.2926025390625, 8.652587890625, 9.0125732421875, 9.37255859375, 9.7325439453125, 10.092529296875, 10.4525146484375, 10.8125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 7.0, 9.0, 14.0, 11.0, 20.0, 20.0, 32.0, 29.0, 38.0, 53.0, 59.0, 49.0, 68.0, 64.0, 59.0, 73.0, 67.0, 58.0, 45.0, 45.0, 30.0, 37.0, 19.0, 15.0, 21.0, 12.0, 7.0, 9.0, 9.0, 3.0, 2.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.84375, -17.3095703125, -16.775390625, -16.2412109375, -15.70703125, -15.1728515625, -14.638671875, -14.1044921875, -13.5703125, -13.0361328125, -12.501953125, -11.9677734375, -11.43359375, -10.8994140625, -10.365234375, -9.8310546875, -9.296875, -8.7626953125, -8.228515625, -7.6943359375, -7.16015625, -6.6259765625, -6.091796875, -5.5576171875, -5.0234375, -4.4892578125, -3.955078125, -3.4208984375, -2.88671875, -2.3525390625, -1.818359375, -1.2841796875, -0.75, -0.2158203125, 0.318359375, 0.8525390625, 1.38671875, 1.9208984375, 2.455078125, 2.9892578125, 3.5234375, 4.0576171875, 4.591796875, 5.1259765625, 5.66015625, 6.1943359375, 6.728515625, 7.2626953125, 7.796875, 8.3310546875, 8.865234375, 9.3994140625, 9.93359375, 10.4677734375, 11.001953125, 11.5361328125, 12.0703125, 12.6044921875, 13.138671875, 13.6728515625, 14.20703125, 14.7412109375, 15.275390625, 15.8095703125, 16.34375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 11.0, 10.0, 12.0, 11.0, 21.0, 22.0, 30.0, 60.0, 86.0, 125.0, 254.0, 527.0, 1365.0, 4400.0, 18747.0, 202264.0, 779181.0, 31820.0, 6220.0, 1867.0, 717.0, 306.0, 153.0, 91.0, 63.0, 42.0, 36.0, 27.0, 17.0, 14.0, 9.0, 7.0, 6.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.927734375, -3.788177490234375, -3.64862060546875, -3.509063720703125, -3.3695068359375, -3.229949951171875, -3.09039306640625, -2.950836181640625, -2.811279296875, -2.671722412109375, -2.53216552734375, -2.392608642578125, -2.2530517578125, -2.113494873046875, -1.97393798828125, -1.834381103515625, -1.69482421875, -1.555267333984375, -1.41571044921875, -1.276153564453125, -1.1365966796875, -0.997039794921875, -0.85748291015625, -0.717926025390625, -0.578369140625, -0.438812255859375, -0.29925537109375, -0.159698486328125, -0.0201416015625, 0.119415283203125, 0.25897216796875, 0.398529052734375, 0.5380859375, 0.677642822265625, 0.81719970703125, 0.956756591796875, 1.0963134765625, 1.235870361328125, 1.37542724609375, 1.514984130859375, 1.654541015625, 1.794097900390625, 1.93365478515625, 2.073211669921875, 2.2127685546875, 2.352325439453125, 2.49188232421875, 2.631439208984375, 2.77099609375, 2.910552978515625, 3.05010986328125, 3.189666748046875, 3.3292236328125, 3.468780517578125, 3.60833740234375, 3.747894287109375, 3.887451171875, 4.027008056640625, 4.16656494140625, 4.306121826171875, 4.4456787109375, 4.585235595703125, 4.72479248046875, 4.864349365234375, 5.00390625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 14.0, 5.0, 11.0, 5.0, 12.0, 15.0, 27.0, 34.0, 75.0, 108.0, 197.0, 201.0, 104.0, 62.0, 36.0, 26.0, 13.0, 11.0, 6.0, 4.0, 2.0, 5.0, 7.0, 7.0, 5.0, 0.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00092315673828125, -0.0008932650089263916, -0.0008633732795715332, -0.0008334815502166748, -0.0008035898208618164, -0.000773698091506958, -0.0007438063621520996, -0.0007139146327972412, -0.0006840229034423828, -0.0006541311740875244, -0.000624239444732666, -0.0005943477153778076, -0.0005644559860229492, -0.0005345642566680908, -0.0005046725273132324, -0.000474780797958374, -0.0004448890686035156, -0.0004149973392486572, -0.00038510560989379883, -0.00035521388053894043, -0.00032532215118408203, -0.00029543042182922363, -0.00026553869247436523, -0.00023564696311950684, -0.00020575523376464844, -0.00017586350440979004, -0.00014597177505493164, -0.00011608004570007324, -8.618831634521484e-05, -5.6296586990356445e-05, -2.6404857635498047e-05, 3.4868717193603516e-06, 3.337860107421875e-05, 6.327033042907715e-05, 9.316205978393555e-05, 0.00012305378913879395, 0.00015294551849365234, 0.00018283724784851074, 0.00021272897720336914, 0.00024262070655822754, 0.00027251243591308594, 0.00030240416526794434, 0.00033229589462280273, 0.00036218762397766113, 0.00039207935333251953, 0.00042197108268737793, 0.00045186281204223633, 0.0004817545413970947, 0.0005116462707519531, 0.0005415380001068115, 0.0005714297294616699, 0.0006013214588165283, 0.0006312131881713867, 0.0006611049175262451, 0.0006909966468811035, 0.0007208883762359619, 0.0007507801055908203, 0.0007806718349456787, 0.0008105635643005371, 0.0008404552936553955, 0.0008703470230102539, 0.0009002387523651123, 0.0009301304817199707, 0.0009600222110748291, 0.0009899139404296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 5.0, 6.0, 8.0, 12.0, 24.0, 37.0, 48.0, 76.0, 102.0, 128.0, 211.0, 340.0, 658.0, 1280.0, 2666.0, 6031.0, 16809.0, 66922.0, 661865.0, 229144.0, 41299.0, 12052.0, 4430.0, 1998.0, 983.0, 515.0, 322.0, 206.0, 111.0, 69.0, 62.0, 32.0, 21.0, 19.0, 14.0, 12.0, 12.0, 7.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.447265625, -2.367919921875, -2.28857421875, -2.209228515625, -2.1298828125, -2.050537109375, -1.97119140625, -1.891845703125, -1.8125, -1.733154296875, -1.65380859375, -1.574462890625, -1.4951171875, -1.415771484375, -1.33642578125, -1.257080078125, -1.177734375, -1.098388671875, -1.01904296875, -0.939697265625, -0.8603515625, -0.781005859375, -0.70166015625, -0.622314453125, -0.54296875, -0.463623046875, -0.38427734375, -0.304931640625, -0.2255859375, -0.146240234375, -0.06689453125, 0.012451171875, 0.091796875, 0.171142578125, 0.25048828125, 0.329833984375, 0.4091796875, 0.488525390625, 0.56787109375, 0.647216796875, 0.7265625, 0.805908203125, 0.88525390625, 0.964599609375, 1.0439453125, 1.123291015625, 1.20263671875, 1.281982421875, 1.361328125, 1.440673828125, 1.52001953125, 1.599365234375, 1.6787109375, 1.758056640625, 1.83740234375, 1.916748046875, 1.99609375, 2.075439453125, 2.15478515625, 2.234130859375, 2.3134765625, 2.392822265625, 2.47216796875, 2.551513671875, 2.630859375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 4.0, 8.0, 9.0, 10.0, 12.0, 10.0, 21.0, 26.0, 35.0, 36.0, 49.0, 57.0, 73.0, 95.0, 96.0, 87.0, 72.0, 55.0, 48.0, 37.0, 34.0, 29.0, 21.0, 14.0, 9.0, 8.0, 2.0, 2.0, 5.0, 5.0, 7.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.208984375, -2.1357421875, -2.0625, -1.9892578125, -1.916015625, -1.8427734375, -1.76953125, -1.6962890625, -1.623046875, -1.5498046875, -1.4765625, -1.4033203125, -1.330078125, -1.2568359375, -1.18359375, -1.1103515625, -1.037109375, -0.9638671875, -0.890625, -0.8173828125, -0.744140625, -0.6708984375, -0.59765625, -0.5244140625, -0.451171875, -0.3779296875, -0.3046875, -0.2314453125, -0.158203125, -0.0849609375, -0.01171875, 0.0615234375, 0.134765625, 0.2080078125, 0.28125, 0.3544921875, 0.427734375, 0.5009765625, 0.57421875, 0.6474609375, 0.720703125, 0.7939453125, 0.8671875, 0.9404296875, 1.013671875, 1.0869140625, 1.16015625, 1.2333984375, 1.306640625, 1.3798828125, 1.453125, 1.5263671875, 1.599609375, 1.6728515625, 1.74609375, 1.8193359375, 1.892578125, 1.9658203125, 2.0390625, 2.1123046875, 2.185546875, 2.2587890625, 2.33203125, 2.4052734375, 2.478515625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 12.0, 16.0, 77.0, 319.0, 433.0, 93.0, 24.0, 11.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-194.21267700195312, -188.82701110839844, -183.4413604736328, -178.05569458007812, -172.6700439453125, -167.2843780517578, -161.89871215820312, -156.5130615234375, -151.1273956298828, -145.74172973632812, -140.3560791015625, -134.9704132080078, -129.58474731445312, -124.1990966796875, -118.81343078613281, -113.42777252197266, -108.0421142578125, -102.65645599365234, -97.27079772949219, -91.8851318359375, -86.49947357177734, -81.11381530761719, -75.7281494140625, -70.34249114990234, -64.95683288574219, -59.57117462158203, -54.18551254272461, -48.79985046386719, -43.41419219970703, -38.028533935546875, -32.64287185668945, -27.25720977783203, -21.871536254882812, -16.485876083374023, -11.100215911865234, -5.714555740356445, -0.32889556884765625, 5.056764602661133, 10.442424774169922, 15.828086853027344, 21.2137451171875, 26.59940528869629, 31.985065460205078, 37.3707275390625, 42.756385803222656, 48.14204406738281, 53.527706146240234, 58.913368225097656, 64.29902648925781, 69.68468475341797, 75.07034301757812, 80.45600891113281, 85.84166717529297, 91.22732543945312, 96.61299133300781, 101.99864959716797, 107.38430786132812, 112.76996612548828, 118.15562438964844, 123.54129028320312, 128.92694091796875, 134.31260681152344, 139.69827270507812, 145.08392333984375, 150.46958923339844]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 3.0, 10.0, 13.0, 10.0, 7.0, 15.0, 13.0, 27.0, 21.0, 22.0, 27.0, 36.0, 40.0, 33.0, 53.0, 107.0, 138.0, 93.0, 45.0, 44.0, 42.0, 38.0, 25.0, 28.0, 19.0, 21.0, 17.0, 11.0, 8.0, 8.0, 6.0, 6.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.70012664794922, -55.795955657958984, -53.89178466796875, -51.987613677978516, -50.08344268798828, -48.17927169799805, -46.27510070800781, -44.37092971801758, -42.466758728027344, -40.56258773803711, -38.658416748046875, -36.75424575805664, -34.850074768066406, -32.94590377807617, -31.041732788085938, -29.137561798095703, -27.2333927154541, -25.329221725463867, -23.425050735473633, -21.5208797454834, -19.616708755493164, -17.712539672851562, -15.808367729187012, -13.904196739196777, -12.000025749206543, -10.095854759216309, -8.191683769226074, -6.287513256072998, -4.383342266082764, -2.4791717529296875, -0.5750007629394531, 1.3291702270507812, 3.2333412170410156, 5.13751220703125, 7.041683197021484, 8.945854187011719, 10.850025177001953, 12.754195213317871, 14.658366203308105, 16.562538146972656, 18.46670913696289, 20.370880126953125, 22.27505111694336, 24.179222106933594, 26.083393096923828, 27.987564086914062, 29.891735076904297, 31.79590606689453, 33.7000732421875, 35.604244232177734, 37.50841522216797, 39.4125862121582, 41.31675720214844, 43.22092819213867, 45.125099182128906, 47.02927017211914, 48.933441162109375, 50.83761215209961, 52.741783142089844, 54.64595413208008, 56.55012512207031, 58.45429611206055, 60.35846710205078, 62.262638092041016, 64.16680908203125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 11.0, 12.0, 11.0, 14.0, 21.0, 33.0, 47.0, 80.0, 123.0, 215.0, 354.0, 627.0, 1300.0, 3342.0, 10723.0, 61036.0, 946600.0, 2906557.0, 229861.0, 24279.0, 5409.0, 1815.0, 814.0, 390.0, 217.0, 132.0, 79.0, 52.0, 39.0, 24.0, 15.0, 14.0, 9.0, 3.0, 4.0, 7.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.6796875, -10.3267822265625, -9.973876953125, -9.6209716796875, -9.26806640625, -8.9151611328125, -8.562255859375, -8.2093505859375, -7.8564453125, -7.5035400390625, -7.150634765625, -6.7977294921875, -6.44482421875, -6.0919189453125, -5.739013671875, -5.3861083984375, -5.033203125, -4.6802978515625, -4.327392578125, -3.9744873046875, -3.62158203125, -3.2686767578125, -2.915771484375, -2.5628662109375, -2.2099609375, -1.8570556640625, -1.504150390625, -1.1512451171875, -0.79833984375, -0.4454345703125, -0.092529296875, 0.2603759765625, 0.61328125, 0.9661865234375, 1.319091796875, 1.6719970703125, 2.02490234375, 2.3778076171875, 2.730712890625, 3.0836181640625, 3.4365234375, 3.7894287109375, 4.142333984375, 4.4952392578125, 4.84814453125, 5.2010498046875, 5.553955078125, 5.9068603515625, 6.259765625, 6.6126708984375, 6.965576171875, 7.3184814453125, 7.67138671875, 8.0242919921875, 8.377197265625, 8.7301025390625, 9.0830078125, 9.4359130859375, 9.788818359375, 10.1417236328125, 10.49462890625, 10.8475341796875, 11.200439453125, 11.5533447265625, 11.90625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 11.0, 7.0, 8.0, 16.0, 21.0, 27.0, 29.0, 27.0, 43.0, 49.0, 48.0, 46.0, 60.0, 64.0, 71.0, 69.0, 58.0, 54.0, 56.0, 46.0, 48.0, 36.0, 20.0, 21.0, 15.0, 19.0, 14.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.228515625, -3.085968017578125, -2.94342041015625, -2.800872802734375, -2.6583251953125, -2.515777587890625, -2.37322998046875, -2.230682373046875, -2.088134765625, -1.945587158203125, -1.80303955078125, -1.660491943359375, -1.5179443359375, -1.375396728515625, -1.23284912109375, -1.090301513671875, -0.94775390625, -0.805206298828125, -0.66265869140625, -0.520111083984375, -0.3775634765625, -0.235015869140625, -0.09246826171875, 0.050079345703125, 0.192626953125, 0.335174560546875, 0.47772216796875, 0.620269775390625, 0.7628173828125, 0.905364990234375, 1.04791259765625, 1.190460205078125, 1.3330078125, 1.475555419921875, 1.61810302734375, 1.760650634765625, 1.9031982421875, 2.045745849609375, 2.18829345703125, 2.330841064453125, 2.473388671875, 2.615936279296875, 2.75848388671875, 2.901031494140625, 3.0435791015625, 3.186126708984375, 3.32867431640625, 3.471221923828125, 3.61376953125, 3.756317138671875, 3.89886474609375, 4.041412353515625, 4.1839599609375, 4.326507568359375, 4.46905517578125, 4.611602783203125, 4.754150390625, 4.896697998046875, 5.03924560546875, 5.181793212890625, 5.3243408203125, 5.466888427734375, 5.60943603515625, 5.751983642578125, 5.89453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 8.0, 5.0, 1.0, 6.0, 14.0, 14.0, 23.0, 25.0, 60.0, 83.0, 149.0, 331.0, 742.0, 2443.0, 14946.0, 3826519.0, 339138.0, 6959.0, 1593.0, 593.0, 265.0, 145.0, 68.0, 47.0, 32.0, 16.0, 13.0, 10.0, 8.0, 9.0, 0.0, 3.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.625, -27.55810546875, -26.4912109375, -25.42431640625, -24.357421875, -23.29052734375, -22.2236328125, -21.15673828125, -20.08984375, -19.02294921875, -17.9560546875, -16.88916015625, -15.822265625, -14.75537109375, -13.6884765625, -12.62158203125, -11.5546875, -10.48779296875, -9.4208984375, -8.35400390625, -7.287109375, -6.22021484375, -5.1533203125, -4.08642578125, -3.01953125, -1.95263671875, -0.8857421875, 0.18115234375, 1.248046875, 2.31494140625, 3.3818359375, 4.44873046875, 5.515625, 6.58251953125, 7.6494140625, 8.71630859375, 9.783203125, 10.85009765625, 11.9169921875, 12.98388671875, 14.05078125, 15.11767578125, 16.1845703125, 17.25146484375, 18.318359375, 19.38525390625, 20.4521484375, 21.51904296875, 22.5859375, 23.65283203125, 24.7197265625, 25.78662109375, 26.853515625, 27.92041015625, 28.9873046875, 30.05419921875, 31.12109375, 32.18798828125, 33.2548828125, 34.32177734375, 35.388671875, 36.45556640625, 37.5224609375, 38.58935546875, 39.65625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 20.0, 21.0, 28.0, 51.0, 84.0, 195.0, 364.0, 660.0, 1015.0, 768.0, 415.0, 191.0, 112.0, 56.0, 32.0, 13.0, 12.0, 14.0, 3.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.296875, -17.677978515625, -17.05908203125, -16.440185546875, -15.8212890625, -15.202392578125, -14.58349609375, -13.964599609375, -13.345703125, -12.726806640625, -12.10791015625, -11.489013671875, -10.8701171875, -10.251220703125, -9.63232421875, -9.013427734375, -8.39453125, -7.775634765625, -7.15673828125, -6.537841796875, -5.9189453125, -5.300048828125, -4.68115234375, -4.062255859375, -3.443359375, -2.824462890625, -2.20556640625, -1.586669921875, -0.9677734375, -0.348876953125, 0.27001953125, 0.888916015625, 1.5078125, 2.126708984375, 2.74560546875, 3.364501953125, 3.9833984375, 4.602294921875, 5.22119140625, 5.840087890625, 6.458984375, 7.077880859375, 7.69677734375, 8.315673828125, 8.9345703125, 9.553466796875, 10.17236328125, 10.791259765625, 11.41015625, 12.029052734375, 12.64794921875, 13.266845703125, 13.8857421875, 14.504638671875, 15.12353515625, 15.742431640625, 16.361328125, 16.980224609375, 17.59912109375, 18.218017578125, 18.8369140625, 19.455810546875, 20.07470703125, 20.693603515625, 21.3125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 15.0, 22.0, 47.0, 139.0, 273.0, 249.0, 141.0, 38.0, 25.0, 17.0, 10.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-270.3529052734375, -263.3999328613281, -256.44696044921875, -249.4939727783203, -242.54100036621094, -235.5880126953125, -228.63504028320312, -221.68206787109375, -214.72909545898438, -207.776123046875, -200.82313537597656, -193.8701629638672, -186.9171905517578, -179.96420288085938, -173.01123046875, -166.05825805664062, -159.1052703857422, -152.1522979736328, -145.19931030273438, -138.246337890625, -131.29336547851562, -124.34038543701172, -117.38740539550781, -110.43443298339844, -103.48145294189453, -96.52847290039062, -89.57550048828125, -82.62252044677734, -75.66954040527344, -68.71656799316406, -61.763587951660156, -54.810611724853516, -47.85765075683594, -40.9046745300293, -33.951698303222656, -26.99871826171875, -20.04574203491211, -13.092765808105469, -6.1397857666015625, 0.8131904602050781, 7.766166687011719, 14.719143867492676, 21.672121047973633, 28.625099182128906, 35.57807540893555, 42.53105163574219, 49.484031677246094, 56.437007904052734, 63.389984130859375, 70.34296417236328, 77.29593658447266, 84.24891662597656, 91.20188903808594, 98.15486907958984, 105.10784912109375, 112.06082153320312, 119.01380157470703, 125.96678161621094, 132.9197540283203, 139.87274169921875, 146.82571411132812, 153.7786865234375, 160.73165893554688, 167.6846466064453, 174.6376190185547]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 9.0, 4.0, 4.0, 6.0, 7.0, 14.0, 10.0, 17.0, 12.0, 19.0, 29.0, 35.0, 45.0, 49.0, 57.0, 68.0, 60.0, 58.0, 59.0, 80.0, 55.0, 50.0, 34.0, 47.0, 24.0, 22.0, 18.0, 25.0, 22.0, 14.0, 13.0, 9.0, 5.0, 6.0, 4.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.27967834472656, -73.81600952148438, -71.35233306884766, -68.88865661621094, -66.42498779296875, -63.9613151550293, -61.497642517089844, -59.03396987915039, -56.57029724121094, -54.106624603271484, -51.64295196533203, -49.17927932739258, -46.715606689453125, -44.25193405151367, -41.78826141357422, -39.324588775634766, -36.86091613769531, -34.39724349975586, -31.933570861816406, -29.469898223876953, -27.0062255859375, -24.542552947998047, -22.078880310058594, -19.61520767211914, -17.151535034179688, -14.687862396240234, -12.224189758300781, -9.760517120361328, -7.296844482421875, -4.833171844482422, -2.3694992065429688, 0.09417343139648438, 2.5578460693359375, 5.021518707275391, 7.485191345214844, 9.948863983154297, 12.41253662109375, 14.876209259033203, 17.339881896972656, 19.80355453491211, 22.267227172851562, 24.730899810791016, 27.19457244873047, 29.658245086669922, 32.121917724609375, 34.58559036254883, 37.04926300048828, 39.512935638427734, 41.97660827636719, 44.44028091430664, 46.903953552246094, 49.36762619018555, 51.831298828125, 54.29497146606445, 56.758644104003906, 59.22231674194336, 61.68598937988281, 64.149658203125, 66.61333465576172, 69.07701110839844, 71.54067993164062, 74.00434875488281, 76.46802520751953, 78.93170166015625, 81.39537048339844]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 1.0, 5.0, 9.0, 16.0, 25.0, 41.0, 60.0, 115.0, 236.0, 532.0, 1353.0, 3936.0, 15528.0, 106663.0, 759486.0, 135391.0, 18052.0, 4524.0, 1455.0, 572.0, 250.0, 131.0, 69.0, 30.0, 28.0, 14.0, 10.0, 9.0, 4.0, 4.0, 0.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7578125, -10.3809814453125, -10.004150390625, -9.6273193359375, -9.25048828125, -8.8736572265625, -8.496826171875, -8.1199951171875, -7.7431640625, -7.3663330078125, -6.989501953125, -6.6126708984375, -6.23583984375, -5.8590087890625, -5.482177734375, -5.1053466796875, -4.728515625, -4.3516845703125, -3.974853515625, -3.5980224609375, -3.22119140625, -2.8443603515625, -2.467529296875, -2.0906982421875, -1.7138671875, -1.3370361328125, -0.960205078125, -0.5833740234375, -0.20654296875, 0.1702880859375, 0.547119140625, 0.9239501953125, 1.30078125, 1.6776123046875, 2.054443359375, 2.4312744140625, 2.80810546875, 3.1849365234375, 3.561767578125, 3.9385986328125, 4.3154296875, 4.6922607421875, 5.069091796875, 5.4459228515625, 5.82275390625, 6.1995849609375, 6.576416015625, 6.9532470703125, 7.330078125, 7.7069091796875, 8.083740234375, 8.4605712890625, 8.83740234375, 9.2142333984375, 9.591064453125, 9.9678955078125, 10.3447265625, 10.7215576171875, 11.098388671875, 11.4752197265625, 11.85205078125, 12.2288818359375, 12.605712890625, 12.9825439453125, 13.359375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 9.0, 11.0, 17.0, 22.0, 28.0, 24.0, 34.0, 38.0, 70.0, 55.0, 67.0, 65.0, 76.0, 73.0, 62.0, 64.0, 51.0, 56.0, 35.0, 51.0, 23.0, 21.0, 13.0, 5.0, 5.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.15625, -7.93304443359375, -7.7098388671875, -7.48663330078125, -7.263427734375, -7.04022216796875, -6.8170166015625, -6.59381103515625, -6.37060546875, -6.14739990234375, -5.9241943359375, -5.70098876953125, -5.477783203125, -5.25457763671875, -5.0313720703125, -4.80816650390625, -4.5849609375, -4.36175537109375, -4.1385498046875, -3.91534423828125, -3.692138671875, -3.46893310546875, -3.2457275390625, -3.02252197265625, -2.79931640625, -2.57611083984375, -2.3529052734375, -2.12969970703125, -1.906494140625, -1.68328857421875, -1.4600830078125, -1.23687744140625, -1.013671875, -0.79046630859375, -0.5672607421875, -0.34405517578125, -0.120849609375, 0.10235595703125, 0.3255615234375, 0.54876708984375, 0.77197265625, 0.99517822265625, 1.2183837890625, 1.44158935546875, 1.664794921875, 1.88800048828125, 2.1112060546875, 2.33441162109375, 2.5576171875, 2.78082275390625, 3.0040283203125, 3.22723388671875, 3.450439453125, 3.67364501953125, 3.8968505859375, 4.12005615234375, 4.34326171875, 4.56646728515625, 4.7896728515625, 5.01287841796875, 5.236083984375, 5.45928955078125, 5.6824951171875, 5.90570068359375, 6.12890625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 7.0, 17.0, 23.0, 28.0, 36.0, 56.0, 85.0, 145.0, 257.0, 474.0, 1170.0, 3202.0, 12743.0, 97505.0, 872892.0, 47849.0, 7969.0, 2191.0, 867.0, 429.0, 222.0, 101.0, 75.0, 56.0, 44.0, 24.0, 16.0, 15.0, 13.0, 7.0, 3.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.3828125, -12.042236328125, -11.70166015625, -11.361083984375, -11.0205078125, -10.679931640625, -10.33935546875, -9.998779296875, -9.658203125, -9.317626953125, -8.97705078125, -8.636474609375, -8.2958984375, -7.955322265625, -7.61474609375, -7.274169921875, -6.93359375, -6.593017578125, -6.25244140625, -5.911865234375, -5.5712890625, -5.230712890625, -4.89013671875, -4.549560546875, -4.208984375, -3.868408203125, -3.52783203125, -3.187255859375, -2.8466796875, -2.506103515625, -2.16552734375, -1.824951171875, -1.484375, -1.143798828125, -0.80322265625, -0.462646484375, -0.1220703125, 0.218505859375, 0.55908203125, 0.899658203125, 1.240234375, 1.580810546875, 1.92138671875, 2.261962890625, 2.6025390625, 2.943115234375, 3.28369140625, 3.624267578125, 3.96484375, 4.305419921875, 4.64599609375, 4.986572265625, 5.3271484375, 5.667724609375, 6.00830078125, 6.348876953125, 6.689453125, 7.030029296875, 7.37060546875, 7.711181640625, 8.0517578125, 8.392333984375, 8.73291015625, 9.073486328125, 9.4140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 7.0, 4.0, 4.0, 9.0, 9.0, 10.0, 9.0, 19.0, 23.0, 20.0, 14.0, 21.0, 30.0, 30.0, 39.0, 43.0, 58.0, 69.0, 66.0, 66.0, 71.0, 53.0, 60.0, 38.0, 35.0, 37.0, 26.0, 18.0, 13.0, 22.0, 17.0, 9.0, 11.0, 8.0, 7.0, 8.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.75, -19.17578125, -18.6015625, -18.02734375, -17.453125, -16.87890625, -16.3046875, -15.73046875, -15.15625, -14.58203125, -14.0078125, -13.43359375, -12.859375, -12.28515625, -11.7109375, -11.13671875, -10.5625, -9.98828125, -9.4140625, -8.83984375, -8.265625, -7.69140625, -7.1171875, -6.54296875, -5.96875, -5.39453125, -4.8203125, -4.24609375, -3.671875, -3.09765625, -2.5234375, -1.94921875, -1.375, -0.80078125, -0.2265625, 0.34765625, 0.921875, 1.49609375, 2.0703125, 2.64453125, 3.21875, 3.79296875, 4.3671875, 4.94140625, 5.515625, 6.08984375, 6.6640625, 7.23828125, 7.8125, 8.38671875, 8.9609375, 9.53515625, 10.109375, 10.68359375, 11.2578125, 11.83203125, 12.40625, 12.98046875, 13.5546875, 14.12890625, 14.703125, 15.27734375, 15.8515625, 16.42578125, 17.0]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 9.0, 13.0, 6.0, 14.0, 22.0, 36.0, 45.0, 59.0, 88.0, 157.0, 281.0, 553.0, 1152.0, 3473.0, 17350.0, 908133.0, 105122.0, 7986.0, 2205.0, 860.0, 417.0, 202.0, 106.0, 76.0, 56.0, 35.0, 25.0, 13.0, 13.0, 7.0, 4.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.951171875, -3.834259033203125, -3.71734619140625, -3.600433349609375, -3.4835205078125, -3.366607666015625, -3.24969482421875, -3.132781982421875, -3.015869140625, -2.898956298828125, -2.78204345703125, -2.665130615234375, -2.5482177734375, -2.431304931640625, -2.31439208984375, -2.197479248046875, -2.08056640625, -1.963653564453125, -1.84674072265625, -1.729827880859375, -1.6129150390625, -1.496002197265625, -1.37908935546875, -1.262176513671875, -1.145263671875, -1.028350830078125, -0.91143798828125, -0.794525146484375, -0.6776123046875, -0.560699462890625, -0.44378662109375, -0.326873779296875, -0.2099609375, -0.093048095703125, 0.02386474609375, 0.140777587890625, 0.2576904296875, 0.374603271484375, 0.49151611328125, 0.608428955078125, 0.725341796875, 0.842254638671875, 0.95916748046875, 1.076080322265625, 1.1929931640625, 1.309906005859375, 1.42681884765625, 1.543731689453125, 1.66064453125, 1.777557373046875, 1.89447021484375, 2.011383056640625, 2.1282958984375, 2.245208740234375, 2.36212158203125, 2.479034423828125, 2.595947265625, 2.712860107421875, 2.82977294921875, 2.946685791015625, 3.0635986328125, 3.180511474609375, 3.29742431640625, 3.414337158203125, 3.53125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 5.0, 9.0, 13.0, 11.0, 21.0, 24.0, 34.0, 43.0, 74.0, 76.0, 101.0, 96.0, 112.0, 91.0, 71.0, 56.0, 34.0, 29.0, 18.0, 13.0, 15.0, 7.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 5.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031065940856933594, -0.0002981610596179962, -0.0002856627106666565, -0.00027316436171531677, -0.00026066601276397705, -0.00024816766381263733, -0.0002356693148612976, -0.00022317096590995789, -0.00021067261695861816, -0.00019817426800727844, -0.00018567591905593872, -0.000173177570104599, -0.00016067922115325928, -0.00014818087220191956, -0.00013568252325057983, -0.0001231841742992401, -0.00011068582534790039, -9.818747639656067e-05, -8.568912744522095e-05, -7.319077849388123e-05, -6.0692429542541504e-05, -4.819408059120178e-05, -3.569573163986206e-05, -2.319738268852234e-05, -1.0699033737182617e-05, 1.7993152141571045e-06, 1.4297664165496826e-05, 2.6796013116836548e-05, 3.929436206817627e-05, 5.179271101951599e-05, 6.429105997085571e-05, 7.678940892219543e-05, 8.928775787353516e-05, 0.00010178610682487488, 0.0001142844557762146, 0.00012678280472755432, 0.00013928115367889404, 0.00015177950263023376, 0.00016427785158157349, 0.0001767762005329132, 0.00018927454948425293, 0.00020177289843559265, 0.00021427124738693237, 0.0002267695963382721, 0.00023926794528961182, 0.00025176629424095154, 0.00026426464319229126, 0.000276762992143631, 0.0002892613410949707, 0.0003017596900463104, 0.00031425803899765015, 0.00032675638794898987, 0.0003392547369003296, 0.0003517530858516693, 0.00036425143480300903, 0.00037674978375434875, 0.0003892481327056885, 0.0004017464816570282, 0.0004142448306083679, 0.00042674317955970764, 0.00043924152851104736, 0.0004517398774623871, 0.0004642382264137268, 0.00047673657536506653, 0.0004892349243164062]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 9.0, 14.0, 34.0, 56.0, 73.0, 202.0, 366.0, 825.0, 2094.0, 6582.0, 31099.0, 764383.0, 213300.0, 21435.0, 4995.0, 1730.0, 667.0, 325.0, 154.0, 72.0, 46.0, 36.0, 19.0, 11.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.236328125, -2.156158447265625, -2.07598876953125, -1.995819091796875, -1.9156494140625, -1.835479736328125, -1.75531005859375, -1.675140380859375, -1.594970703125, -1.514801025390625, -1.43463134765625, -1.354461669921875, -1.2742919921875, -1.194122314453125, -1.11395263671875, -1.033782958984375, -0.95361328125, -0.873443603515625, -0.79327392578125, -0.713104248046875, -0.6329345703125, -0.552764892578125, -0.47259521484375, -0.392425537109375, -0.312255859375, -0.232086181640625, -0.15191650390625, -0.071746826171875, 0.0084228515625, 0.088592529296875, 0.16876220703125, 0.248931884765625, 0.3291015625, 0.409271240234375, 0.48944091796875, 0.569610595703125, 0.6497802734375, 0.729949951171875, 0.81011962890625, 0.890289306640625, 0.970458984375, 1.050628662109375, 1.13079833984375, 1.210968017578125, 1.2911376953125, 1.371307373046875, 1.45147705078125, 1.531646728515625, 1.61181640625, 1.691986083984375, 1.77215576171875, 1.852325439453125, 1.9324951171875, 2.012664794921875, 2.09283447265625, 2.173004150390625, 2.253173828125, 2.333343505859375, 2.41351318359375, 2.493682861328125, 2.5738525390625, 2.654022216796875, 2.73419189453125, 2.814361572265625, 2.89453125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 11.0, 7.0, 4.0, 6.0, 7.0, 16.0, 20.0, 22.0, 28.0, 40.0, 68.0, 91.0, 132.0, 149.0, 117.0, 84.0, 64.0, 38.0, 27.0, 17.0, 11.0, 13.0, 4.0, 8.0, 8.0, 8.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55859375, -2.471160888671875, -2.38372802734375, -2.296295166015625, -2.2088623046875, -2.121429443359375, -2.03399658203125, -1.946563720703125, -1.859130859375, -1.771697998046875, -1.68426513671875, -1.596832275390625, -1.5093994140625, -1.421966552734375, -1.33453369140625, -1.247100830078125, -1.15966796875, -1.072235107421875, -0.98480224609375, -0.897369384765625, -0.8099365234375, -0.722503662109375, -0.63507080078125, -0.547637939453125, -0.460205078125, -0.372772216796875, -0.28533935546875, -0.197906494140625, -0.1104736328125, -0.023040771484375, 0.06439208984375, 0.151824951171875, 0.2392578125, 0.326690673828125, 0.41412353515625, 0.501556396484375, 0.5889892578125, 0.676422119140625, 0.76385498046875, 0.851287841796875, 0.938720703125, 1.026153564453125, 1.11358642578125, 1.201019287109375, 1.2884521484375, 1.375885009765625, 1.46331787109375, 1.550750732421875, 1.63818359375, 1.725616455078125, 1.81304931640625, 1.900482177734375, 1.9879150390625, 2.075347900390625, 2.16278076171875, 2.250213623046875, 2.337646484375, 2.425079345703125, 2.51251220703125, 2.599945068359375, 2.6873779296875, 2.774810791015625, 2.86224365234375, 2.949676513671875, 3.037109375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 11.0, 31.0, 69.0, 422.0, 364.0, 59.0, 28.0, 13.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-257.6507263183594, -252.16146850585938, -246.67221069335938, -241.18295288085938, -235.69371032714844, -230.20445251464844, -224.71519470214844, -219.22593688964844, -213.7366943359375, -208.2474365234375, -202.7581787109375, -197.2689208984375, -191.77967834472656, -186.29042053222656, -180.80116271972656, -175.31190490722656, -169.82264709472656, -164.33338928222656, -158.84413146972656, -153.35488891601562, -147.86563110351562, -142.37637329101562, -136.88711547851562, -131.39785766601562, -125.90860748291016, -120.41934967041016, -114.93009948730469, -109.44084167480469, -103.95158386230469, -98.46233367919922, -92.97307586669922, -87.48382568359375, -81.99456787109375, -76.50531005859375, -71.01605987548828, -65.52680206298828, -60.03754806518555, -54.54829406738281, -49.05903625488281, -43.56978225708008, -38.080528259277344, -32.59127426147461, -27.102018356323242, -21.612762451171875, -16.12350845336914, -10.634254455566406, -5.144996643066406, 0.3442573547363281, 5.8335113525390625, 11.322766304016113, 16.812021255493164, 22.30127716064453, 27.790531158447266, 33.27978515625, 38.76904296875, 44.258296966552734, 49.74755096435547, 55.2368049621582, 60.72605895996094, 66.21531677246094, 71.70457458496094, 77.1938247680664, 82.6830825805664, 88.17233276367188, 93.66159057617188]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 16.0, 10.0, 12.0, 24.0, 25.0, 14.0, 22.0, 35.0, 43.0, 116.0, 149.0, 128.0, 146.0, 47.0, 37.0, 35.0, 23.0, 14.0, 23.0, 16.0, 14.0, 7.0, 8.0, 4.0, 7.0, 3.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.26123809814453, -59.085784912109375, -56.91032791137695, -54.73487091064453, -52.559417724609375, -50.38396453857422, -48.2085075378418, -46.033050537109375, -43.85759735107422, -41.68214416503906, -39.50668716430664, -37.33123016357422, -35.15577697753906, -32.980323791503906, -30.804866790771484, -28.629411697387695, -26.453956604003906, -24.278501510620117, -22.103046417236328, -19.92759132385254, -17.75213623046875, -15.576681137084961, -13.401226043701172, -11.225770950317383, -9.050315856933594, -6.874860763549805, -4.699405670166016, -2.5239505767822266, -0.3484954833984375, 1.8269596099853516, 4.002414703369141, 6.17786979675293, 8.353317260742188, 10.528772354125977, 12.704227447509766, 14.879682540893555, 17.055137634277344, 19.230592727661133, 21.406047821044922, 23.58150291442871, 25.7569580078125, 27.93241310119629, 30.107868194580078, 32.2833251953125, 34.458778381347656, 36.63423156738281, 38.809688568115234, 40.985145568847656, 43.16059875488281, 45.33605194091797, 47.51150894165039, 49.68696594238281, 51.86241912841797, 54.037872314453125, 56.21332931518555, 58.38878631591797, 60.564239501953125, 62.73969268798828, 64.91514587402344, 67.09060668945312, 69.26605987548828, 71.44151306152344, 73.61697387695312, 75.79242706298828, 77.96788024902344]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 6.0, 7.0, 2.0, 11.0, 16.0, 14.0, 24.0, 26.0, 27.0, 40.0, 31.0, 35.0, 42.0, 126.0, 220.0, 76.0, 45.0, 41.0, 40.0, 40.0, 19.0, 22.0, 22.0, 17.0, 9.0, 10.0, 8.0, 6.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.15625, -6.96435546875, -6.7724609375, -6.58056640625, -6.388671875, -6.19677734375, -6.0048828125, -5.81298828125, -5.62109375, -5.42919921875, -5.2373046875, -5.04541015625, -4.853515625, -4.66162109375, -4.4697265625, -4.27783203125, -4.0859375, -3.89404296875, -3.7021484375, -3.51025390625, -3.318359375, -3.12646484375, -2.9345703125, -2.74267578125, -2.55078125, -2.35888671875, -2.1669921875, -1.97509765625, -1.783203125, -1.59130859375, -1.3994140625, -1.20751953125, -1.015625, -0.82373046875, -0.6318359375, -0.43994140625, -0.248046875, -0.05615234375, 0.1357421875, 0.32763671875, 0.51953125, 0.71142578125, 0.9033203125, 1.09521484375, 1.287109375, 1.47900390625, 1.6708984375, 1.86279296875, 2.0546875, 2.24658203125, 2.4384765625, 2.63037109375, 2.822265625, 3.01416015625, 3.2060546875, 3.39794921875, 3.58984375, 3.78173828125, 3.9736328125, 4.16552734375, 4.357421875, 4.54931640625, 4.7412109375, 4.93310546875, 5.125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 0.0, 5.0, 1.0, 3.0, 5.0, 2.0, 11.0, 6.0, 16.0, 34.0, 41.0, 76.0, 176.0, 693.0, 10818.0, 8371318.0, 4643.0, 456.0, 122.0, 54.0, 49.0, 17.0, 19.0, 6.0, 3.0, 8.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.0986099243164, -70.21765899658203, -67.33670806884766, -64.45575714111328, -61.574806213378906, -58.69385528564453, -55.81290054321289, -52.931949615478516, -50.05099868774414, -47.170047760009766, -44.28909683227539, -41.40814208984375, -38.527191162109375, -35.646240234375, -32.765289306640625, -29.88433837890625, -27.003387451171875, -24.1224365234375, -21.241485595703125, -18.360532760620117, -15.479581832885742, -12.598630905151367, -9.71767807006836, -6.836727142333984, -3.9557762145996094, -1.0748248100280762, 1.806126594543457, 4.687078475952148, 7.568029403686523, 10.448980331420898, 13.329933166503906, 16.21088409423828, 19.091835021972656, 21.97278594970703, 24.853736877441406, 27.734689712524414, 30.61564064025879, 33.49658966064453, 36.37754440307617, 39.25849533081055, 42.13944625854492, 45.0203971862793, 47.90134811401367, 50.78230285644531, 53.66325378417969, 56.54420471191406, 59.42515563964844, 62.30610656738281, 65.18705749511719, 68.06800842285156, 70.94895935058594, 73.82991027832031, 76.71086120605469, 79.59181213378906, 82.47276306152344, 85.35371398925781, 88.23466491699219, 91.11561584472656, 93.99656677246094, 96.87751770019531, 99.75846862792969, 102.63941955566406, 105.52037048339844, 108.40132141113281, 111.28227996826172]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 4.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 6.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.46683502197266, -85.97240447998047, -83.47797393798828, -80.98353576660156, -78.48910522460938, -75.99467468261719, -73.500244140625, -71.00581359863281, -68.5113754272461, -66.0169448852539, -63.52251052856445, -61.028079986572266, -58.53364562988281, -56.039215087890625, -53.54478454589844, -51.050350189208984, -48.5559196472168, -46.06148910522461, -43.567054748535156, -41.07262420654297, -38.578189849853516, -36.08375930786133, -33.589324951171875, -31.094894409179688, -28.600461959838867, -26.106029510498047, -23.611597061157227, -21.117164611816406, -18.62273406982422, -16.128299713134766, -13.633869171142578, -11.139436721801758, -8.645004272460938, -6.150571823120117, -3.656139850616455, -1.161707878112793, 1.3327245712280273, 3.8271570205688477, 6.321588516235352, 8.816020965576172, 11.310453414916992, 13.804885864257812, 16.299318313598633, 18.793750762939453, 21.28818130493164, 23.782615661621094, 26.27704620361328, 28.7714786529541, 31.265911102294922, 33.76034164428711, 36.25477600097656, 38.74920654296875, 41.2436408996582, 43.73807144165039, 46.232505798339844, 48.72693634033203, 51.22136688232422, 53.715797424316406, 56.21023178100586, 58.70466232299805, 61.1990966796875, 63.69352722167969, 66.18795776367188, 68.68238830566406, 71.17682647705078]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 4.0, 1.0, 3.0, 10.0, 12.0, 8.0, 7.0, 8.0, 27.0, 15.0, 18.0, 34.0, 44.0, 42.0, 45.0, 44.0, 66.0, 65.0, 60.0, 76.0, 71.0, 60.0, 45.0, 57.0, 33.0, 36.0, 30.0, 16.0, 14.0, 14.0, 8.0, 10.0, 10.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.634765625, -3.474029541015625, -3.31329345703125, -3.152557373046875, -2.9918212890625, -2.831085205078125, -2.67034912109375, -2.509613037109375, -2.348876953125, -2.188140869140625, -2.02740478515625, -1.866668701171875, -1.7059326171875, -1.545196533203125, -1.38446044921875, -1.223724365234375, -1.06298828125, -0.902252197265625, -0.74151611328125, -0.580780029296875, -0.4200439453125, -0.259307861328125, -0.09857177734375, 0.062164306640625, 0.222900390625, 0.383636474609375, 0.54437255859375, 0.705108642578125, 0.8658447265625, 1.026580810546875, 1.18731689453125, 1.348052978515625, 1.5087890625, 1.669525146484375, 1.83026123046875, 1.990997314453125, 2.1517333984375, 2.312469482421875, 2.47320556640625, 2.633941650390625, 2.794677734375, 2.955413818359375, 3.11614990234375, 3.276885986328125, 3.4376220703125, 3.598358154296875, 3.75909423828125, 3.919830322265625, 4.08056640625, 4.241302490234375, 4.40203857421875, 4.562774658203125, 4.7235107421875, 4.884246826171875, 5.04498291015625, 5.205718994140625, 5.366455078125, 5.527191162109375, 5.68792724609375, 5.848663330078125, 6.0093994140625, 6.170135498046875, 6.33087158203125, 6.491607666015625, 6.65234375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 21.0, 17.0, 27.0, 30.0, 62.0, 95.0, 154.0, 260.0, 461.0, 927.0, 2113.0, 5590.0, 17209.0, 62360.0, 208124.0, 163701.0, 42910.0, 12484.0, 4213.0, 1738.0, 769.0, 387.0, 229.0, 129.0, 89.0, 69.0, 31.0, 19.0, 13.0, 7.0, 3.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.46875, -39.30810546875, -38.1474609375, -36.98681640625, -35.826171875, -34.66552734375, -33.5048828125, -32.34423828125, -31.18359375, -30.02294921875, -28.8623046875, -27.70166015625, -26.541015625, -25.38037109375, -24.2197265625, -23.05908203125, -21.8984375, -20.73779296875, -19.5771484375, -18.41650390625, -17.255859375, -16.09521484375, -14.9345703125, -13.77392578125, -12.61328125, -11.45263671875, -10.2919921875, -9.13134765625, -7.970703125, -6.81005859375, -5.6494140625, -4.48876953125, -3.328125, -2.16748046875, -1.0068359375, 0.15380859375, 1.314453125, 2.47509765625, 3.6357421875, 4.79638671875, 5.95703125, 7.11767578125, 8.2783203125, 9.43896484375, 10.599609375, 11.76025390625, 12.9208984375, 14.08154296875, 15.2421875, 16.40283203125, 17.5634765625, 18.72412109375, 19.884765625, 21.04541015625, 22.2060546875, 23.36669921875, 24.52734375, 25.68798828125, 26.8486328125, 28.00927734375, 29.169921875, 30.33056640625, 31.4912109375, 32.65185546875, 33.8125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 4.0, 7.0, 5.0, 8.0, 20.0, 17.0, 21.0, 18.0, 36.0, 35.0, 36.0, 45.0, 46.0, 38.0, 64.0, 53.0, 59.0, 63.0, 54.0, 59.0, 52.0, 52.0, 31.0, 33.0, 20.0, 22.0, 13.0, 16.0, 19.0, 14.0, 11.0, 6.0, 4.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.55859375, -4.41522216796875, -4.2718505859375, -4.12847900390625, -3.985107421875, -3.84173583984375, -3.6983642578125, -3.55499267578125, -3.41162109375, -3.26824951171875, -3.1248779296875, -2.98150634765625, -2.838134765625, -2.69476318359375, -2.5513916015625, -2.40802001953125, -2.2646484375, -2.12127685546875, -1.9779052734375, -1.83453369140625, -1.691162109375, -1.54779052734375, -1.4044189453125, -1.26104736328125, -1.11767578125, -0.97430419921875, -0.8309326171875, -0.68756103515625, -0.544189453125, -0.40081787109375, -0.2574462890625, -0.11407470703125, 0.029296875, 0.17266845703125, 0.3160400390625, 0.45941162109375, 0.602783203125, 0.74615478515625, 0.8895263671875, 1.03289794921875, 1.17626953125, 1.31964111328125, 1.4630126953125, 1.60638427734375, 1.749755859375, 1.89312744140625, 2.0364990234375, 2.17987060546875, 2.3232421875, 2.46661376953125, 2.6099853515625, 2.75335693359375, 2.896728515625, 3.04010009765625, 3.1834716796875, 3.32684326171875, 3.47021484375, 3.61358642578125, 3.7569580078125, 3.90032958984375, 4.043701171875, 4.18707275390625, 4.3304443359375, 4.47381591796875, 4.6171875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 9.0, 14.0, 29.0, 61.0, 126.0, 110.0, 59.0, 26.0, 20.0, 9.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.11520004272461, -23.20858383178711, -21.301965713500977, -19.395349502563477, -17.488731384277344, -15.582115173339844, -13.675498962402344, -11.768881797790527, -9.862264633178711, -7.9556474685668945, -6.049030780792236, -4.142414093017578, -2.2357969284057617, -0.3291797637939453, 1.5774364471435547, 3.484053611755371, 5.3906707763671875, 7.297287940979004, 9.20390510559082, 11.11052131652832, 13.017138481140137, 14.923755645751953, 16.830371856689453, 18.736988067626953, 20.643606185913086, 22.550222396850586, 24.45684051513672, 26.36345672607422, 28.27007293701172, 30.17669105529785, 32.08330535888672, 33.989925384521484, 35.89653778076172, 37.80315399169922, 39.70977020263672, 41.61638641357422, 43.523006439208984, 45.429622650146484, 47.336238861083984, 49.242855072021484, 51.14947509765625, 53.05609130859375, 54.96270751953125, 56.86932373046875, 58.775943756103516, 60.682559967041016, 62.589176177978516, 64.49579620361328, 66.40240478515625, 68.30902099609375, 70.21563720703125, 72.12225341796875, 74.02886962890625, 75.93548583984375, 77.84210205078125, 79.74872589111328, 81.65534210205078, 83.56195831298828, 85.46857452392578, 87.37519073486328, 89.28180694580078, 91.18843078613281, 93.09504699707031, 95.00166320800781, 96.90827941894531]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 5.0, 2.0, 4.0, 3.0, 1.0, 4.0, 4.0, 10.0, 17.0, 29.0, 39.0, 50.0, 60.0, 49.0, 44.0, 39.0, 23.0, 22.0, 14.0, 12.0, 8.0, 6.0, 8.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.789613723754883, -21.070436477661133, -20.351261138916016, -19.632083892822266, -18.912906646728516, -18.193729400634766, -17.47455406188965, -16.7553768157959, -16.03620147705078, -15.317025184631348, -14.597847938537598, -13.878671646118164, -13.159494400024414, -12.44031810760498, -11.721141815185547, -11.001964569091797, -10.282787322998047, -9.563611030578613, -8.844433784484863, -8.12525749206543, -7.406080722808838, -6.686903953552246, -5.9677276611328125, -5.248550891876221, -4.529374122619629, -3.810197353363037, -3.0910208225250244, -2.3718442916870117, -1.65266752243042, -0.9334907531738281, -0.21431446075439453, 0.5048623085021973, 1.2240409851074219, 1.9432176351547241, 2.6623942852020264, 3.381570816040039, 4.100747585296631, 4.819924354553223, 5.539100646972656, 6.258277416229248, 6.97745418548584, 7.696630954742432, 8.415807723999023, 9.134984016418457, 9.85416030883789, 10.57333755493164, 11.292513847351074, 12.011690139770508, 12.730867385864258, 13.450043678283691, 14.169220924377441, 14.888397216796875, 15.607574462890625, 16.326751708984375, 17.045927047729492, 17.765104293823242, 18.48427963256836, 19.20345687866211, 19.922632217407227, 20.641809463500977, 21.360986709594727, 22.080162048339844, 22.799339294433594, 23.518516540527344, 24.237693786621094]}, "eval/loss": 1.5882747173309326, "eval/wer": 0.27844109480364937, "eval/runtime": 637.6994, "eval/samples_per_second": 4.143, "eval/steps_per_second": 0.519} \ No newline at end of file