diff --git "a/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" "b/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" --- "a/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" +++ "b/wandb/run-20220315_200222-14cfddr6/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.407, "train/learning_rate": 5.068289786223278e-06, "train/epoch": 16.82, "train/global_step": 15000, "_runtime": 91322, "_timestamp": 1647465864, "_step": 15009, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 6.0, 8.0, 8.0, 6.0, 10.0, 12.0, 12.0, 15.0, 13.0, 20.0, 16.0, 17.0, 20.0, 26.0, 33.0, 38.0, 35.0, 47.0, 34.0, 38.0, 30.0, 56.0, 54.0, 39.0, 44.0, 38.0, 32.0, 33.0, 29.0, 33.0, 26.0, 23.0, 20.0, 16.0, 33.0, 19.0, 16.0, 8.0, 9.0, 4.0, 11.0, 7.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0], "bins": [-28.95673179626465, -28.36270523071289, -27.768680572509766, -27.174654006958008, -26.58062744140625, -25.986602783203125, -25.392576217651367, -24.79854965209961, -24.204524993896484, -23.610498428344727, -23.0164737701416, -22.422447204589844, -21.82842254638672, -21.23439598083496, -20.640369415283203, -20.046344757080078, -19.45231819152832, -18.858291625976562, -18.264266967773438, -17.67024040222168, -17.076213836669922, -16.482189178466797, -15.888162612915039, -15.294137001037598, -14.700111389160156, -14.106085777282715, -13.512060165405273, -12.918033599853516, -12.324007987976074, -11.729982376098633, -11.135955810546875, -10.541930198669434, -9.94790267944336, -9.353877067565918, -8.759851455688477, -8.165824890136719, -7.571799278259277, -6.977773666381836, -6.383747577667236, -5.789721488952637, -5.195695877075195, -4.601670265197754, -4.007644176483154, -3.413618326187134, -2.8195924758911133, -2.2255666255950928, -1.6315407752990723, -1.0375146865844727, -0.44348907470703125, 0.15053677558898926, 0.7445626258850098, 1.3385884761810303, 1.9326143264770508, 2.5266401767730713, 3.120666027069092, 3.7146921157836914, 4.308717727661133, 4.902743339538574, 5.496769428253174, 6.090795516967773, 6.684821128845215, 7.278846740722656, 7.872872829437256, 8.466898918151855, 9.060924530029297]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 1.0, 3.0, 10.0, 9.0, 17.0, 18.0, 19.0, 24.0, 31.0, 38.0, 29.0, 31.0, 30.0, 46.0, 37.0, 34.0, 49.0, 47.0, 43.0, 51.0, 48.0, 48.0, 35.0, 48.0, 34.0, 29.0, 44.0, 21.0, 17.0, 28.0, 17.0, 12.0, 17.0, 10.0, 4.0, 5.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.945802688598633, -20.255102157592773, -19.56439971923828, -18.873699188232422, -18.182998657226562, -17.492298126220703, -16.80159568786621, -16.11089515686035, -15.420193672180176, -14.7294921875, -14.03879165649414, -13.348090171813965, -12.657388687133789, -11.96668815612793, -11.275986671447754, -10.585285186767578, -9.894584655761719, -9.203883171081543, -8.513182640075684, -7.822481155395508, -7.13178014755249, -6.441079139709473, -5.750377655029297, -5.059676647186279, -4.368975639343262, -3.678274631500244, -2.9875733852386475, -2.296872138977051, -1.6061711311340332, -0.9154701232910156, -0.22476863861083984, 0.46593236923217773, 1.1566352844238281, 1.8473364114761353, 2.5380375385284424, 3.228738784790039, 3.9194397926330566, 4.610140800476074, 5.30084228515625, 5.991543292999268, 6.682244300842285, 7.372945308685303, 8.06364631652832, 8.754347801208496, 9.445049285888672, 10.135749816894531, 10.826451301574707, 11.517152786254883, 12.207853317260742, 12.898554801940918, 13.589255332946777, 14.279956817626953, 14.970657348632812, 15.661358833312988, 16.352060317993164, 17.042760848999023, 17.733463287353516, 18.424163818359375, 19.114866256713867, 19.805566787719727, 20.496267318725586, 21.186969757080078, 21.877670288085938, 22.568370819091797, 23.259071350097656]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 9.0, 25.0, 27.0, 27.0, 47.0, 69.0, 119.0, 210.0, 354.0, 554.0, 817.0, 1277.0, 2081.0, 3226.0, 5063.0, 7985.0, 12982.0, 20665.0, 32723.0, 50968.0, 79661.0, 122164.0, 184971.0, 269876.0, 374009.0, 481122.0, 542440.0, 528671.0, 444904.0, 336738.0, 237256.0, 161762.0, 105898.0, 68870.0, 43319.0, 27443.0, 17293.0, 10880.0, 6669.0, 4241.0, 2566.0, 1655.0, 1030.0, 593.0, 446.0, 233.0, 160.0, 78.0, 41.0, 31.0, 15.0, 12.0, 5.0, 2.0, 4.0, 3.0, 2.0], "bins": [-35.09375, -34.05615234375, -33.0185546875, -31.98095703125, -30.943359375, -29.90576171875, -28.8681640625, -27.83056640625, -26.79296875, -25.75537109375, -24.7177734375, -23.68017578125, -22.642578125, -21.60498046875, -20.5673828125, -19.52978515625, -18.4921875, -17.45458984375, -16.4169921875, -15.37939453125, -14.341796875, -13.30419921875, -12.2666015625, -11.22900390625, -10.19140625, -9.15380859375, -8.1162109375, -7.07861328125, -6.041015625, -5.00341796875, -3.9658203125, -2.92822265625, -1.890625, -0.85302734375, 0.1845703125, 1.22216796875, 2.259765625, 3.29736328125, 4.3349609375, 5.37255859375, 6.41015625, 7.44775390625, 8.4853515625, 9.52294921875, 10.560546875, 11.59814453125, 12.6357421875, 13.67333984375, 14.7109375, 15.74853515625, 16.7861328125, 17.82373046875, 18.861328125, 19.89892578125, 20.9365234375, 21.97412109375, 23.01171875, 24.04931640625, 25.0869140625, 26.12451171875, 27.162109375, 28.19970703125, 29.2373046875, 30.27490234375, 31.3125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 8.0, 11.0, 16.0, 16.0, 16.0, 24.0, 33.0, 28.0, 23.0, 40.0, 25.0, 34.0, 41.0, 43.0, 42.0, 41.0, 47.0, 35.0, 50.0, 45.0, 44.0, 44.0, 44.0, 22.0, 38.0, 34.0, 29.0, 21.0, 24.0, 11.0, 19.0, 6.0, 11.0, 9.0, 6.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-24.078125, -23.328857421875, -22.57958984375, -21.830322265625, -21.0810546875, -20.331787109375, -19.58251953125, -18.833251953125, -18.083984375, -17.334716796875, -16.58544921875, -15.836181640625, -15.0869140625, -14.337646484375, -13.58837890625, -12.839111328125, -12.08984375, -11.340576171875, -10.59130859375, -9.842041015625, -9.0927734375, -8.343505859375, -7.59423828125, -6.844970703125, -6.095703125, -5.346435546875, -4.59716796875, -3.847900390625, -3.0986328125, -2.349365234375, -1.60009765625, -0.850830078125, -0.1015625, 0.647705078125, 1.39697265625, 2.146240234375, 2.8955078125, 3.644775390625, 4.39404296875, 5.143310546875, 5.892578125, 6.641845703125, 7.39111328125, 8.140380859375, 8.8896484375, 9.638916015625, 10.38818359375, 11.137451171875, 11.88671875, 12.635986328125, 13.38525390625, 14.134521484375, 14.8837890625, 15.633056640625, 16.38232421875, 17.131591796875, 17.880859375, 18.630126953125, 19.37939453125, 20.128662109375, 20.8779296875, 21.627197265625, 22.37646484375, 23.125732421875, 23.875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 7.0, 7.0, 9.0, 25.0, 31.0, 61.0, 106.0, 165.0, 316.0, 478.0, 760.0, 1139.0, 1980.0, 3118.0, 5040.0, 7906.0, 12632.0, 19650.0, 30312.0, 46414.0, 69647.0, 101415.0, 146392.0, 202362.0, 268835.0, 337960.0, 397390.0, 433418.0, 434615.0, 399124.0, 340668.0, 271133.0, 204819.0, 148003.0, 104393.0, 71290.0, 47536.0, 30513.0, 20039.0, 12926.0, 8146.0, 5080.0, 3190.0, 2060.0, 1251.0, 745.0, 463.0, 300.0, 164.0, 105.0, 63.0, 32.0, 32.0, 10.0, 7.0, 8.0, 4.0, 0.0, 0.0, 2.0], "bins": [-22.546875, -21.8427734375, -21.138671875, -20.4345703125, -19.73046875, -19.0263671875, -18.322265625, -17.6181640625, -16.9140625, -16.2099609375, -15.505859375, -14.8017578125, -14.09765625, -13.3935546875, -12.689453125, -11.9853515625, -11.28125, -10.5771484375, -9.873046875, -9.1689453125, -8.46484375, -7.7607421875, -7.056640625, -6.3525390625, -5.6484375, -4.9443359375, -4.240234375, -3.5361328125, -2.83203125, -2.1279296875, -1.423828125, -0.7197265625, -0.015625, 0.6884765625, 1.392578125, 2.0966796875, 2.80078125, 3.5048828125, 4.208984375, 4.9130859375, 5.6171875, 6.3212890625, 7.025390625, 7.7294921875, 8.43359375, 9.1376953125, 9.841796875, 10.5458984375, 11.25, 11.9541015625, 12.658203125, 13.3623046875, 14.06640625, 14.7705078125, 15.474609375, 16.1787109375, 16.8828125, 17.5869140625, 18.291015625, 18.9951171875, 19.69921875, 20.4033203125, 21.107421875, 21.8115234375, 22.515625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 17.0, 17.0, 21.0, 20.0, 22.0, 57.0, 43.0, 36.0, 59.0, 77.0, 90.0, 103.0, 109.0, 136.0, 125.0, 162.0, 161.0, 163.0, 202.0, 193.0, 207.0, 208.0, 176.0, 189.0, 192.0, 186.0, 155.0, 127.0, 134.0, 121.0, 87.0, 85.0, 55.0, 67.0, 46.0, 44.0, 34.0, 31.0, 22.0, 15.0, 20.0, 18.0, 10.0, 7.0, 3.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0], "bins": [-12.2421875, -11.8797607421875, -11.517333984375, -11.1549072265625, -10.79248046875, -10.4300537109375, -10.067626953125, -9.7052001953125, -9.3427734375, -8.9803466796875, -8.617919921875, -8.2554931640625, -7.89306640625, -7.5306396484375, -7.168212890625, -6.8057861328125, -6.443359375, -6.0809326171875, -5.718505859375, -5.3560791015625, -4.99365234375, -4.6312255859375, -4.268798828125, -3.9063720703125, -3.5439453125, -3.1815185546875, -2.819091796875, -2.4566650390625, -2.09423828125, -1.7318115234375, -1.369384765625, -1.0069580078125, -0.64453125, -0.2821044921875, 0.080322265625, 0.4427490234375, 0.80517578125, 1.1676025390625, 1.530029296875, 1.8924560546875, 2.2548828125, 2.6173095703125, 2.979736328125, 3.3421630859375, 3.70458984375, 4.0670166015625, 4.429443359375, 4.7918701171875, 5.154296875, 5.5167236328125, 5.879150390625, 6.2415771484375, 6.60400390625, 6.9664306640625, 7.328857421875, 7.6912841796875, 8.0537109375, 8.4161376953125, 8.778564453125, 9.1409912109375, 9.50341796875, 9.8658447265625, 10.228271484375, 10.5906982421875, 10.953125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 4.0, 5.0, 4.0, 3.0, 10.0, 7.0, 10.0, 15.0, 11.0, 14.0, 26.0, 27.0, 34.0, 29.0, 19.0, 26.0, 42.0, 36.0, 33.0, 40.0, 53.0, 34.0, 44.0, 38.0, 43.0, 32.0, 39.0, 38.0, 30.0, 30.0, 30.0, 31.0, 19.0, 22.0, 18.0, 15.0, 18.0, 17.0, 9.0, 11.0, 10.0, 2.0, 11.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.393644332885742, -23.595495223999023, -22.797346115112305, -21.999197006225586, -21.201047897338867, -20.40289878845215, -19.604747772216797, -18.806598663330078, -18.00844955444336, -17.21030044555664, -16.412151336669922, -15.614002227783203, -14.815853118896484, -14.017704010009766, -13.21955394744873, -12.421404838562012, -11.62325668334961, -10.82510757446289, -10.026958465576172, -9.228809356689453, -8.430660247802734, -7.632510662078857, -6.8343610763549805, -6.036211967468262, -5.238062858581543, -4.439913749694824, -3.6417644023895264, -2.8436150550842285, -2.0454659461975098, -1.247316837310791, -0.44916725158691406, 0.3489818572998047, 1.1471309661865234, 1.9452801942825317, 2.74342942237854, 3.541578769683838, 4.339727878570557, 5.137876987457275, 5.936026573181152, 6.734175682067871, 7.53232479095459, 8.330473899841309, 9.128623008728027, 9.926773071289062, 10.724922180175781, 11.5230712890625, 12.321220397949219, 13.119369506835938, 13.917518615722656, 14.715667724609375, 15.513816833496094, 16.311965942382812, 17.11011505126953, 17.90826416015625, 18.70641326904297, 19.504562377929688, 20.302711486816406, 21.100860595703125, 21.899009704589844, 22.697158813476562, 23.49530792236328, 24.29345703125, 25.09160614013672, 25.889755249023438, 26.68790626525879]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 3.0, 6.0, 7.0, 15.0, 13.0, 14.0, 17.0, 31.0, 23.0, 26.0, 28.0, 27.0, 43.0, 23.0, 39.0, 51.0, 34.0, 46.0, 56.0, 48.0, 47.0, 51.0, 38.0, 42.0, 41.0, 27.0, 32.0, 37.0, 25.0, 23.0, 14.0, 13.0, 13.0, 15.0, 7.0, 4.0, 5.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.80069923400879, -27.835338592529297, -26.869979858398438, -25.904619216918945, -24.939258575439453, -23.973899841308594, -23.0085391998291, -22.04317855834961, -21.07781982421875, -20.112459182739258, -19.1471004486084, -18.181739807128906, -17.216379165649414, -16.251018524169922, -15.285659790039062, -14.32029914855957, -13.354938507080078, -12.389578819274902, -11.42421817779541, -10.458858489990234, -9.493497848510742, -8.528138160705566, -7.562778472900391, -6.597418308258057, -5.632058143615723, -4.666697978973389, -3.701338052749634, -2.735978126525879, -1.770617961883545, -0.8052577972412109, 0.16010189056396484, 1.1254620552062988, 2.0908241271972656, 3.0561842918395996, 4.021544456481934, 4.986904144287109, 5.952264308929443, 6.917624473571777, 7.882984161376953, 8.848344802856445, 9.813704490661621, 10.779064178466797, 11.744424819946289, 12.709784507751465, 13.67514419555664, 14.640504837036133, 15.605864524841309, 16.571224212646484, 17.536584854125977, 18.50194549560547, 19.467304229736328, 20.43266487121582, 21.398025512695312, 22.363384246826172, 23.328744888305664, 24.294105529785156, 25.259464263916016, 26.224824905395508, 27.190183639526367, 28.15554428100586, 29.12090492248535, 30.086265563964844, 31.051624298095703, 32.01698303222656, 32.98234558105469]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 5.0, 18.0, 23.0, 27.0, 47.0, 65.0, 105.0, 160.0, 254.0, 419.0, 654.0, 1072.0, 1639.0, 2761.0, 4585.0, 7591.0, 12383.0, 20590.0, 34119.0, 54869.0, 84448.0, 119540.0, 147340.0, 151990.0, 132365.0, 98700.0, 66229.0, 41995.0, 25246.0, 15586.0, 9248.0, 5606.0, 3347.0, 2013.0, 1311.0, 801.0, 496.0, 315.0, 215.0, 125.0, 94.0, 52.0, 30.0, 22.0, 10.0, 15.0, 10.0, 11.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-11.984375, -11.634033203125, -11.28369140625, -10.933349609375, -10.5830078125, -10.232666015625, -9.88232421875, -9.531982421875, -9.181640625, -8.831298828125, -8.48095703125, -8.130615234375, -7.7802734375, -7.429931640625, -7.07958984375, -6.729248046875, -6.37890625, -6.028564453125, -5.67822265625, -5.327880859375, -4.9775390625, -4.627197265625, -4.27685546875, -3.926513671875, -3.576171875, -3.225830078125, -2.87548828125, -2.525146484375, -2.1748046875, -1.824462890625, -1.47412109375, -1.123779296875, -0.7734375, -0.423095703125, -0.07275390625, 0.277587890625, 0.6279296875, 0.978271484375, 1.32861328125, 1.678955078125, 2.029296875, 2.379638671875, 2.72998046875, 3.080322265625, 3.4306640625, 3.781005859375, 4.13134765625, 4.481689453125, 4.83203125, 5.182373046875, 5.53271484375, 5.883056640625, 6.2333984375, 6.583740234375, 6.93408203125, 7.284423828125, 7.634765625, 7.985107421875, 8.33544921875, 8.685791015625, 9.0361328125, 9.386474609375, 9.73681640625, 10.087158203125, 10.4375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 3.0, 4.0, 7.0, 6.0, 14.0, 12.0, 17.0, 19.0, 31.0, 19.0, 26.0, 32.0, 26.0, 40.0, 30.0, 40.0, 50.0, 35.0, 36.0, 63.0, 45.0, 56.0, 43.0, 41.0, 37.0, 41.0, 28.0, 34.0, 33.0, 24.0, 21.0, 20.0, 15.0, 12.0, 10.0, 7.0, 6.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.34375, -28.359375, -27.375, -26.390625, -25.40625, -24.421875, -23.4375, -22.453125, -21.46875, -20.484375, -19.5, -18.515625, -17.53125, -16.546875, -15.5625, -14.578125, -13.59375, -12.609375, -11.625, -10.640625, -9.65625, -8.671875, -7.6875, -6.703125, -5.71875, -4.734375, -3.75, -2.765625, -1.78125, -0.796875, 0.1875, 1.171875, 2.15625, 3.140625, 4.125, 5.109375, 6.09375, 7.078125, 8.0625, 9.046875, 10.03125, 11.015625, 12.0, 12.984375, 13.96875, 14.953125, 15.9375, 16.921875, 17.90625, 18.890625, 19.875, 20.859375, 21.84375, 22.828125, 23.8125, 24.796875, 25.78125, 26.765625, 27.75, 28.734375, 29.71875, 30.703125, 31.6875, 32.671875, 33.65625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 7.0, 15.0, 13.0, 31.0, 58.0, 84.0, 161.0, 270.0, 511.0, 873.0, 1688.0, 3458.0, 7187.0, 15107.0, 36929.0, 864868.0, 74524.0, 22471.0, 10326.0, 4833.0, 2374.0, 1205.0, 690.0, 347.0, 194.0, 132.0, 67.0, 46.0, 37.0, 13.0, 12.0, 8.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.625, -32.53125, -31.4375, -30.34375, -29.25, -28.15625, -27.0625, -25.96875, -24.875, -23.78125, -22.6875, -21.59375, -20.5, -19.40625, -18.3125, -17.21875, -16.125, -15.03125, -13.9375, -12.84375, -11.75, -10.65625, -9.5625, -8.46875, -7.375, -6.28125, -5.1875, -4.09375, -3.0, -1.90625, -0.8125, 0.28125, 1.375, 2.46875, 3.5625, 4.65625, 5.75, 6.84375, 7.9375, 9.03125, 10.125, 11.21875, 12.3125, 13.40625, 14.5, 15.59375, 16.6875, 17.78125, 18.875, 19.96875, 21.0625, 22.15625, 23.25, 24.34375, 25.4375, 26.53125, 27.625, 28.71875, 29.8125, 30.90625, 32.0, 33.09375, 34.1875, 35.28125, 36.375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 0.0, 0.0, 8.0, 2.0, 5.0, 8.0, 10.0, 12.0, 7.0, 13.0, 17.0, 17.0, 22.0, 32.0, 29.0, 17.0, 39.0, 30.0, 44.0, 34.0, 36.0, 40.0, 55.0, 42.0, 48.0, 49.0, 43.0, 40.0, 42.0, 34.0, 34.0, 26.0, 25.0, 22.0, 18.0, 12.0, 13.0, 17.0, 14.0, 15.0, 11.0, 5.0, 4.0, 6.0, 1.0, 6.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.40625, -18.760498046875, -18.11474609375, -17.468994140625, -16.8232421875, -16.177490234375, -15.53173828125, -14.885986328125, -14.240234375, -13.594482421875, -12.94873046875, -12.302978515625, -11.6572265625, -11.011474609375, -10.36572265625, -9.719970703125, -9.07421875, -8.428466796875, -7.78271484375, -7.136962890625, -6.4912109375, -5.845458984375, -5.19970703125, -4.553955078125, -3.908203125, -3.262451171875, -2.61669921875, -1.970947265625, -1.3251953125, -0.679443359375, -0.03369140625, 0.612060546875, 1.2578125, 1.903564453125, 2.54931640625, 3.195068359375, 3.8408203125, 4.486572265625, 5.13232421875, 5.778076171875, 6.423828125, 7.069580078125, 7.71533203125, 8.361083984375, 9.0068359375, 9.652587890625, 10.29833984375, 10.944091796875, 11.58984375, 12.235595703125, 12.88134765625, 13.527099609375, 14.1728515625, 14.818603515625, 15.46435546875, 16.110107421875, 16.755859375, 17.401611328125, 18.04736328125, 18.693115234375, 19.3388671875, 19.984619140625, 20.63037109375, 21.276123046875, 21.921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 13.0, 8.0, 11.0, 8.0, 20.0, 33.0, 44.0, 67.0, 147.0, 224.0, 385.0, 731.0, 1412.0, 2903.0, 6059.0, 14453.0, 37534.0, 868771.0, 77039.0, 21681.0, 8808.0, 3922.0, 1997.0, 991.0, 525.0, 275.0, 180.0, 109.0, 60.0, 43.0, 29.0, 21.0, 11.0, 11.0, 8.0, 7.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.876953125, -2.786285400390625, -2.69561767578125, -2.604949951171875, -2.5142822265625, -2.423614501953125, -2.33294677734375, -2.242279052734375, -2.151611328125, -2.060943603515625, -1.97027587890625, -1.879608154296875, -1.7889404296875, -1.698272705078125, -1.60760498046875, -1.516937255859375, -1.42626953125, -1.335601806640625, -1.24493408203125, -1.154266357421875, -1.0635986328125, -0.972930908203125, -0.88226318359375, -0.791595458984375, -0.700927734375, -0.610260009765625, -0.51959228515625, -0.428924560546875, -0.3382568359375, -0.247589111328125, -0.15692138671875, -0.066253662109375, 0.0244140625, 0.115081787109375, 0.20574951171875, 0.296417236328125, 0.3870849609375, 0.477752685546875, 0.56842041015625, 0.659088134765625, 0.749755859375, 0.840423583984375, 0.93109130859375, 1.021759033203125, 1.1124267578125, 1.203094482421875, 1.29376220703125, 1.384429931640625, 1.47509765625, 1.565765380859375, 1.65643310546875, 1.747100830078125, 1.8377685546875, 1.928436279296875, 2.01910400390625, 2.109771728515625, 2.200439453125, 2.291107177734375, 2.38177490234375, 2.472442626953125, 2.5631103515625, 2.653778076171875, 2.74444580078125, 2.835113525390625, 2.92578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 7.0, 7.0, 11.0, 15.0, 18.0, 19.0, 35.0, 44.0, 65.0, 70.0, 105.0, 110.0, 104.0, 98.0, 84.0, 52.0, 53.0, 28.0, 25.0, 17.0, 12.0, 10.0, 4.0, 4.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020039081573486328, -0.0001936890184879303, -0.00018698722124099731, -0.00018028542399406433, -0.00017358362674713135, -0.00016688182950019836, -0.00016018003225326538, -0.0001534782350063324, -0.00014677643775939941, -0.00014007464051246643, -0.00013337284326553345, -0.00012667104601860046, -0.00011996924877166748, -0.0001132674515247345, -0.00010656565427780151, -9.986385703086853e-05, -9.316205978393555e-05, -8.646026253700256e-05, -7.975846529006958e-05, -7.30566680431366e-05, -6.635487079620361e-05, -5.965307354927063e-05, -5.2951276302337646e-05, -4.624947905540466e-05, -3.954768180847168e-05, -3.2845884561538696e-05, -2.6144087314605713e-05, -1.944229006767273e-05, -1.2740492820739746e-05, -6.038695573806763e-06, 6.631016731262207e-07, 7.364898920059204e-06, 1.4066696166992188e-05, 2.076849341392517e-05, 2.7470290660858154e-05, 3.417208790779114e-05, 4.087388515472412e-05, 4.7575682401657104e-05, 5.427747964859009e-05, 6.097927689552307e-05, 6.768107414245605e-05, 7.438287138938904e-05, 8.108466863632202e-05, 8.7786465883255e-05, 9.448826313018799e-05, 0.00010119006037712097, 0.00010789185762405396, 0.00011459365487098694, 0.00012129545211791992, 0.0001279972493648529, 0.0001346990466117859, 0.00014140084385871887, 0.00014810264110565186, 0.00015480443835258484, 0.00016150623559951782, 0.0001682080328464508, 0.0001749098300933838, 0.00018161162734031677, 0.00018831342458724976, 0.00019501522183418274, 0.00020171701908111572, 0.0002084188163280487, 0.0002151206135749817, 0.00022182241082191467, 0.00022852420806884766]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 4.0, 16.0, 11.0, 10.0, 12.0, 21.0, 29.0, 38.0, 60.0, 72.0, 116.0, 160.0, 228.0, 440.0, 779.0, 1410.0, 2660.0, 5482.0, 11064.0, 22973.0, 46387.0, 87527.0, 148946.0, 206704.0, 202582.0, 141717.0, 83115.0, 43266.0, 21508.0, 10531.0, 4967.0, 2528.0, 1263.0, 698.0, 437.0, 256.0, 142.0, 96.0, 71.0, 55.0, 29.0, 33.0, 21.0, 19.0, 16.0, 12.0, 8.0, 8.0, 5.0, 3.0, 7.0, 4.0, 2.0, 0.0, 1.0, 3.0], "bins": [-2.564453125, -2.48419189453125, -2.4039306640625, -2.32366943359375, -2.243408203125, -2.16314697265625, -2.0828857421875, -2.00262451171875, -1.92236328125, -1.84210205078125, -1.7618408203125, -1.68157958984375, -1.601318359375, -1.52105712890625, -1.4407958984375, -1.36053466796875, -1.2802734375, -1.20001220703125, -1.1197509765625, -1.03948974609375, -0.959228515625, -0.87896728515625, -0.7987060546875, -0.71844482421875, -0.63818359375, -0.55792236328125, -0.4776611328125, -0.39739990234375, -0.317138671875, -0.23687744140625, -0.1566162109375, -0.07635498046875, 0.00390625, 0.08416748046875, 0.1644287109375, 0.24468994140625, 0.324951171875, 0.40521240234375, 0.4854736328125, 0.56573486328125, 0.64599609375, 0.72625732421875, 0.8065185546875, 0.88677978515625, 0.967041015625, 1.04730224609375, 1.1275634765625, 1.20782470703125, 1.2880859375, 1.36834716796875, 1.4486083984375, 1.52886962890625, 1.609130859375, 1.68939208984375, 1.7696533203125, 1.84991455078125, 1.93017578125, 2.01043701171875, 2.0906982421875, 2.17095947265625, 2.251220703125, 2.33148193359375, 2.4117431640625, 2.49200439453125, 2.572265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 10.0, 13.0, 10.0, 13.0, 19.0, 26.0, 35.0, 47.0, 57.0, 58.0, 86.0, 74.0, 96.0, 82.0, 69.0, 55.0, 56.0, 45.0, 40.0, 32.0, 17.0, 19.0, 12.0, 9.0, 4.0, 6.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.115234375, -1.079681396484375, -1.04412841796875, -1.008575439453125, -0.9730224609375, -0.937469482421875, -0.90191650390625, -0.866363525390625, -0.830810546875, -0.795257568359375, -0.75970458984375, -0.724151611328125, -0.6885986328125, -0.653045654296875, -0.61749267578125, -0.581939697265625, -0.54638671875, -0.510833740234375, -0.47528076171875, -0.439727783203125, -0.4041748046875, -0.368621826171875, -0.33306884765625, -0.297515869140625, -0.261962890625, -0.226409912109375, -0.19085693359375, -0.155303955078125, -0.1197509765625, -0.084197998046875, -0.04864501953125, -0.013092041015625, 0.0224609375, 0.058013916015625, 0.09356689453125, 0.129119873046875, 0.1646728515625, 0.200225830078125, 0.23577880859375, 0.271331787109375, 0.306884765625, 0.342437744140625, 0.37799072265625, 0.413543701171875, 0.4490966796875, 0.484649658203125, 0.52020263671875, 0.555755615234375, 0.59130859375, 0.626861572265625, 0.66241455078125, 0.697967529296875, 0.7335205078125, 0.769073486328125, 0.80462646484375, 0.840179443359375, 0.875732421875, 0.911285400390625, 0.94683837890625, 0.982391357421875, 1.0179443359375, 1.053497314453125, 1.08905029296875, 1.124603271484375, 1.16015625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 7.0, 3.0, 6.0, 6.0, 12.0, 7.0, 12.0, 15.0, 16.0, 25.0, 30.0, 29.0, 26.0, 28.0, 31.0, 24.0, 37.0, 49.0, 37.0, 31.0, 38.0, 42.0, 41.0, 36.0, 46.0, 37.0, 36.0, 36.0, 32.0, 26.0, 18.0, 26.0, 19.0, 25.0, 20.0, 17.0, 16.0, 8.0, 14.0, 6.0, 4.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.033145904541016, -23.22198486328125, -22.410825729370117, -21.59966468811035, -20.788503646850586, -19.977344512939453, -19.166183471679688, -18.355022430419922, -17.54386329650879, -16.732702255249023, -15.921542167663574, -15.110382080078125, -14.299221992492676, -13.488061904907227, -12.676900863647461, -11.865740776062012, -11.054579734802246, -10.243419647216797, -9.432258605957031, -8.621098518371582, -7.809938430786133, -6.998777866363525, -6.187617301940918, -5.376457214355469, -4.565296649932861, -3.754136323928833, -2.9429759979248047, -2.1318154335021973, -1.320655107498169, -0.5094947814941406, 0.3016657829284668, 1.112825870513916, 1.9239864349365234, 2.7351467609405518, 3.54630708694458, 4.3574676513671875, 5.168627738952637, 5.979788303375244, 6.790948867797852, 7.602108955383301, 8.41326904296875, 9.2244291305542, 10.035590171813965, 10.846750259399414, 11.657910346984863, 12.469070434570312, 13.280231475830078, 14.091391563415527, 14.902552604675293, 15.713712692260742, 16.524873733520508, 17.33603286743164, 18.147193908691406, 18.958354949951172, 19.769515991210938, 20.58067512512207, 21.391836166381836, 22.2029972076416, 23.014156341552734, 23.8253173828125, 24.636478424072266, 25.4476375579834, 26.258798599243164, 27.069957733154297, 27.881118774414062]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 4.0, 7.0, 14.0, 11.0, 18.0, 13.0, 28.0, 21.0, 28.0, 32.0, 20.0, 40.0, 36.0, 35.0, 48.0, 34.0, 40.0, 54.0, 57.0, 48.0, 45.0, 49.0, 30.0, 46.0, 28.0, 36.0, 32.0, 27.0, 19.0, 25.0, 14.0, 12.0, 10.0, 11.0, 4.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.725088119506836, -28.738977432250977, -27.752866744995117, -26.766756057739258, -25.7806453704834, -24.79453468322754, -23.808422088623047, -22.822311401367188, -21.836200714111328, -20.85009002685547, -19.86397933959961, -18.87786865234375, -17.89175796508789, -16.90564727783203, -15.919535636901855, -14.933424949645996, -13.947315216064453, -12.961204528808594, -11.975093841552734, -10.988983154296875, -10.002872467041016, -9.016761779785156, -8.03065013885498, -7.044539451599121, -6.058428764343262, -5.072318077087402, -4.086207389831543, -3.1000962257385254, -2.113985538482666, -1.1278748512268066, -0.14176368713378906, 0.8443470001220703, 1.8304595947265625, 2.816570281982422, 3.8026812076568604, 4.788792133331299, 5.774902820587158, 6.761013507843018, 7.747124671936035, 8.733235359191895, 9.719346046447754, 10.705456733703613, 11.691567420959473, 12.677679061889648, 13.663789749145508, 14.649900436401367, 15.636011123657227, 16.622121810913086, 17.608232498168945, 18.594343185424805, 19.580453872680664, 20.566564559936523, 21.552675247192383, 22.538785934448242, 23.524898529052734, 24.511009216308594, 25.497119903564453, 26.483230590820312, 27.469341278076172, 28.45545196533203, 29.44156265258789, 30.42767333984375, 31.41378402709961, 32.39989471435547, 33.38600540161133]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 10.0, 15.0, 35.0, 29.0, 56.0, 79.0, 133.0, 198.0, 306.0, 482.0, 778.0, 1216.0, 1890.0, 2983.0, 4700.0, 6992.0, 10813.0, 15434.0, 22852.0, 31581.0, 42774.0, 56053.0, 70127.0, 83473.0, 92837.0, 98470.0, 95830.0, 89366.0, 78191.0, 64383.0, 50612.0, 38540.0, 27998.0, 19730.0, 13468.0, 8980.0, 6082.0, 3936.0, 2608.0, 1635.0, 1053.0, 648.0, 407.0, 265.0, 178.0, 111.0, 68.0, 56.0, 39.0, 21.0, 16.0, 5.0, 5.0, 5.0, 3.0, 3.0], "bins": [-21.0625, -20.439453125, -19.81640625, -19.193359375, -18.5703125, -17.947265625, -17.32421875, -16.701171875, -16.078125, -15.455078125, -14.83203125, -14.208984375, -13.5859375, -12.962890625, -12.33984375, -11.716796875, -11.09375, -10.470703125, -9.84765625, -9.224609375, -8.6015625, -7.978515625, -7.35546875, -6.732421875, -6.109375, -5.486328125, -4.86328125, -4.240234375, -3.6171875, -2.994140625, -2.37109375, -1.748046875, -1.125, -0.501953125, 0.12109375, 0.744140625, 1.3671875, 1.990234375, 2.61328125, 3.236328125, 3.859375, 4.482421875, 5.10546875, 5.728515625, 6.3515625, 6.974609375, 7.59765625, 8.220703125, 8.84375, 9.466796875, 10.08984375, 10.712890625, 11.3359375, 11.958984375, 12.58203125, 13.205078125, 13.828125, 14.451171875, 15.07421875, 15.697265625, 16.3203125, 16.943359375, 17.56640625, 18.189453125, 18.8125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 5.0, 16.0, 12.0, 16.0, 14.0, 23.0, 30.0, 24.0, 29.0, 23.0, 42.0, 29.0, 40.0, 42.0, 39.0, 43.0, 43.0, 59.0, 45.0, 49.0, 47.0, 40.0, 35.0, 35.0, 31.0, 35.0, 29.0, 18.0, 24.0, 15.0, 13.0, 10.0, 8.0, 7.0, 6.0, 1.0, 8.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.546875, -28.567626953125, -27.58837890625, -26.609130859375, -25.6298828125, -24.650634765625, -23.67138671875, -22.692138671875, -21.712890625, -20.733642578125, -19.75439453125, -18.775146484375, -17.7958984375, -16.816650390625, -15.83740234375, -14.858154296875, -13.87890625, -12.899658203125, -11.92041015625, -10.941162109375, -9.9619140625, -8.982666015625, -8.00341796875, -7.024169921875, -6.044921875, -5.065673828125, -4.08642578125, -3.107177734375, -2.1279296875, -1.148681640625, -0.16943359375, 0.809814453125, 1.7890625, 2.768310546875, 3.74755859375, 4.726806640625, 5.7060546875, 6.685302734375, 7.66455078125, 8.643798828125, 9.623046875, 10.602294921875, 11.58154296875, 12.560791015625, 13.5400390625, 14.519287109375, 15.49853515625, 16.477783203125, 17.45703125, 18.436279296875, 19.41552734375, 20.394775390625, 21.3740234375, 22.353271484375, 23.33251953125, 24.311767578125, 25.291015625, 26.270263671875, 27.24951171875, 28.228759765625, 29.2080078125, 30.187255859375, 31.16650390625, 32.145751953125, 33.125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 7.0, 8.0, 12.0, 21.0, 35.0, 47.0, 73.0, 90.0, 136.0, 186.0, 310.0, 446.0, 650.0, 1053.0, 1600.0, 2299.0, 3562.0, 5496.0, 8508.0, 12833.0, 19346.0, 28522.0, 40919.0, 55647.0, 73776.0, 90783.0, 103894.0, 110428.0, 107053.0, 96284.0, 80001.0, 62000.0, 45588.0, 32265.0, 21956.0, 14725.0, 9582.0, 6335.0, 4225.0, 2651.0, 1731.0, 1132.0, 750.0, 561.0, 343.0, 233.0, 152.0, 104.0, 68.0, 55.0, 29.0, 20.0, 12.0, 10.0, 7.0, 5.0, 4.0, 0.0, 2.0], "bins": [-25.609375, -24.825439453125, -24.04150390625, -23.257568359375, -22.4736328125, -21.689697265625, -20.90576171875, -20.121826171875, -19.337890625, -18.553955078125, -17.77001953125, -16.986083984375, -16.2021484375, -15.418212890625, -14.63427734375, -13.850341796875, -13.06640625, -12.282470703125, -11.49853515625, -10.714599609375, -9.9306640625, -9.146728515625, -8.36279296875, -7.578857421875, -6.794921875, -6.010986328125, -5.22705078125, -4.443115234375, -3.6591796875, -2.875244140625, -2.09130859375, -1.307373046875, -0.5234375, 0.260498046875, 1.04443359375, 1.828369140625, 2.6123046875, 3.396240234375, 4.18017578125, 4.964111328125, 5.748046875, 6.531982421875, 7.31591796875, 8.099853515625, 8.8837890625, 9.667724609375, 10.45166015625, 11.235595703125, 12.01953125, 12.803466796875, 13.58740234375, 14.371337890625, 15.1552734375, 15.939208984375, 16.72314453125, 17.507080078125, 18.291015625, 19.074951171875, 19.85888671875, 20.642822265625, 21.4267578125, 22.210693359375, 22.99462890625, 23.778564453125, 24.5625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 8.0, 5.0, 9.0, 4.0, 9.0, 10.0, 20.0, 18.0, 17.0, 18.0, 22.0, 23.0, 28.0, 26.0, 24.0, 31.0, 46.0, 23.0, 41.0, 25.0, 28.0, 37.0, 28.0, 40.0, 42.0, 48.0, 23.0, 30.0, 34.0, 32.0, 16.0, 25.0, 35.0, 29.0, 21.0, 19.0, 13.0, 15.0, 17.0, 11.0, 3.0, 13.0, 4.0, 4.0, 6.0, 3.0, 4.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-17.421875, -16.87841796875, -16.3349609375, -15.79150390625, -15.248046875, -14.70458984375, -14.1611328125, -13.61767578125, -13.07421875, -12.53076171875, -11.9873046875, -11.44384765625, -10.900390625, -10.35693359375, -9.8134765625, -9.27001953125, -8.7265625, -8.18310546875, -7.6396484375, -7.09619140625, -6.552734375, -6.00927734375, -5.4658203125, -4.92236328125, -4.37890625, -3.83544921875, -3.2919921875, -2.74853515625, -2.205078125, -1.66162109375, -1.1181640625, -0.57470703125, -0.03125, 0.51220703125, 1.0556640625, 1.59912109375, 2.142578125, 2.68603515625, 3.2294921875, 3.77294921875, 4.31640625, 4.85986328125, 5.4033203125, 5.94677734375, 6.490234375, 7.03369140625, 7.5771484375, 8.12060546875, 8.6640625, 9.20751953125, 9.7509765625, 10.29443359375, 10.837890625, 11.38134765625, 11.9248046875, 12.46826171875, 13.01171875, 13.55517578125, 14.0986328125, 14.64208984375, 15.185546875, 15.72900390625, 16.2724609375, 16.81591796875, 17.359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 12.0, 6.0, 9.0, 15.0, 35.0, 38.0, 74.0, 85.0, 145.0, 280.0, 427.0, 647.0, 1022.0, 1808.0, 3053.0, 5005.0, 8555.0, 14324.0, 24290.0, 39172.0, 61055.0, 88820.0, 118469.0, 139126.0, 141581.0, 124997.0, 96453.0, 67609.0, 43364.0, 27210.0, 16703.0, 9772.0, 5934.0, 3359.0, 1992.0, 1176.0, 728.0, 432.0, 286.0, 195.0, 120.0, 66.0, 34.0, 28.0, 22.0, 9.0, 9.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.8828125, -8.62249755859375, -8.3621826171875, -8.10186767578125, -7.841552734375, -7.58123779296875, -7.3209228515625, -7.06060791015625, -6.80029296875, -6.53997802734375, -6.2796630859375, -6.01934814453125, -5.759033203125, -5.49871826171875, -5.2384033203125, -4.97808837890625, -4.7177734375, -4.45745849609375, -4.1971435546875, -3.93682861328125, -3.676513671875, -3.41619873046875, -3.1558837890625, -2.89556884765625, -2.63525390625, -2.37493896484375, -2.1146240234375, -1.85430908203125, -1.593994140625, -1.33367919921875, -1.0733642578125, -0.81304931640625, -0.552734375, -0.29241943359375, -0.0321044921875, 0.22821044921875, 0.488525390625, 0.74884033203125, 1.0091552734375, 1.26947021484375, 1.52978515625, 1.79010009765625, 2.0504150390625, 2.31072998046875, 2.571044921875, 2.83135986328125, 3.0916748046875, 3.35198974609375, 3.6123046875, 3.87261962890625, 4.1329345703125, 4.39324951171875, 4.653564453125, 4.91387939453125, 5.1741943359375, 5.43450927734375, 5.69482421875, 5.95513916015625, 6.2154541015625, 6.47576904296875, 6.736083984375, 6.99639892578125, 7.2567138671875, 7.51702880859375, 7.77734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 5.0, 14.0, 14.0, 15.0, 20.0, 22.0, 26.0, 33.0, 48.0, 43.0, 55.0, 69.0, 64.0, 69.0, 51.0, 60.0, 51.0, 39.0, 44.0, 36.0, 45.0, 28.0, 21.0, 18.0, 29.0, 19.0, 15.0, 9.0, 6.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012407302856445312, -0.001207977533340454, -0.001175224781036377, -0.0011424720287322998, -0.0011097192764282227, -0.0010769665241241455, -0.0010442137718200684, -0.0010114610195159912, -0.000978708267211914, -0.0009459555149078369, -0.0009132027626037598, -0.0008804500102996826, -0.0008476972579956055, -0.0008149445056915283, -0.0007821917533874512, -0.000749439001083374, -0.0007166862487792969, -0.0006839334964752197, -0.0006511807441711426, -0.0006184279918670654, -0.0005856752395629883, -0.0005529224872589111, -0.000520169734954834, -0.00048741698265075684, -0.0004546642303466797, -0.00042191147804260254, -0.0003891587257385254, -0.00035640597343444824, -0.0003236532211303711, -0.00029090046882629395, -0.0002581477165222168, -0.00022539496421813965, -0.0001926422119140625, -0.00015988945960998535, -0.0001271367073059082, -9.438395500183105e-05, -6.16312026977539e-05, -2.8878450393676758e-05, 3.874301910400391e-06, 3.662705421447754e-05, 6.937980651855469e-05, 0.00010213255882263184, 0.00013488531112670898, 0.00016763806343078613, 0.00020039081573486328, 0.00023314356803894043, 0.0002658963203430176, 0.0002986490726470947, 0.0003314018249511719, 0.000364154577255249, 0.00039690732955932617, 0.0004296600818634033, 0.00046241283416748047, 0.0004951655864715576, 0.0005279183387756348, 0.0005606710910797119, 0.0005934238433837891, 0.0006261765956878662, 0.0006589293479919434, 0.0006916821002960205, 0.0007244348526000977, 0.0007571876049041748, 0.000789940357208252, 0.0008226931095123291, 0.0008554458618164062]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 6.0, 6.0, 11.0, 16.0, 21.0, 43.0, 67.0, 117.0, 127.0, 279.0, 354.0, 603.0, 853.0, 1323.0, 2038.0, 3075.0, 4847.0, 7316.0, 11497.0, 17062.0, 25524.0, 37508.0, 53119.0, 70952.0, 89490.0, 105351.0, 113172.0, 110526.0, 100477.0, 83511.0, 64384.0, 46852.0, 32910.0, 22472.0, 14755.0, 9708.0, 6445.0, 4146.0, 2709.0, 1704.0, 1050.0, 764.0, 483.0, 301.0, 197.0, 153.0, 84.0, 53.0, 33.0, 25.0, 17.0, 8.0, 3.0, 11.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.4921875, -6.28155517578125, -6.0709228515625, -5.86029052734375, -5.649658203125, -5.43902587890625, -5.2283935546875, -5.01776123046875, -4.80712890625, -4.59649658203125, -4.3858642578125, -4.17523193359375, -3.964599609375, -3.75396728515625, -3.5433349609375, -3.33270263671875, -3.1220703125, -2.91143798828125, -2.7008056640625, -2.49017333984375, -2.279541015625, -2.06890869140625, -1.8582763671875, -1.64764404296875, -1.43701171875, -1.22637939453125, -1.0157470703125, -0.80511474609375, -0.594482421875, -0.38385009765625, -0.1732177734375, 0.03741455078125, 0.248046875, 0.45867919921875, 0.6693115234375, 0.87994384765625, 1.090576171875, 1.30120849609375, 1.5118408203125, 1.72247314453125, 1.93310546875, 2.14373779296875, 2.3543701171875, 2.56500244140625, 2.775634765625, 2.98626708984375, 3.1968994140625, 3.40753173828125, 3.6181640625, 3.82879638671875, 4.0394287109375, 4.25006103515625, 4.460693359375, 4.67132568359375, 4.8819580078125, 5.09259033203125, 5.30322265625, 5.51385498046875, 5.7244873046875, 5.93511962890625, 6.145751953125, 6.35638427734375, 6.5670166015625, 6.77764892578125, 6.98828125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 2.0, 6.0, 7.0, 5.0, 15.0, 5.0, 10.0, 15.0, 17.0, 28.0, 27.0, 33.0, 34.0, 43.0, 41.0, 45.0, 43.0, 35.0, 52.0, 67.0, 49.0, 53.0, 51.0, 56.0, 41.0, 42.0, 35.0, 28.0, 27.0, 16.0, 10.0, 15.0, 9.0, 14.0, 8.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.162109375, -3.05987548828125, -2.9576416015625, -2.85540771484375, -2.753173828125, -2.65093994140625, -2.5487060546875, -2.44647216796875, -2.34423828125, -2.24200439453125, -2.1397705078125, -2.03753662109375, -1.935302734375, -1.83306884765625, -1.7308349609375, -1.62860107421875, -1.5263671875, -1.42413330078125, -1.3218994140625, -1.21966552734375, -1.117431640625, -1.01519775390625, -0.9129638671875, -0.81072998046875, -0.70849609375, -0.60626220703125, -0.5040283203125, -0.40179443359375, -0.299560546875, -0.19732666015625, -0.0950927734375, 0.00714111328125, 0.109375, 0.21160888671875, 0.3138427734375, 0.41607666015625, 0.518310546875, 0.62054443359375, 0.7227783203125, 0.82501220703125, 0.92724609375, 1.02947998046875, 1.1317138671875, 1.23394775390625, 1.336181640625, 1.43841552734375, 1.5406494140625, 1.64288330078125, 1.7451171875, 1.84735107421875, 1.9495849609375, 2.05181884765625, 2.154052734375, 2.25628662109375, 2.3585205078125, 2.46075439453125, 2.56298828125, 2.66522216796875, 2.7674560546875, 2.86968994140625, 2.971923828125, 3.07415771484375, 3.1763916015625, 3.27862548828125, 3.380859375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 7.0, 1.0, 3.0, 7.0, 8.0, 7.0, 14.0, 17.0, 13.0, 17.0, 26.0, 20.0, 17.0, 39.0, 53.0, 35.0, 29.0, 48.0, 39.0, 38.0, 34.0, 48.0, 41.0, 51.0, 52.0, 38.0, 31.0, 28.0, 32.0, 25.0, 28.0, 25.0, 27.0, 17.0, 17.0, 14.0, 11.0, 8.0, 7.0, 11.0, 10.0, 3.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.159210205078125, -29.23592185974121, -28.312631607055664, -27.38934326171875, -26.466054916381836, -25.542766571044922, -24.619476318359375, -23.69618797302246, -22.772899627685547, -21.849611282348633, -20.926321029663086, -20.003032684326172, -19.079744338989258, -18.156455993652344, -17.233165740966797, -16.309877395629883, -15.386587142944336, -14.463297843933105, -13.540009498596191, -12.616720199584961, -11.693431854248047, -10.770142555236816, -9.846853256225586, -8.923564910888672, -8.000275611877441, -7.076986789703369, -6.153697967529297, -5.230408668518066, -4.307119846343994, -3.383831024169922, -2.4605417251586914, -1.5372529029846191, -0.6139621734619141, 0.30932676792144775, 1.2326157093048096, 2.155904769897461, 3.079193592071533, 4.0024824142456055, 4.925771713256836, 5.849060535430908, 6.7723493576049805, 7.695638179779053, 8.618927001953125, 9.542216300964355, 10.465505599975586, 11.3887939453125, 12.31208324432373, 13.235372543334961, 14.158660888671875, 15.081950187683105, 16.005239486694336, 16.92852783203125, 17.851816177368164, 18.775104522705078, 19.698394775390625, 20.62168312072754, 21.544971466064453, 22.468259811401367, 23.391550064086914, 24.314838409423828, 25.238126754760742, 26.161415100097656, 27.084705352783203, 28.007993698120117, 28.931283950805664]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 15.0, 12.0, 19.0, 22.0, 22.0, 20.0, 29.0, 43.0, 29.0, 56.0, 36.0, 54.0, 41.0, 51.0, 60.0, 37.0, 52.0, 43.0, 40.0, 40.0, 39.0, 42.0, 37.0, 32.0, 17.0, 21.0, 12.0, 16.0, 8.0, 10.0, 11.0, 9.0, 3.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.4459342956543, -32.32765197753906, -31.209365844726562, -30.091083526611328, -28.97279930114746, -27.854515075683594, -26.736230850219727, -25.61794662475586, -24.499664306640625, -23.381380081176758, -22.26309585571289, -21.144813537597656, -20.02652931213379, -18.908245086669922, -17.789960861206055, -16.671676635742188, -15.55339241027832, -14.435108184814453, -13.316824913024902, -12.198540687561035, -11.080257415771484, -9.961973190307617, -8.84368896484375, -7.725405216217041, -6.607121467590332, -5.488837718963623, -4.370553970336914, -3.252269744873047, -2.133985996246338, -1.015702247619629, 0.10258197784423828, 1.2208657264709473, 2.3391494750976562, 3.4574332237243652, 4.575716972351074, 5.694001197814941, 6.81228494644165, 7.930568695068359, 9.048852920532227, 10.167137145996094, 11.285420417785645, 12.403704643249512, 13.521987915039062, 14.64027214050293, 15.758556365966797, 16.87683868408203, 17.99512481689453, 19.113407135009766, 20.231691360473633, 21.3499755859375, 22.468259811401367, 23.586544036865234, 24.70482635498047, 25.823110580444336, 26.941394805908203, 28.05967903137207, 29.177963256835938, 30.296247482299805, 31.414531707763672, 32.532814025878906, 33.651100158691406, 34.76938247680664, 35.887664794921875, 37.005950927734375, 38.12423324584961]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 13.0, 21.0, 40.0, 44.0, 70.0, 119.0, 185.0, 297.0, 454.0, 712.0, 1155.0, 1933.0, 2891.0, 4681.0, 7386.0, 12225.0, 18959.0, 29887.0, 46752.0, 73340.0, 112611.0, 170066.0, 247752.0, 345250.0, 440354.0, 508453.0, 517783.0, 462795.0, 371197.0, 271495.0, 188599.0, 127389.0, 82890.0, 53694.0, 33891.0, 21667.0, 13564.0, 8647.0, 5559.0, 3388.0, 2246.0, 1372.0, 861.0, 572.0, 351.0, 233.0, 147.0, 114.0, 76.0, 31.0, 30.0, 16.0, 13.0, 11.0, 2.0, 2.0, 3.0, 1.0], "bins": [-26.890625, -26.053955078125, -25.21728515625, -24.380615234375, -23.5439453125, -22.707275390625, -21.87060546875, -21.033935546875, -20.197265625, -19.360595703125, -18.52392578125, -17.687255859375, -16.8505859375, -16.013916015625, -15.17724609375, -14.340576171875, -13.50390625, -12.667236328125, -11.83056640625, -10.993896484375, -10.1572265625, -9.320556640625, -8.48388671875, -7.647216796875, -6.810546875, -5.973876953125, -5.13720703125, -4.300537109375, -3.4638671875, -2.627197265625, -1.79052734375, -0.953857421875, -0.1171875, 0.719482421875, 1.55615234375, 2.392822265625, 3.2294921875, 4.066162109375, 4.90283203125, 5.739501953125, 6.576171875, 7.412841796875, 8.24951171875, 9.086181640625, 9.9228515625, 10.759521484375, 11.59619140625, 12.432861328125, 13.26953125, 14.106201171875, 14.94287109375, 15.779541015625, 16.6162109375, 17.452880859375, 18.28955078125, 19.126220703125, 19.962890625, 20.799560546875, 21.63623046875, 22.472900390625, 23.3095703125, 24.146240234375, 24.98291015625, 25.819580078125, 26.65625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 6.0, 2.0, 10.0, 12.0, 14.0, 18.0, 17.0, 27.0, 22.0, 29.0, 35.0, 38.0, 48.0, 43.0, 47.0, 52.0, 53.0, 53.0, 49.0, 44.0, 47.0, 38.0, 39.0, 37.0, 42.0, 33.0, 34.0, 21.0, 17.0, 13.0, 16.0, 10.0, 11.0, 6.0, 10.0, 3.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.390625, -27.436767578125, -26.48291015625, -25.529052734375, -24.5751953125, -23.621337890625, -22.66748046875, -21.713623046875, -20.759765625, -19.805908203125, -18.85205078125, -17.898193359375, -16.9443359375, -15.990478515625, -15.03662109375, -14.082763671875, -13.12890625, -12.175048828125, -11.22119140625, -10.267333984375, -9.3134765625, -8.359619140625, -7.40576171875, -6.451904296875, -5.498046875, -4.544189453125, -3.59033203125, -2.636474609375, -1.6826171875, -0.728759765625, 0.22509765625, 1.178955078125, 2.1328125, 3.086669921875, 4.04052734375, 4.994384765625, 5.9482421875, 6.902099609375, 7.85595703125, 8.809814453125, 9.763671875, 10.717529296875, 11.67138671875, 12.625244140625, 13.5791015625, 14.532958984375, 15.48681640625, 16.440673828125, 17.39453125, 18.348388671875, 19.30224609375, 20.256103515625, 21.2099609375, 22.163818359375, 23.11767578125, 24.071533203125, 25.025390625, 25.979248046875, 26.93310546875, 27.886962890625, 28.8408203125, 29.794677734375, 30.74853515625, 31.702392578125, 32.65625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 12.0, 10.0, 20.0, 37.0, 58.0, 94.0, 155.0, 274.0, 437.0, 782.0, 1332.0, 2179.0, 3905.0, 6546.0, 11407.0, 19437.0, 32906.0, 54772.0, 89017.0, 140960.0, 214750.0, 308743.0, 411134.0, 497266.0, 533758.0, 506366.0, 422580.0, 321667.0, 225451.0, 149868.0, 94673.0, 58678.0, 35147.0, 20663.0, 12203.0, 7148.0, 4145.0, 2358.0, 1384.0, 827.0, 466.0, 274.0, 163.0, 96.0, 53.0, 25.0, 30.0, 13.0, 10.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-28.5, -27.65087890625, -26.8017578125, -25.95263671875, -25.103515625, -24.25439453125, -23.4052734375, -22.55615234375, -21.70703125, -20.85791015625, -20.0087890625, -19.15966796875, -18.310546875, -17.46142578125, -16.6123046875, -15.76318359375, -14.9140625, -14.06494140625, -13.2158203125, -12.36669921875, -11.517578125, -10.66845703125, -9.8193359375, -8.97021484375, -8.12109375, -7.27197265625, -6.4228515625, -5.57373046875, -4.724609375, -3.87548828125, -3.0263671875, -2.17724609375, -1.328125, -0.47900390625, 0.3701171875, 1.21923828125, 2.068359375, 2.91748046875, 3.7666015625, 4.61572265625, 5.46484375, 6.31396484375, 7.1630859375, 8.01220703125, 8.861328125, 9.71044921875, 10.5595703125, 11.40869140625, 12.2578125, 13.10693359375, 13.9560546875, 14.80517578125, 15.654296875, 16.50341796875, 17.3525390625, 18.20166015625, 19.05078125, 19.89990234375, 20.7490234375, 21.59814453125, 22.447265625, 23.29638671875, 24.1455078125, 24.99462890625, 25.84375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 11.0, 18.0, 17.0, 17.0, 26.0, 36.0, 51.0, 65.0, 65.0, 90.0, 117.0, 153.0, 152.0, 164.0, 171.0, 186.0, 213.0, 229.0, 242.0, 244.0, 234.0, 207.0, 204.0, 171.0, 143.0, 156.0, 127.0, 121.0, 98.0, 74.0, 50.0, 39.0, 44.0, 31.0, 26.0, 21.0, 20.0, 12.0, 8.0, 6.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.390625, -12.96875, -12.546875, -12.125, -11.703125, -11.28125, -10.859375, -10.4375, -10.015625, -9.59375, -9.171875, -8.75, -8.328125, -7.90625, -7.484375, -7.0625, -6.640625, -6.21875, -5.796875, -5.375, -4.953125, -4.53125, -4.109375, -3.6875, -3.265625, -2.84375, -2.421875, -2.0, -1.578125, -1.15625, -0.734375, -0.3125, 0.109375, 0.53125, 0.953125, 1.375, 1.796875, 2.21875, 2.640625, 3.0625, 3.484375, 3.90625, 4.328125, 4.75, 5.171875, 5.59375, 6.015625, 6.4375, 6.859375, 7.28125, 7.703125, 8.125, 8.546875, 8.96875, 9.390625, 9.8125, 10.234375, 10.65625, 11.078125, 11.5, 11.921875, 12.34375, 12.765625, 13.1875, 13.609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 7.0, 13.0, 6.0, 4.0, 9.0, 17.0, 17.0, 22.0, 18.0, 24.0, 33.0, 21.0, 41.0, 29.0, 37.0, 32.0, 54.0, 29.0, 35.0, 47.0, 51.0, 48.0, 36.0, 28.0, 26.0, 37.0, 36.0, 31.0, 32.0, 25.0, 18.0, 17.0, 20.0, 13.0, 13.0, 12.0, 17.0, 2.0, 6.0, 7.0, 8.0, 6.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-27.767608642578125, -26.920015335083008, -26.07242202758789, -25.224830627441406, -24.37723731994629, -23.529644012451172, -22.682050704956055, -21.834457397460938, -20.986865997314453, -20.139272689819336, -19.29167938232422, -18.444087982177734, -17.596494674682617, -16.7489013671875, -15.901308059692383, -15.053715705871582, -14.206122398376465, -13.358529090881348, -12.510936737060547, -11.66334342956543, -10.815751075744629, -9.968157768249512, -9.120565414428711, -8.272972106933594, -7.425379276275635, -6.577786445617676, -5.730193614959717, -4.882600784301758, -4.035007476806641, -3.1874146461486816, -2.3398218154907227, -1.4922289848327637, -0.6446361541748047, 0.20295673608779907, 1.0505496263504028, 1.8981425762176514, 2.7457354068756104, 3.5933284759521484, 4.440921306610107, 5.288514137268066, 6.136106967926025, 6.983699798583984, 7.831292629241943, 8.678885459899902, 9.52647876739502, 10.37407112121582, 11.221664428710938, 12.069257736206055, 12.916850090026855, 13.764443397521973, 14.612035751342773, 15.45962905883789, 16.307222366333008, 17.154815673828125, 18.00240707397461, 18.850000381469727, 19.697593688964844, 20.54518699645996, 21.392780303955078, 22.240371704101562, 23.08796501159668, 23.935558319091797, 24.783151626586914, 25.63074493408203, 26.478336334228516]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 1.0, 4.0, 6.0, 8.0, 9.0, 10.0, 10.0, 19.0, 14.0, 13.0, 30.0, 23.0, 27.0, 32.0, 40.0, 44.0, 33.0, 38.0, 47.0, 43.0, 50.0, 37.0, 42.0, 42.0, 36.0, 43.0, 43.0, 31.0, 26.0, 35.0, 29.0, 21.0, 22.0, 26.0, 10.0, 13.0, 8.0, 11.0, 3.0, 7.0, 6.0, 1.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.27320671081543, -28.30241584777832, -27.33162498474121, -26.3608341217041, -25.390043258666992, -24.419252395629883, -23.448461532592773, -22.477670669555664, -21.506879806518555, -20.536088943481445, -19.565298080444336, -18.594507217407227, -17.623716354370117, -16.652925491333008, -15.682134628295898, -14.711343765258789, -13.74055290222168, -12.76976203918457, -11.798971176147461, -10.828180313110352, -9.857389450073242, -8.886598587036133, -7.915807723999023, -6.945016860961914, -5.974225997924805, -5.003435134887695, -4.032644271850586, -3.0618534088134766, -2.091062545776367, -1.1202716827392578, -0.14948081970214844, 0.8213100433349609, 1.7921028137207031, 2.7628936767578125, 3.733684539794922, 4.704475402832031, 5.675266265869141, 6.64605712890625, 7.616847991943359, 8.587638854980469, 9.558429718017578, 10.529220581054688, 11.500011444091797, 12.470802307128906, 13.441593170166016, 14.412384033203125, 15.383174896240234, 16.353965759277344, 17.324756622314453, 18.295547485351562, 19.266338348388672, 20.23712921142578, 21.20792007446289, 22.1787109375, 23.14950180053711, 24.12029266357422, 25.091083526611328, 26.061874389648438, 27.032665252685547, 28.003456115722656, 28.974246978759766, 29.945037841796875, 30.915828704833984, 31.886619567871094, 32.8574104309082]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 5.0, 11.0, 10.0, 13.0, 19.0, 38.0, 49.0, 77.0, 135.0, 181.0, 272.0, 415.0, 632.0, 992.0, 1588.0, 2411.0, 3747.0, 5593.0, 8448.0, 12401.0, 18197.0, 26233.0, 36433.0, 48948.0, 62993.0, 76365.0, 89038.0, 97186.0, 99138.0, 94673.0, 85237.0, 71749.0, 57663.0, 44059.0, 32208.0, 23108.0, 16168.0, 10987.0, 7291.0, 4726.0, 3162.0, 2077.0, 1347.0, 913.0, 577.0, 359.0, 241.0, 173.0, 113.0, 71.0, 41.0, 16.0, 14.0, 8.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-11.7109375, -11.3370361328125, -10.963134765625, -10.5892333984375, -10.21533203125, -9.8414306640625, -9.467529296875, -9.0936279296875, -8.7197265625, -8.3458251953125, -7.971923828125, -7.5980224609375, -7.22412109375, -6.8502197265625, -6.476318359375, -6.1024169921875, -5.728515625, -5.3546142578125, -4.980712890625, -4.6068115234375, -4.23291015625, -3.8590087890625, -3.485107421875, -3.1112060546875, -2.7373046875, -2.3634033203125, -1.989501953125, -1.6156005859375, -1.24169921875, -0.8677978515625, -0.493896484375, -0.1199951171875, 0.25390625, 0.6278076171875, 1.001708984375, 1.3756103515625, 1.74951171875, 2.1234130859375, 2.497314453125, 2.8712158203125, 3.2451171875, 3.6190185546875, 3.992919921875, 4.3668212890625, 4.74072265625, 5.1146240234375, 5.488525390625, 5.8624267578125, 6.236328125, 6.6102294921875, 6.984130859375, 7.3580322265625, 7.73193359375, 8.1058349609375, 8.479736328125, 8.8536376953125, 9.2275390625, 9.6014404296875, 9.975341796875, 10.3492431640625, 10.72314453125, 11.0970458984375, 11.470947265625, 11.8448486328125, 12.21875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 2.0, 9.0, 9.0, 10.0, 12.0, 15.0, 14.0, 17.0, 19.0, 26.0, 32.0, 36.0, 37.0, 38.0, 37.0, 40.0, 45.0, 42.0, 59.0, 41.0, 40.0, 31.0, 42.0, 41.0, 42.0, 37.0, 24.0, 37.0, 22.0, 25.0, 22.0, 20.0, 13.0, 11.0, 10.0, 8.0, 8.0, 6.0, 4.0, 2.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.609375, -28.624267578125, -27.63916015625, -26.654052734375, -25.6689453125, -24.683837890625, -23.69873046875, -22.713623046875, -21.728515625, -20.743408203125, -19.75830078125, -18.773193359375, -17.7880859375, -16.802978515625, -15.81787109375, -14.832763671875, -13.84765625, -12.862548828125, -11.87744140625, -10.892333984375, -9.9072265625, -8.922119140625, -7.93701171875, -6.951904296875, -5.966796875, -4.981689453125, -3.99658203125, -3.011474609375, -2.0263671875, -1.041259765625, -0.05615234375, 0.928955078125, 1.9140625, 2.899169921875, 3.88427734375, 4.869384765625, 5.8544921875, 6.839599609375, 7.82470703125, 8.809814453125, 9.794921875, 10.780029296875, 11.76513671875, 12.750244140625, 13.7353515625, 14.720458984375, 15.70556640625, 16.690673828125, 17.67578125, 18.660888671875, 19.64599609375, 20.631103515625, 21.6162109375, 22.601318359375, 23.58642578125, 24.571533203125, 25.556640625, 26.541748046875, 27.52685546875, 28.511962890625, 29.4970703125, 30.482177734375, 31.46728515625, 32.452392578125, 33.4375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 11.0, 17.0, 36.0, 34.0, 41.0, 63.0, 96.0, 142.0, 202.0, 287.0, 484.0, 678.0, 1022.0, 1555.0, 2320.0, 3403.0, 5215.0, 7754.0, 11475.0, 17832.0, 28782.0, 222954.0, 647239.0, 36159.0, 20589.0, 13375.0, 8776.0, 5989.0, 3947.0, 2708.0, 1785.0, 1205.0, 778.0, 484.0, 341.0, 251.0, 174.0, 124.0, 74.0, 46.0, 41.0, 27.0, 20.0, 13.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.703125, -23.856201171875, -23.00927734375, -22.162353515625, -21.3154296875, -20.468505859375, -19.62158203125, -18.774658203125, -17.927734375, -17.080810546875, -16.23388671875, -15.386962890625, -14.5400390625, -13.693115234375, -12.84619140625, -11.999267578125, -11.15234375, -10.305419921875, -9.45849609375, -8.611572265625, -7.7646484375, -6.917724609375, -6.07080078125, -5.223876953125, -4.376953125, -3.530029296875, -2.68310546875, -1.836181640625, -0.9892578125, -0.142333984375, 0.70458984375, 1.551513671875, 2.3984375, 3.245361328125, 4.09228515625, 4.939208984375, 5.7861328125, 6.633056640625, 7.47998046875, 8.326904296875, 9.173828125, 10.020751953125, 10.86767578125, 11.714599609375, 12.5615234375, 13.408447265625, 14.25537109375, 15.102294921875, 15.94921875, 16.796142578125, 17.64306640625, 18.489990234375, 19.3369140625, 20.183837890625, 21.03076171875, 21.877685546875, 22.724609375, 23.571533203125, 24.41845703125, 25.265380859375, 26.1123046875, 26.959228515625, 27.80615234375, 28.653076171875, 29.5]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 10.0, 6.0, 12.0, 10.0, 16.0, 13.0, 19.0, 28.0, 21.0, 19.0, 29.0, 24.0, 46.0, 42.0, 41.0, 39.0, 30.0, 44.0, 33.0, 48.0, 39.0, 43.0, 40.0, 42.0, 40.0, 29.0, 26.0, 28.0, 25.0, 25.0, 26.0, 14.0, 14.0, 13.0, 10.0, 8.0, 10.0, 6.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.265625, -19.58837890625, -18.9111328125, -18.23388671875, -17.556640625, -16.87939453125, -16.2021484375, -15.52490234375, -14.84765625, -14.17041015625, -13.4931640625, -12.81591796875, -12.138671875, -11.46142578125, -10.7841796875, -10.10693359375, -9.4296875, -8.75244140625, -8.0751953125, -7.39794921875, -6.720703125, -6.04345703125, -5.3662109375, -4.68896484375, -4.01171875, -3.33447265625, -2.6572265625, -1.97998046875, -1.302734375, -0.62548828125, 0.0517578125, 0.72900390625, 1.40625, 2.08349609375, 2.7607421875, 3.43798828125, 4.115234375, 4.79248046875, 5.4697265625, 6.14697265625, 6.82421875, 7.50146484375, 8.1787109375, 8.85595703125, 9.533203125, 10.21044921875, 10.8876953125, 11.56494140625, 12.2421875, 12.91943359375, 13.5966796875, 14.27392578125, 14.951171875, 15.62841796875, 16.3056640625, 16.98291015625, 17.66015625, 18.33740234375, 19.0146484375, 19.69189453125, 20.369140625, 21.04638671875, 21.7236328125, 22.40087890625, 23.078125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 7.0, 11.0, 15.0, 23.0, 39.0, 57.0, 74.0, 98.0, 183.0, 246.0, 313.0, 468.0, 691.0, 990.0, 1502.0, 2331.0, 3406.0, 4989.0, 7671.0, 12044.0, 19632.0, 39954.0, 533336.0, 335929.0, 33845.0, 17852.0, 11138.0, 7319.0, 4715.0, 3057.0, 2152.0, 1420.0, 957.0, 647.0, 421.0, 325.0, 228.0, 127.0, 104.0, 78.0, 52.0, 39.0, 20.0, 15.0, 12.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.298828125, -2.231048583984375, -2.16326904296875, -2.095489501953125, -2.0277099609375, -1.959930419921875, -1.89215087890625, -1.824371337890625, -1.756591796875, -1.688812255859375, -1.62103271484375, -1.553253173828125, -1.4854736328125, -1.417694091796875, -1.34991455078125, -1.282135009765625, -1.21435546875, -1.146575927734375, -1.07879638671875, -1.011016845703125, -0.9432373046875, -0.875457763671875, -0.80767822265625, -0.739898681640625, -0.672119140625, -0.604339599609375, -0.53656005859375, -0.468780517578125, -0.4010009765625, -0.333221435546875, -0.26544189453125, -0.197662353515625, -0.1298828125, -0.062103271484375, 0.00567626953125, 0.073455810546875, 0.1412353515625, 0.209014892578125, 0.27679443359375, 0.344573974609375, 0.412353515625, 0.480133056640625, 0.54791259765625, 0.615692138671875, 0.6834716796875, 0.751251220703125, 0.81903076171875, 0.886810302734375, 0.95458984375, 1.022369384765625, 1.09014892578125, 1.157928466796875, 1.2257080078125, 1.293487548828125, 1.36126708984375, 1.429046630859375, 1.496826171875, 1.564605712890625, 1.63238525390625, 1.700164794921875, 1.7679443359375, 1.835723876953125, 1.90350341796875, 1.971282958984375, 2.0390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 8.0, 8.0, 7.0, 10.0, 14.0, 22.0, 18.0, 32.0, 46.0, 36.0, 52.0, 67.0, 53.0, 74.0, 68.0, 61.0, 65.0, 57.0, 56.0, 62.0, 34.0, 38.0, 25.0, 23.0, 21.0, 12.0, 7.0, 2.0, 3.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007786750793457031, -0.0007539913058280945, -0.0007293075323104858, -0.0007046237587928772, -0.0006799399852752686, -0.0006552562117576599, -0.0006305724382400513, -0.0006058886647224426, -0.000581204891204834, -0.0005565211176872253, -0.0005318373441696167, -0.0005071535706520081, -0.0004824697971343994, -0.00045778602361679077, -0.00043310225009918213, -0.0004084184765815735, -0.00038373470306396484, -0.0003590509295463562, -0.00033436715602874756, -0.0003096833825111389, -0.0002849996089935303, -0.00026031583547592163, -0.000235632061958313, -0.00021094828844070435, -0.0001862645149230957, -0.00016158074140548706, -0.00013689696788787842, -0.00011221319437026978, -8.752942085266113e-05, -6.284564733505249e-05, -3.816187381744385e-05, -1.3478100299835205e-05, 1.1205673217773438e-05, 3.588944673538208e-05, 6.057322025299072e-05, 8.525699377059937e-05, 0.00010994076728820801, 0.00013462454080581665, 0.0001593083143234253, 0.00018399208784103394, 0.00020867586135864258, 0.00023335963487625122, 0.00025804340839385986, 0.0002827271819114685, 0.00030741095542907715, 0.0003320947289466858, 0.00035677850246429443, 0.0003814622759819031, 0.0004061460494995117, 0.00043082982301712036, 0.000455513596534729, 0.00048019737005233765, 0.0005048811435699463, 0.0005295649170875549, 0.0005542486906051636, 0.0005789324641227722, 0.0006036162376403809, 0.0006283000111579895, 0.0006529837846755981, 0.0006776675581932068, 0.0007023513317108154, 0.0007270351052284241, 0.0007517188787460327, 0.0007764026522636414, 0.00080108642578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 12.0, 25.0, 40.0, 50.0, 63.0, 127.0, 176.0, 288.0, 454.0, 690.0, 1063.0, 1716.0, 2656.0, 4320.0, 6824.0, 10951.0, 18351.0, 30795.0, 51046.0, 82249.0, 119914.0, 152483.0, 159828.0, 138109.0, 100530.0, 65255.0, 39623.0, 23569.0, 14038.0, 8737.0, 5337.0, 3340.0, 2122.0, 1293.0, 894.0, 591.0, 333.0, 213.0, 137.0, 118.0, 54.0, 50.0, 22.0, 22.0, 11.0, 6.0, 2.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.09375, -1.058746337890625, -1.02374267578125, -0.988739013671875, -0.9537353515625, -0.918731689453125, -0.88372802734375, -0.848724365234375, -0.813720703125, -0.778717041015625, -0.74371337890625, -0.708709716796875, -0.6737060546875, -0.638702392578125, -0.60369873046875, -0.568695068359375, -0.53369140625, -0.498687744140625, -0.46368408203125, -0.428680419921875, -0.3936767578125, -0.358673095703125, -0.32366943359375, -0.288665771484375, -0.253662109375, -0.218658447265625, -0.18365478515625, -0.148651123046875, -0.1136474609375, -0.078643798828125, -0.04364013671875, -0.008636474609375, 0.0263671875, 0.061370849609375, 0.09637451171875, 0.131378173828125, 0.1663818359375, 0.201385498046875, 0.23638916015625, 0.271392822265625, 0.306396484375, 0.341400146484375, 0.37640380859375, 0.411407470703125, 0.4464111328125, 0.481414794921875, 0.51641845703125, 0.551422119140625, 0.58642578125, 0.621429443359375, 0.65643310546875, 0.691436767578125, 0.7264404296875, 0.761444091796875, 0.79644775390625, 0.831451416015625, 0.866455078125, 0.901458740234375, 0.93646240234375, 0.971466064453125, 1.0064697265625, 1.041473388671875, 1.07647705078125, 1.111480712890625, 1.146484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 4.0, 11.0, 12.0, 12.0, 11.0, 19.0, 20.0, 19.0, 37.0, 50.0, 42.0, 60.0, 57.0, 79.0, 82.0, 66.0, 76.0, 67.0, 41.0, 42.0, 36.0, 43.0, 28.0, 17.0, 13.0, 10.0, 11.0, 6.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.54736328125, -0.5319862365722656, -0.5166091918945312, -0.5012321472167969, -0.4858551025390625, -0.4704780578613281, -0.45510101318359375, -0.4397239685058594, -0.424346923828125, -0.4089698791503906, -0.39359283447265625, -0.3782157897949219, -0.3628387451171875, -0.3474617004394531, -0.33208465576171875, -0.3167076110839844, -0.30133056640625, -0.2859535217285156, -0.27057647705078125, -0.2551994323730469, -0.2398223876953125, -0.22444534301757812, -0.20906829833984375, -0.19369125366210938, -0.178314208984375, -0.16293716430664062, -0.14756011962890625, -0.13218307495117188, -0.1168060302734375, -0.10142898559570312, -0.08605194091796875, -0.07067489624023438, -0.0552978515625, -0.039920806884765625, -0.02454376220703125, -0.009166717529296875, 0.0062103271484375, 0.021587371826171875, 0.03696441650390625, 0.052341461181640625, 0.067718505859375, 0.08309555053710938, 0.09847259521484375, 0.11384963989257812, 0.1292266845703125, 0.14460372924804688, 0.15998077392578125, 0.17535781860351562, 0.19073486328125, 0.20611190795898438, 0.22148895263671875, 0.23686599731445312, 0.2522430419921875, 0.2676200866699219, 0.28299713134765625, 0.2983741760253906, 0.313751220703125, 0.3291282653808594, 0.34450531005859375, 0.3598823547363281, 0.3752593994140625, 0.3906364440917969, 0.40601348876953125, 0.4213905334472656, 0.436767578125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 8.0, 4.0, 2.0, 7.0, 9.0, 17.0, 12.0, 14.0, 22.0, 20.0, 30.0, 24.0, 26.0, 37.0, 37.0, 34.0, 32.0, 36.0, 38.0, 49.0, 41.0, 41.0, 43.0, 44.0, 39.0, 37.0, 35.0, 28.0, 39.0, 29.0, 27.0, 24.0, 22.0, 12.0, 14.0, 13.0, 9.0, 6.0, 9.0, 5.0, 5.0, 10.0, 4.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-28.42294692993164, -27.53778076171875, -26.65261459350586, -25.76744842529297, -24.882282257080078, -23.997116088867188, -23.111949920654297, -22.226783752441406, -21.341617584228516, -20.456451416015625, -19.571285247802734, -18.686119079589844, -17.800952911376953, -16.915786743164062, -16.030620574951172, -15.145454406738281, -14.26028823852539, -13.3751220703125, -12.48995590209961, -11.604789733886719, -10.719623565673828, -9.834457397460938, -8.949291229248047, -8.064125061035156, -7.178958892822266, -6.293792724609375, -5.408626556396484, -4.523460388183594, -3.638294219970703, -2.7531280517578125, -1.8679618835449219, -0.9827957153320312, -0.09762954711914062, 0.78753662109375, 1.6727027893066406, 2.5578689575195312, 3.443035125732422, 4.3282012939453125, 5.213367462158203, 6.098533630371094, 6.983699798583984, 7.868865966796875, 8.754032135009766, 9.639198303222656, 10.524364471435547, 11.409530639648438, 12.294696807861328, 13.179862976074219, 14.06502914428711, 14.9501953125, 15.83536148071289, 16.72052764892578, 17.605693817138672, 18.490859985351562, 19.376026153564453, 20.261192321777344, 21.146358489990234, 22.031524658203125, 22.916690826416016, 23.801856994628906, 24.687023162841797, 25.572189331054688, 26.457355499267578, 27.34252166748047, 28.22768783569336]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 3.0, 7.0, 6.0, 8.0, 15.0, 9.0, 18.0, 11.0, 18.0, 25.0, 26.0, 28.0, 45.0, 37.0, 38.0, 34.0, 39.0, 41.0, 54.0, 47.0, 38.0, 40.0, 32.0, 44.0, 36.0, 45.0, 33.0, 34.0, 21.0, 29.0, 24.0, 19.0, 21.0, 16.0, 10.0, 8.0, 7.0, 9.0, 4.0, 6.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.991809844970703, -28.021595001220703, -27.05137825012207, -26.08116340637207, -25.11094856262207, -24.140731811523438, -23.170516967773438, -22.200302124023438, -21.230087280273438, -20.259872436523438, -19.289655685424805, -18.319440841674805, -17.349225997924805, -16.379009246826172, -15.408794403076172, -14.438579559326172, -13.468363761901855, -12.498147964477539, -11.527933120727539, -10.557717323303223, -9.587502479553223, -8.617286682128906, -7.647071361541748, -6.67685604095459, -5.706640720367432, -4.736425399780273, -3.7662100791931152, -2.795994520187378, -1.8257791996002197, -0.8555636405944824, 0.11465167999267578, 1.084867000579834, 2.055082321166992, 3.0252976417541504, 3.9955129623413086, 4.965728759765625, 5.935943603515625, 6.906159400939941, 7.8763747215271, 8.846590042114258, 9.816804885864258, 10.787020683288574, 11.757235527038574, 12.72745132446289, 13.69766616821289, 14.667881965637207, 15.638097763061523, 16.608312606811523, 17.578529357910156, 18.548744201660156, 19.51896095275879, 20.48917579650879, 21.45939064025879, 22.429607391357422, 23.399822235107422, 24.370037078857422, 25.340251922607422, 26.310466766357422, 27.280683517456055, 28.250898361206055, 29.221113204956055, 30.191329956054688, 31.161544799804688, 32.13175964355469, 33.10197448730469]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 2.0, 13.0, 14.0, 27.0, 47.0, 70.0, 82.0, 134.0, 194.0, 318.0, 505.0, 824.0, 1304.0, 2279.0, 3598.0, 6395.0, 10563.0, 17569.0, 28438.0, 43827.0, 65573.0, 89347.0, 113194.0, 129325.0, 130132.0, 116772.0, 93695.0, 69043.0, 47045.0, 30310.0, 18891.0, 11273.0, 7062.0, 4111.0, 2570.0, 1477.0, 957.0, 545.0, 343.0, 260.0, 150.0, 85.0, 67.0, 40.0, 28.0, 16.0, 17.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0], "bins": [-28.0, -27.178466796875, -26.35693359375, -25.535400390625, -24.7138671875, -23.892333984375, -23.07080078125, -22.249267578125, -21.427734375, -20.606201171875, -19.78466796875, -18.963134765625, -18.1416015625, -17.320068359375, -16.49853515625, -15.677001953125, -14.85546875, -14.033935546875, -13.21240234375, -12.390869140625, -11.5693359375, -10.747802734375, -9.92626953125, -9.104736328125, -8.283203125, -7.461669921875, -6.64013671875, -5.818603515625, -4.9970703125, -4.175537109375, -3.35400390625, -2.532470703125, -1.7109375, -0.889404296875, -0.06787109375, 0.753662109375, 1.5751953125, 2.396728515625, 3.21826171875, 4.039794921875, 4.861328125, 5.682861328125, 6.50439453125, 7.325927734375, 8.1474609375, 8.968994140625, 9.79052734375, 10.612060546875, 11.43359375, 12.255126953125, 13.07666015625, 13.898193359375, 14.7197265625, 15.541259765625, 16.36279296875, 17.184326171875, 18.005859375, 18.827392578125, 19.64892578125, 20.470458984375, 21.2919921875, 22.113525390625, 22.93505859375, 23.756591796875, 24.578125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 7.0, 9.0, 9.0, 7.0, 19.0, 19.0, 13.0, 21.0, 25.0, 33.0, 33.0, 36.0, 37.0, 35.0, 34.0, 48.0, 38.0, 49.0, 42.0, 38.0, 40.0, 40.0, 38.0, 41.0, 37.0, 31.0, 29.0, 28.0, 28.0, 17.0, 26.0, 15.0, 15.0, 10.0, 10.0, 8.0, 3.0, 5.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.296875, -26.39892578125, -25.5009765625, -24.60302734375, -23.705078125, -22.80712890625, -21.9091796875, -21.01123046875, -20.11328125, -19.21533203125, -18.3173828125, -17.41943359375, -16.521484375, -15.62353515625, -14.7255859375, -13.82763671875, -12.9296875, -12.03173828125, -11.1337890625, -10.23583984375, -9.337890625, -8.43994140625, -7.5419921875, -6.64404296875, -5.74609375, -4.84814453125, -3.9501953125, -3.05224609375, -2.154296875, -1.25634765625, -0.3583984375, 0.53955078125, 1.4375, 2.33544921875, 3.2333984375, 4.13134765625, 5.029296875, 5.92724609375, 6.8251953125, 7.72314453125, 8.62109375, 9.51904296875, 10.4169921875, 11.31494140625, 12.212890625, 13.11083984375, 14.0087890625, 14.90673828125, 15.8046875, 16.70263671875, 17.6005859375, 18.49853515625, 19.396484375, 20.29443359375, 21.1923828125, 22.09033203125, 22.98828125, 23.88623046875, 24.7841796875, 25.68212890625, 26.580078125, 27.47802734375, 28.3759765625, 29.27392578125, 30.171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 14.0, 19.0, 25.0, 32.0, 54.0, 55.0, 125.0, 146.0, 261.0, 430.0, 604.0, 970.0, 1529.0, 2575.0, 4091.0, 6296.0, 10422.0, 16760.0, 26510.0, 40557.0, 60309.0, 83426.0, 106841.0, 124626.0, 128980.0, 118153.0, 97888.0, 73185.0, 51217.0, 34065.0, 21876.0, 13838.0, 8447.0, 5310.0, 3283.0, 2061.0, 1275.0, 794.0, 505.0, 335.0, 229.0, 148.0, 86.0, 69.0, 34.0, 32.0, 23.0, 16.0, 13.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-27.90625, -27.0419921875, -26.177734375, -25.3134765625, -24.44921875, -23.5849609375, -22.720703125, -21.8564453125, -20.9921875, -20.1279296875, -19.263671875, -18.3994140625, -17.53515625, -16.6708984375, -15.806640625, -14.9423828125, -14.078125, -13.2138671875, -12.349609375, -11.4853515625, -10.62109375, -9.7568359375, -8.892578125, -8.0283203125, -7.1640625, -6.2998046875, -5.435546875, -4.5712890625, -3.70703125, -2.8427734375, -1.978515625, -1.1142578125, -0.25, 0.6142578125, 1.478515625, 2.3427734375, 3.20703125, 4.0712890625, 4.935546875, 5.7998046875, 6.6640625, 7.5283203125, 8.392578125, 9.2568359375, 10.12109375, 10.9853515625, 11.849609375, 12.7138671875, 13.578125, 14.4423828125, 15.306640625, 16.1708984375, 17.03515625, 17.8994140625, 18.763671875, 19.6279296875, 20.4921875, 21.3564453125, 22.220703125, 23.0849609375, 23.94921875, 24.8134765625, 25.677734375, 26.5419921875, 27.40625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 8.0, 8.0, 3.0, 5.0, 9.0, 9.0, 10.0, 8.0, 8.0, 21.0, 19.0, 17.0, 29.0, 24.0, 31.0, 34.0, 34.0, 32.0, 37.0, 37.0, 36.0, 31.0, 35.0, 38.0, 37.0, 39.0, 40.0, 29.0, 39.0, 27.0, 38.0, 31.0, 25.0, 22.0, 16.0, 19.0, 15.0, 19.0, 14.0, 11.0, 13.0, 11.0, 10.0, 7.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0], "bins": [-16.75, -16.22802734375, -15.7060546875, -15.18408203125, -14.662109375, -14.14013671875, -13.6181640625, -13.09619140625, -12.57421875, -12.05224609375, -11.5302734375, -11.00830078125, -10.486328125, -9.96435546875, -9.4423828125, -8.92041015625, -8.3984375, -7.87646484375, -7.3544921875, -6.83251953125, -6.310546875, -5.78857421875, -5.2666015625, -4.74462890625, -4.22265625, -3.70068359375, -3.1787109375, -2.65673828125, -2.134765625, -1.61279296875, -1.0908203125, -0.56884765625, -0.046875, 0.47509765625, 0.9970703125, 1.51904296875, 2.041015625, 2.56298828125, 3.0849609375, 3.60693359375, 4.12890625, 4.65087890625, 5.1728515625, 5.69482421875, 6.216796875, 6.73876953125, 7.2607421875, 7.78271484375, 8.3046875, 8.82666015625, 9.3486328125, 9.87060546875, 10.392578125, 10.91455078125, 11.4365234375, 11.95849609375, 12.48046875, 13.00244140625, 13.5244140625, 14.04638671875, 14.568359375, 15.09033203125, 15.6123046875, 16.13427734375, 16.65625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 9.0, 6.0, 9.0, 35.0, 41.0, 58.0, 96.0, 179.0, 325.0, 520.0, 918.0, 1613.0, 3051.0, 5992.0, 11286.0, 21632.0, 41844.0, 77068.0, 128370.0, 177132.0, 190317.0, 157766.0, 104455.0, 59905.0, 31452.0, 16165.0, 8446.0, 4486.0, 2415.0, 1250.0, 693.0, 411.0, 244.0, 140.0, 80.0, 57.0, 33.0, 16.0, 11.0, 7.0, 5.0, 7.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6484375, -11.28759765625, -10.9267578125, -10.56591796875, -10.205078125, -9.84423828125, -9.4833984375, -9.12255859375, -8.76171875, -8.40087890625, -8.0400390625, -7.67919921875, -7.318359375, -6.95751953125, -6.5966796875, -6.23583984375, -5.875, -5.51416015625, -5.1533203125, -4.79248046875, -4.431640625, -4.07080078125, -3.7099609375, -3.34912109375, -2.98828125, -2.62744140625, -2.2666015625, -1.90576171875, -1.544921875, -1.18408203125, -0.8232421875, -0.46240234375, -0.1015625, 0.25927734375, 0.6201171875, 0.98095703125, 1.341796875, 1.70263671875, 2.0634765625, 2.42431640625, 2.78515625, 3.14599609375, 3.5068359375, 3.86767578125, 4.228515625, 4.58935546875, 4.9501953125, 5.31103515625, 5.671875, 6.03271484375, 6.3935546875, 6.75439453125, 7.115234375, 7.47607421875, 7.8369140625, 8.19775390625, 8.55859375, 8.91943359375, 9.2802734375, 9.64111328125, 10.001953125, 10.36279296875, 10.7236328125, 11.08447265625, 11.4453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 4.0, 7.0, 9.0, 12.0, 22.0, 23.0, 22.0, 30.0, 36.0, 46.0, 49.0, 61.0, 62.0, 60.0, 69.0, 70.0, 60.0, 65.0, 53.0, 48.0, 52.0, 24.0, 22.0, 26.0, 11.0, 16.0, 12.0, 11.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010309219360351562, -0.000993773341178894, -0.0009566247463226318, -0.0009194761514663696, -0.0008823275566101074, -0.0008451789617538452, -0.000808030366897583, -0.0007708817720413208, -0.0007337331771850586, -0.0006965845823287964, -0.0006594359874725342, -0.000622287392616272, -0.0005851387977600098, -0.0005479902029037476, -0.0005108416080474854, -0.00047369301319122314, -0.00043654441833496094, -0.00039939582347869873, -0.0003622472286224365, -0.0003250986337661743, -0.0002879500389099121, -0.0002508014440536499, -0.0002136528491973877, -0.0001765042543411255, -0.00013935565948486328, -0.00010220706462860107, -6.505846977233887e-05, -2.790987491607666e-05, 9.238719940185547e-06, 4.6387314796447754e-05, 8.353590965270996e-05, 0.00012068450450897217, 0.00015783309936523438, 0.00019498169422149658, 0.0002321302890777588, 0.000269278883934021, 0.0003064274787902832, 0.0003435760736465454, 0.0003807246685028076, 0.0004178732633590698, 0.00045502185821533203, 0.0004921704530715942, 0.0005293190479278564, 0.0005664676427841187, 0.0006036162376403809, 0.0006407648324966431, 0.0006779134273529053, 0.0007150620222091675, 0.0007522106170654297, 0.0007893592119216919, 0.0008265078067779541, 0.0008636564016342163, 0.0009008049964904785, 0.0009379535913467407, 0.0009751021862030029, 0.0010122507810592651, 0.0010493993759155273, 0.0010865479707717896, 0.0011236965656280518, 0.001160845160484314, 0.0011979937553405762, 0.0012351423501968384, 0.0012722909450531006, 0.0013094395399093628, 0.001346588134765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 15.0, 17.0, 17.0, 31.0, 35.0, 58.0, 95.0, 109.0, 181.0, 225.0, 375.0, 516.0, 803.0, 1302.0, 1987.0, 3101.0, 5144.0, 8441.0, 13692.0, 22152.0, 35510.0, 54679.0, 78506.0, 105706.0, 126267.0, 134888.0, 126456.0, 104996.0, 77970.0, 53764.0, 34498.0, 21726.0, 13470.0, 8065.0, 5013.0, 3120.0, 1910.0, 1236.0, 811.0, 538.0, 371.0, 250.0, 173.0, 113.0, 83.0, 48.0, 30.0, 24.0, 13.0, 15.0, 9.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.75, -7.4957275390625, -7.241455078125, -6.9871826171875, -6.73291015625, -6.4786376953125, -6.224365234375, -5.9700927734375, -5.7158203125, -5.4615478515625, -5.207275390625, -4.9530029296875, -4.69873046875, -4.4444580078125, -4.190185546875, -3.9359130859375, -3.681640625, -3.4273681640625, -3.173095703125, -2.9188232421875, -2.66455078125, -2.4102783203125, -2.156005859375, -1.9017333984375, -1.6474609375, -1.3931884765625, -1.138916015625, -0.8846435546875, -0.63037109375, -0.3760986328125, -0.121826171875, 0.1324462890625, 0.38671875, 0.6409912109375, 0.895263671875, 1.1495361328125, 1.40380859375, 1.6580810546875, 1.912353515625, 2.1666259765625, 2.4208984375, 2.6751708984375, 2.929443359375, 3.1837158203125, 3.43798828125, 3.6922607421875, 3.946533203125, 4.2008056640625, 4.455078125, 4.7093505859375, 4.963623046875, 5.2178955078125, 5.47216796875, 5.7264404296875, 5.980712890625, 6.2349853515625, 6.4892578125, 6.7435302734375, 6.997802734375, 7.2520751953125, 7.50634765625, 7.7606201171875, 8.014892578125, 8.2691650390625, 8.5234375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 0.0, 11.0, 17.0, 19.0, 34.0, 28.0, 28.0, 49.0, 38.0, 50.0, 58.0, 77.0, 80.0, 57.0, 59.0, 60.0, 48.0, 63.0, 42.0, 40.0, 15.0, 28.0, 20.0, 15.0, 17.0, 7.0, 8.0, 7.0, 6.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.322265625, -3.191192626953125, -3.06011962890625, -2.929046630859375, -2.7979736328125, -2.666900634765625, -2.53582763671875, -2.404754638671875, -2.273681640625, -2.142608642578125, -2.01153564453125, -1.880462646484375, -1.7493896484375, -1.618316650390625, -1.48724365234375, -1.356170654296875, -1.22509765625, -1.094024658203125, -0.96295166015625, -0.831878662109375, -0.7008056640625, -0.569732666015625, -0.43865966796875, -0.307586669921875, -0.176513671875, -0.045440673828125, 0.08563232421875, 0.216705322265625, 0.3477783203125, 0.478851318359375, 0.60992431640625, 0.740997314453125, 0.8720703125, 1.003143310546875, 1.13421630859375, 1.265289306640625, 1.3963623046875, 1.527435302734375, 1.65850830078125, 1.789581298828125, 1.920654296875, 2.051727294921875, 2.18280029296875, 2.313873291015625, 2.4449462890625, 2.576019287109375, 2.70709228515625, 2.838165283203125, 2.96923828125, 3.100311279296875, 3.23138427734375, 3.362457275390625, 3.4935302734375, 3.624603271484375, 3.75567626953125, 3.886749267578125, 4.017822265625, 4.148895263671875, 4.27996826171875, 4.411041259765625, 4.5421142578125, 4.673187255859375, 4.80426025390625, 4.935333251953125, 5.06640625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 12.0, 6.0, 9.0, 12.0, 10.0, 12.0, 19.0, 14.0, 19.0, 22.0, 30.0, 33.0, 31.0, 25.0, 28.0, 41.0, 30.0, 30.0, 39.0, 45.0, 35.0, 51.0, 39.0, 35.0, 29.0, 30.0, 32.0, 27.0, 32.0, 25.0, 30.0, 22.0, 23.0, 14.0, 14.0, 12.0, 12.0, 15.0, 10.0, 7.0, 5.0, 3.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-24.755844116210938, -23.971595764160156, -23.187349319458008, -22.403100967407227, -21.618854522705078, -20.834606170654297, -20.05035972595215, -19.266111373901367, -18.48186492919922, -17.697616577148438, -16.91337013244629, -16.129121780395508, -15.34487533569336, -14.560627937316895, -13.77638053894043, -12.992132186889648, -12.207884788513184, -11.423637390136719, -10.639389991760254, -9.855142593383789, -9.070895195007324, -8.28664779663086, -7.502399921417236, -6.7181525230407715, -5.933905124664307, -5.149657726287842, -4.365410327911377, -3.581162691116333, -2.796915292739868, -2.0126678943634033, -1.2284202575683594, -0.44417285919189453, 0.3400745391845703, 1.1243219375610352, 1.9085694551467896, 2.692816972732544, 3.477064371109009, 4.2613115310668945, 5.045559406280518, 5.829806804656982, 6.614054203033447, 7.398301601409912, 8.182549476623535, 8.966796875, 9.751044273376465, 10.53529167175293, 11.319539070129395, 12.10378646850586, 12.888033866882324, 13.672281265258789, 14.456528663635254, 15.240776062011719, 16.0250244140625, 16.80927085876465, 17.59351921081543, 18.377765655517578, 19.16201400756836, 19.94626235961914, 20.73050880432129, 21.51475715637207, 22.29900360107422, 23.083251953125, 23.86749839782715, 24.65174674987793, 25.435993194580078]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 6.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 7.0, 11.0, 7.0, 9.0, 6.0, 14.0, 26.0, 36.0, 31.0, 21.0, 29.0, 34.0, 33.0, 41.0, 45.0, 46.0, 53.0, 34.0, 37.0, 42.0, 44.0, 42.0, 23.0, 34.0, 35.0, 37.0, 25.0, 30.0, 24.0, 26.0, 11.0, 14.0, 6.0, 15.0, 13.0, 9.0, 9.0, 7.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.704984664916992, -25.78809356689453, -24.871200561523438, -23.954309463500977, -23.037416458129883, -22.120525360107422, -21.203632354736328, -20.286741256713867, -19.369850158691406, -18.452959060668945, -17.53606605529785, -16.61917495727539, -15.702281951904297, -14.785390853881836, -13.868498802185059, -12.951606750488281, -12.034713745117188, -11.11782169342041, -10.200929641723633, -9.284038543701172, -8.367145538330078, -7.450253963470459, -6.53336238861084, -5.6164703369140625, -4.699578285217285, -3.782686233520508, -2.8657944202423096, -1.9489026069641113, -1.032010555267334, -0.11511850357055664, 0.8017730712890625, 1.7186651229858398, 2.6355552673339844, 3.5524473190307617, 4.469339370727539, 5.386230945587158, 6.3031229972839355, 7.220015048980713, 8.136906623840332, 9.05379867553711, 9.970690727233887, 10.887582778930664, 11.804474830627441, 12.721366882324219, 13.63825798034668, 14.555150985717773, 15.472042083740234, 16.388935089111328, 17.30582618713379, 18.22271728515625, 19.139610290527344, 20.056501388549805, 20.9733943939209, 21.89028549194336, 22.807178497314453, 23.724069595336914, 24.640960693359375, 25.557851791381836, 26.47474479675293, 27.39163589477539, 28.308528900146484, 29.225419998168945, 30.142311096191406, 31.0592041015625, 31.976097106933594]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 7.0, 6.0, 18.0, 27.0, 43.0, 72.0, 166.0, 286.0, 457.0, 860.0, 1508.0, 2704.0, 4870.0, 8510.0, 14644.0, 25044.0, 42855.0, 71963.0, 117802.0, 188237.0, 286544.0, 403132.0, 514820.0, 570492.0, 546734.0, 455319.0, 336007.0, 228504.0, 146440.0, 91054.0, 55301.0, 33115.0, 19526.0, 11279.0, 6641.0, 3824.0, 2337.0, 1353.0, 771.0, 415.0, 263.0, 135.0, 85.0, 50.0, 34.0, 14.0, 10.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.453125, -21.61328125, -20.7734375, -19.93359375, -19.09375, -18.25390625, -17.4140625, -16.57421875, -15.734375, -14.89453125, -14.0546875, -13.21484375, -12.375, -11.53515625, -10.6953125, -9.85546875, -9.015625, -8.17578125, -7.3359375, -6.49609375, -5.65625, -4.81640625, -3.9765625, -3.13671875, -2.296875, -1.45703125, -0.6171875, 0.22265625, 1.0625, 1.90234375, 2.7421875, 3.58203125, 4.421875, 5.26171875, 6.1015625, 6.94140625, 7.78125, 8.62109375, 9.4609375, 10.30078125, 11.140625, 11.98046875, 12.8203125, 13.66015625, 14.5, 15.33984375, 16.1796875, 17.01953125, 17.859375, 18.69921875, 19.5390625, 20.37890625, 21.21875, 22.05859375, 22.8984375, 23.73828125, 24.578125, 25.41796875, 26.2578125, 27.09765625, 27.9375, 28.77734375, 29.6171875, 30.45703125, 31.296875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 3.0, 11.0, 10.0, 12.0, 7.0, 16.0, 19.0, 23.0, 28.0, 27.0, 31.0, 30.0, 31.0, 40.0, 37.0, 52.0, 43.0, 42.0, 42.0, 40.0, 35.0, 41.0, 34.0, 33.0, 34.0, 32.0, 32.0, 32.0, 21.0, 24.0, 19.0, 20.0, 6.0, 14.0, 12.0, 20.0, 6.0, 8.0, 3.0, 5.0, 2.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.546875, -21.762451171875, -20.97802734375, -20.193603515625, -19.4091796875, -18.624755859375, -17.84033203125, -17.055908203125, -16.271484375, -15.487060546875, -14.70263671875, -13.918212890625, -13.1337890625, -12.349365234375, -11.56494140625, -10.780517578125, -9.99609375, -9.211669921875, -8.42724609375, -7.642822265625, -6.8583984375, -6.073974609375, -5.28955078125, -4.505126953125, -3.720703125, -2.936279296875, -2.15185546875, -1.367431640625, -0.5830078125, 0.201416015625, 0.98583984375, 1.770263671875, 2.5546875, 3.339111328125, 4.12353515625, 4.907958984375, 5.6923828125, 6.476806640625, 7.26123046875, 8.045654296875, 8.830078125, 9.614501953125, 10.39892578125, 11.183349609375, 11.9677734375, 12.752197265625, 13.53662109375, 14.321044921875, 15.10546875, 15.889892578125, 16.67431640625, 17.458740234375, 18.2431640625, 19.027587890625, 19.81201171875, 20.596435546875, 21.380859375, 22.165283203125, 22.94970703125, 23.734130859375, 24.5185546875, 25.302978515625, 26.08740234375, 26.871826171875, 27.65625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 17.0, 22.0, 35.0, 69.0, 109.0, 168.0, 305.0, 513.0, 852.0, 1486.0, 2489.0, 4044.0, 6688.0, 10799.0, 17815.0, 28743.0, 45480.0, 70870.0, 108335.0, 159319.0, 226969.0, 303958.0, 382302.0, 446099.0, 471342.0, 453657.0, 396314.0, 320030.0, 240478.0, 170108.0, 116642.0, 77495.0, 49602.0, 31569.0, 19479.0, 11627.0, 7406.0, 4394.0, 2620.0, 1600.0, 979.0, 556.0, 362.0, 198.0, 123.0, 78.0, 56.0, 39.0, 23.0, 8.0, 7.0, 2.0, 1.0, 3.0, 3.0], "bins": [-25.1875, -24.437744140625, -23.68798828125, -22.938232421875, -22.1884765625, -21.438720703125, -20.68896484375, -19.939208984375, -19.189453125, -18.439697265625, -17.68994140625, -16.940185546875, -16.1904296875, -15.440673828125, -14.69091796875, -13.941162109375, -13.19140625, -12.441650390625, -11.69189453125, -10.942138671875, -10.1923828125, -9.442626953125, -8.69287109375, -7.943115234375, -7.193359375, -6.443603515625, -5.69384765625, -4.944091796875, -4.1943359375, -3.444580078125, -2.69482421875, -1.945068359375, -1.1953125, -0.445556640625, 0.30419921875, 1.053955078125, 1.8037109375, 2.553466796875, 3.30322265625, 4.052978515625, 4.802734375, 5.552490234375, 6.30224609375, 7.052001953125, 7.8017578125, 8.551513671875, 9.30126953125, 10.051025390625, 10.80078125, 11.550537109375, 12.30029296875, 13.050048828125, 13.7998046875, 14.549560546875, 15.29931640625, 16.049072265625, 16.798828125, 17.548583984375, 18.29833984375, 19.048095703125, 19.7978515625, 20.547607421875, 21.29736328125, 22.047119140625, 22.796875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 7.0, 12.0, 17.0, 28.0, 20.0, 39.0, 29.0, 39.0, 65.0, 74.0, 85.0, 107.0, 99.0, 120.0, 157.0, 172.0, 167.0, 191.0, 208.0, 228.0, 207.0, 211.0, 203.0, 191.0, 194.0, 174.0, 158.0, 139.0, 129.0, 115.0, 97.0, 79.0, 61.0, 44.0, 36.0, 35.0, 31.0, 26.0, 21.0, 17.0, 13.0, 7.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-12.5703125, -12.184326171875, -11.79833984375, -11.412353515625, -11.0263671875, -10.640380859375, -10.25439453125, -9.868408203125, -9.482421875, -9.096435546875, -8.71044921875, -8.324462890625, -7.9384765625, -7.552490234375, -7.16650390625, -6.780517578125, -6.39453125, -6.008544921875, -5.62255859375, -5.236572265625, -4.8505859375, -4.464599609375, -4.07861328125, -3.692626953125, -3.306640625, -2.920654296875, -2.53466796875, -2.148681640625, -1.7626953125, -1.376708984375, -0.99072265625, -0.604736328125, -0.21875, 0.167236328125, 0.55322265625, 0.939208984375, 1.3251953125, 1.711181640625, 2.09716796875, 2.483154296875, 2.869140625, 3.255126953125, 3.64111328125, 4.027099609375, 4.4130859375, 4.799072265625, 5.18505859375, 5.571044921875, 5.95703125, 6.343017578125, 6.72900390625, 7.114990234375, 7.5009765625, 7.886962890625, 8.27294921875, 8.658935546875, 9.044921875, 9.430908203125, 9.81689453125, 10.202880859375, 10.5888671875, 10.974853515625, 11.36083984375, 11.746826171875, 12.1328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 6.0, 8.0, 7.0, 10.0, 9.0, 17.0, 16.0, 18.0, 18.0, 19.0, 28.0, 24.0, 21.0, 35.0, 40.0, 30.0, 35.0, 27.0, 39.0, 38.0, 46.0, 43.0, 35.0, 37.0, 41.0, 43.0, 39.0, 32.0, 31.0, 28.0, 18.0, 25.0, 18.0, 26.0, 22.0, 12.0, 12.0, 15.0, 6.0, 1.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-25.224323272705078, -24.37598991394043, -23.527658462524414, -22.679325103759766, -21.83099365234375, -20.9826602935791, -20.134326934814453, -19.285995483398438, -18.43766212463379, -17.58932876586914, -16.740997314453125, -15.892663955688477, -15.044331550598145, -14.195999145507812, -13.34766674041748, -12.499334335327148, -11.651001930236816, -10.802669525146484, -9.954337120056152, -9.10600471496582, -8.257671356201172, -7.40933895111084, -6.561006546020508, -5.712673664093018, -4.8643412590026855, -4.0160088539123535, -3.1676759719848633, -2.3193435668945312, -1.4710109233856201, -0.622678279876709, 0.22565412521362305, 1.0739870071411133, 1.9223194122314453, 2.7706520557403564, 3.6189846992492676, 4.4673171043396, 5.31564998626709, 6.163982391357422, 7.012314796447754, 7.860647678375244, 8.708980560302734, 9.557312965393066, 10.405645370483398, 11.253978729248047, 12.102311134338379, 12.950643539428711, 13.798975944519043, 14.647308349609375, 15.495640754699707, 16.34397315979004, 17.192306518554688, 18.040637969970703, 18.88897132873535, 19.7373046875, 20.585636138916016, 21.433969497680664, 22.28230094909668, 23.130634307861328, 23.978965759277344, 24.827299118041992, 25.675630569458008, 26.523963928222656, 27.372295379638672, 28.22062873840332, 29.06896209716797]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 4.0, 6.0, 5.0, 8.0, 6.0, 15.0, 16.0, 16.0, 13.0, 20.0, 26.0, 23.0, 22.0, 32.0, 33.0, 31.0, 26.0, 45.0, 42.0, 42.0, 33.0, 42.0, 31.0, 44.0, 39.0, 34.0, 26.0, 31.0, 31.0, 25.0, 30.0, 32.0, 27.0, 24.0, 17.0, 17.0, 8.0, 14.0, 13.0, 9.0, 3.0, 6.0, 7.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-26.389484405517578, -25.511083602905273, -24.632680892944336, -23.75428009033203, -22.875879287719727, -21.997478485107422, -21.119075775146484, -20.24067497253418, -19.362274169921875, -18.48387336730957, -17.605470657348633, -16.727069854736328, -15.848669052124023, -14.970267295837402, -14.091865539550781, -13.213464736938477, -12.335062026977539, -11.456660270690918, -10.578259468078613, -9.699857711791992, -8.821456909179688, -7.943055152893066, -7.064653396606445, -6.186252117156982, -5.3078508377075195, -4.429449558258057, -3.5510480403900146, -2.6726465225219727, -1.7942452430725098, -0.9158439636230469, -0.03744220733642578, 0.8409590721130371, 1.7193622589111328, 2.5977635383605957, 3.4761650562286377, 4.35456657409668, 5.232967853546143, 6.1113691329956055, 6.989770889282227, 7.8681721687316895, 8.746573448181152, 9.624975204467773, 10.503376007080078, 11.3817777633667, 12.26017951965332, 13.138580322265625, 14.016982078552246, 14.895383834838867, 15.773784637451172, 16.652185440063477, 17.530588150024414, 18.40898895263672, 19.287389755249023, 20.165790557861328, 21.044193267822266, 21.92259407043457, 22.800994873046875, 23.67939567565918, 24.557798385620117, 25.436199188232422, 26.314599990844727, 27.19300079345703, 28.07140350341797, 28.949804306030273, 29.82820701599121]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 5.0, 2.0, 11.0, 12.0, 23.0, 25.0, 52.0, 73.0, 112.0, 179.0, 261.0, 450.0, 624.0, 1003.0, 1581.0, 2331.0, 3468.0, 5092.0, 7598.0, 11000.0, 15430.0, 21885.0, 29690.0, 39283.0, 50577.0, 62543.0, 74154.0, 83168.0, 89418.0, 90533.0, 87238.0, 78929.0, 68994.0, 56863.0, 45537.0, 34686.0, 25790.0, 18474.0, 13426.0, 9156.0, 6298.0, 4253.0, 2833.0, 1920.0, 1298.0, 804.0, 520.0, 354.0, 230.0, 138.0, 92.0, 56.0, 25.0, 26.0, 16.0, 10.0, 8.0, 5.0, 1.0, 2.0], "bins": [-12.21875, -11.8514404296875, -11.484130859375, -11.1168212890625, -10.74951171875, -10.3822021484375, -10.014892578125, -9.6475830078125, -9.2802734375, -8.9129638671875, -8.545654296875, -8.1783447265625, -7.81103515625, -7.4437255859375, -7.076416015625, -6.7091064453125, -6.341796875, -5.9744873046875, -5.607177734375, -5.2398681640625, -4.87255859375, -4.5052490234375, -4.137939453125, -3.7706298828125, -3.4033203125, -3.0360107421875, -2.668701171875, -2.3013916015625, -1.93408203125, -1.5667724609375, -1.199462890625, -0.8321533203125, -0.46484375, -0.0975341796875, 0.269775390625, 0.6370849609375, 1.00439453125, 1.3717041015625, 1.739013671875, 2.1063232421875, 2.4736328125, 2.8409423828125, 3.208251953125, 3.5755615234375, 3.94287109375, 4.3101806640625, 4.677490234375, 5.0447998046875, 5.412109375, 5.7794189453125, 6.146728515625, 6.5140380859375, 6.88134765625, 7.2486572265625, 7.615966796875, 7.9832763671875, 8.3505859375, 8.7178955078125, 9.085205078125, 9.4525146484375, 9.81982421875, 10.1871337890625, 10.554443359375, 10.9217529296875, 11.2890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 2.0, 10.0, 3.0, 5.0, 6.0, 6.0, 8.0, 17.0, 14.0, 16.0, 14.0, 22.0, 22.0, 25.0, 26.0, 33.0, 28.0, 33.0, 33.0, 41.0, 40.0, 39.0, 41.0, 38.0, 35.0, 46.0, 36.0, 29.0, 28.0, 36.0, 28.0, 23.0, 33.0, 27.0, 32.0, 20.0, 17.0, 16.0, 6.0, 14.0, 13.0, 7.0, 3.0, 8.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-26.234375, -25.345703125, -24.45703125, -23.568359375, -22.6796875, -21.791015625, -20.90234375, -20.013671875, -19.125, -18.236328125, -17.34765625, -16.458984375, -15.5703125, -14.681640625, -13.79296875, -12.904296875, -12.015625, -11.126953125, -10.23828125, -9.349609375, -8.4609375, -7.572265625, -6.68359375, -5.794921875, -4.90625, -4.017578125, -3.12890625, -2.240234375, -1.3515625, -0.462890625, 0.42578125, 1.314453125, 2.203125, 3.091796875, 3.98046875, 4.869140625, 5.7578125, 6.646484375, 7.53515625, 8.423828125, 9.3125, 10.201171875, 11.08984375, 11.978515625, 12.8671875, 13.755859375, 14.64453125, 15.533203125, 16.421875, 17.310546875, 18.19921875, 19.087890625, 19.9765625, 20.865234375, 21.75390625, 22.642578125, 23.53125, 24.419921875, 25.30859375, 26.197265625, 27.0859375, 27.974609375, 28.86328125, 29.751953125, 30.640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 7.0, 7.0, 9.0, 20.0, 24.0, 36.0, 51.0, 69.0, 91.0, 158.0, 208.0, 336.0, 485.0, 725.0, 998.0, 1580.0, 2377.0, 3426.0, 4775.0, 7047.0, 10258.0, 15028.0, 23004.0, 49735.0, 724288.0, 124549.0, 26271.0, 16816.0, 11383.0, 7787.0, 5226.0, 3699.0, 2592.0, 1755.0, 1181.0, 856.0, 558.0, 366.0, 249.0, 158.0, 113.0, 82.0, 65.0, 27.0, 33.0, 16.0, 15.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-29.53125, -28.67919921875, -27.8271484375, -26.97509765625, -26.123046875, -25.27099609375, -24.4189453125, -23.56689453125, -22.71484375, -21.86279296875, -21.0107421875, -20.15869140625, -19.306640625, -18.45458984375, -17.6025390625, -16.75048828125, -15.8984375, -15.04638671875, -14.1943359375, -13.34228515625, -12.490234375, -11.63818359375, -10.7861328125, -9.93408203125, -9.08203125, -8.22998046875, -7.3779296875, -6.52587890625, -5.673828125, -4.82177734375, -3.9697265625, -3.11767578125, -2.265625, -1.41357421875, -0.5615234375, 0.29052734375, 1.142578125, 1.99462890625, 2.8466796875, 3.69873046875, 4.55078125, 5.40283203125, 6.2548828125, 7.10693359375, 7.958984375, 8.81103515625, 9.6630859375, 10.51513671875, 11.3671875, 12.21923828125, 13.0712890625, 13.92333984375, 14.775390625, 15.62744140625, 16.4794921875, 17.33154296875, 18.18359375, 19.03564453125, 19.8876953125, 20.73974609375, 21.591796875, 22.44384765625, 23.2958984375, 24.14794921875, 25.0]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 5.0, 0.0, 0.0, 8.0, 9.0, 11.0, 15.0, 14.0, 25.0, 16.0, 25.0, 20.0, 28.0, 28.0, 29.0, 35.0, 35.0, 37.0, 26.0, 40.0, 46.0, 38.0, 46.0, 44.0, 35.0, 39.0, 43.0, 33.0, 32.0, 35.0, 35.0, 36.0, 22.0, 22.0, 12.0, 17.0, 11.0, 9.0, 5.0, 8.0, 4.0, 3.0, 5.0, 6.0, 5.0, 1.0, 5.0, 0.0, 2.0], "bins": [-27.828125, -27.073486328125, -26.31884765625, -25.564208984375, -24.8095703125, -24.054931640625, -23.30029296875, -22.545654296875, -21.791015625, -21.036376953125, -20.28173828125, -19.527099609375, -18.7724609375, -18.017822265625, -17.26318359375, -16.508544921875, -15.75390625, -14.999267578125, -14.24462890625, -13.489990234375, -12.7353515625, -11.980712890625, -11.22607421875, -10.471435546875, -9.716796875, -8.962158203125, -8.20751953125, -7.452880859375, -6.6982421875, -5.943603515625, -5.18896484375, -4.434326171875, -3.6796875, -2.925048828125, -2.17041015625, -1.415771484375, -0.6611328125, 0.093505859375, 0.84814453125, 1.602783203125, 2.357421875, 3.112060546875, 3.86669921875, 4.621337890625, 5.3759765625, 6.130615234375, 6.88525390625, 7.639892578125, 8.39453125, 9.149169921875, 9.90380859375, 10.658447265625, 11.4130859375, 12.167724609375, 12.92236328125, 13.677001953125, 14.431640625, 15.186279296875, 15.94091796875, 16.695556640625, 17.4501953125, 18.204833984375, 18.95947265625, 19.714111328125, 20.46875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 8.0, 6.0, 4.0, 6.0, 17.0, 31.0, 47.0, 58.0, 107.0, 195.0, 342.0, 683.0, 1516.0, 3250.0, 7381.0, 18714.0, 75678.0, 873453.0, 42864.0, 13726.0, 5560.0, 2514.0, 1123.0, 559.0, 267.0, 168.0, 82.0, 67.0, 33.0, 40.0, 11.0, 18.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.015625, -7.79510498046875, -7.5745849609375, -7.35406494140625, -7.133544921875, -6.91302490234375, -6.6925048828125, -6.47198486328125, -6.25146484375, -6.03094482421875, -5.8104248046875, -5.58990478515625, -5.369384765625, -5.14886474609375, -4.9283447265625, -4.70782470703125, -4.4873046875, -4.26678466796875, -4.0462646484375, -3.82574462890625, -3.605224609375, -3.38470458984375, -3.1641845703125, -2.94366455078125, -2.72314453125, -2.50262451171875, -2.2821044921875, -2.06158447265625, -1.841064453125, -1.62054443359375, -1.4000244140625, -1.17950439453125, -0.958984375, -0.73846435546875, -0.5179443359375, -0.29742431640625, -0.076904296875, 0.14361572265625, 0.3641357421875, 0.58465576171875, 0.80517578125, 1.02569580078125, 1.2462158203125, 1.46673583984375, 1.687255859375, 1.90777587890625, 2.1282958984375, 2.34881591796875, 2.5693359375, 2.78985595703125, 3.0103759765625, 3.23089599609375, 3.451416015625, 3.67193603515625, 3.8924560546875, 4.11297607421875, 4.33349609375, 4.55401611328125, 4.7745361328125, 4.99505615234375, 5.215576171875, 5.43609619140625, 5.6566162109375, 5.87713623046875, 6.09765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 9.0, 16.0, 26.0, 54.0, 103.0, 182.0, 192.0, 185.0, 115.0, 67.0, 27.0, 11.0, 10.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003265380859375, -0.0031554102897644043, -0.0030454397201538086, -0.002935469150543213, -0.002825498580932617, -0.0027155280113220215, -0.0026055574417114258, -0.00249558687210083, -0.0023856163024902344, -0.0022756457328796387, -0.002165675163269043, -0.0020557045936584473, -0.0019457340240478516, -0.0018357634544372559, -0.0017257928848266602, -0.0016158223152160645, -0.0015058517456054688, -0.001395881175994873, -0.0012859106063842773, -0.0011759400367736816, -0.001065969467163086, -0.0009559988975524902, -0.0008460283279418945, -0.0007360577583312988, -0.0006260871887207031, -0.0005161166191101074, -0.0004061460494995117, -0.000296175479888916, -0.0001862049102783203, -7.623434066772461e-05, 3.3736228942871094e-05, 0.0001437067985534668, 0.0002536773681640625, 0.0003636479377746582, 0.0004736185073852539, 0.0005835890769958496, 0.0006935596466064453, 0.000803530216217041, 0.0009135007858276367, 0.0010234713554382324, 0.0011334419250488281, 0.0012434124946594238, 0.0013533830642700195, 0.0014633536338806152, 0.001573324203491211, 0.0016832947731018066, 0.0017932653427124023, 0.001903235912322998, 0.0020132064819335938, 0.0021231770515441895, 0.002233147621154785, 0.002343118190765381, 0.0024530887603759766, 0.0025630593299865723, 0.002673029899597168, 0.0027830004692077637, 0.0028929710388183594, 0.003002941608428955, 0.0031129121780395508, 0.0032228827476501465, 0.003332853317260742, 0.003442823886871338, 0.0035527944564819336, 0.0036627650260925293, 0.003772735595703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 12.0, 19.0, 25.0, 31.0, 35.0, 49.0, 66.0, 107.0, 135.0, 201.0, 292.0, 453.0, 641.0, 998.0, 1517.0, 2306.0, 3825.0, 6159.0, 10429.0, 17507.0, 29016.0, 47899.0, 75097.0, 113992.0, 149515.0, 163497.0, 142487.0, 104980.0, 68319.0, 42849.0, 25924.0, 15658.0, 9327.0, 5509.0, 3429.0, 2152.0, 1313.0, 808.0, 616.0, 402.0, 286.0, 185.0, 151.0, 103.0, 62.0, 51.0, 35.0, 21.0, 19.0, 17.0, 9.0, 3.0, 13.0, 5.0, 3.0], "bins": [-1.455078125, -1.4127655029296875, -1.370452880859375, -1.3281402587890625, -1.28582763671875, -1.2435150146484375, -1.201202392578125, -1.1588897705078125, -1.1165771484375, -1.0742645263671875, -1.031951904296875, -0.9896392822265625, -0.94732666015625, -0.9050140380859375, -0.862701416015625, -0.8203887939453125, -0.778076171875, -0.7357635498046875, -0.693450927734375, -0.6511383056640625, -0.60882568359375, -0.5665130615234375, -0.524200439453125, -0.4818878173828125, -0.4395751953125, -0.3972625732421875, -0.354949951171875, -0.3126373291015625, -0.27032470703125, -0.2280120849609375, -0.185699462890625, -0.1433868408203125, -0.10107421875, -0.0587615966796875, -0.016448974609375, 0.0258636474609375, 0.06817626953125, 0.1104888916015625, 0.152801513671875, 0.1951141357421875, 0.2374267578125, 0.2797393798828125, 0.322052001953125, 0.3643646240234375, 0.40667724609375, 0.4489898681640625, 0.491302490234375, 0.5336151123046875, 0.575927734375, 0.6182403564453125, 0.660552978515625, 0.7028656005859375, 0.74517822265625, 0.7874908447265625, 0.829803466796875, 0.8721160888671875, 0.9144287109375, 0.9567413330078125, 0.999053955078125, 1.0413665771484375, 1.08367919921875, 1.1259918212890625, 1.168304443359375, 1.2106170654296875, 1.2529296875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 7.0, 6.0, 2.0, 5.0, 9.0, 9.0, 20.0, 16.0, 23.0, 26.0, 24.0, 31.0, 31.0, 55.0, 75.0, 70.0, 84.0, 66.0, 60.0, 60.0, 42.0, 41.0, 41.0, 29.0, 18.0, 25.0, 22.0, 16.0, 8.0, 18.0, 6.0, 11.0, 12.0, 8.0, 5.0, 5.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.53271484375, -0.5171966552734375, -0.501678466796875, -0.4861602783203125, -0.47064208984375, -0.4551239013671875, -0.439605712890625, -0.4240875244140625, -0.4085693359375, -0.3930511474609375, -0.377532958984375, -0.3620147705078125, -0.34649658203125, -0.3309783935546875, -0.315460205078125, -0.2999420166015625, -0.284423828125, -0.2689056396484375, -0.253387451171875, -0.2378692626953125, -0.22235107421875, -0.2068328857421875, -0.191314697265625, -0.1757965087890625, -0.1602783203125, -0.1447601318359375, -0.129241943359375, -0.1137237548828125, -0.09820556640625, -0.0826873779296875, -0.067169189453125, -0.0516510009765625, -0.0361328125, -0.0206146240234375, -0.005096435546875, 0.0104217529296875, 0.02593994140625, 0.0414581298828125, 0.056976318359375, 0.0724945068359375, 0.0880126953125, 0.1035308837890625, 0.119049072265625, 0.1345672607421875, 0.15008544921875, 0.1656036376953125, 0.181121826171875, 0.1966400146484375, 0.212158203125, 0.2276763916015625, 0.243194580078125, 0.2587127685546875, 0.27423095703125, 0.2897491455078125, 0.305267333984375, 0.3207855224609375, 0.3363037109375, 0.3518218994140625, 0.367340087890625, 0.3828582763671875, 0.39837646484375, 0.4138946533203125, 0.429412841796875, 0.4449310302734375, 0.46044921875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 6.0, 3.0, 2.0, 2.0, 6.0, 6.0, 6.0, 9.0, 12.0, 7.0, 10.0, 17.0, 13.0, 20.0, 27.0, 21.0, 33.0, 21.0, 30.0, 37.0, 32.0, 37.0, 38.0, 37.0, 34.0, 42.0, 44.0, 40.0, 37.0, 42.0, 37.0, 47.0, 24.0, 32.0, 26.0, 30.0, 25.0, 27.0, 13.0, 14.0, 12.0, 16.0, 6.0, 13.0, 8.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.963294982910156, -24.102270126342773, -23.24124526977539, -22.380220413208008, -21.519195556640625, -20.658170700073242, -19.79714584350586, -18.93612289428711, -18.075096130371094, -17.21407127380371, -16.353046417236328, -15.492021560668945, -14.630996704101562, -13.76997184753418, -12.908947944641113, -12.04792308807373, -11.186899185180664, -10.325874328613281, -9.464849472045898, -8.603824615478516, -7.742800235748291, -6.881775379180908, -6.020750999450684, -5.159726142883301, -4.298701286315918, -3.437676429748535, -2.5766518115997314, -1.7156271934509277, -0.8546023368835449, 0.006422519683837891, 0.8674468994140625, 1.7284717559814453, 2.5894947052001953, 3.450519561767578, 4.311544418334961, 5.1725687980651855, 6.033593654632568, 6.894618511199951, 7.755642890930176, 8.616667747497559, 9.477692604064941, 10.338717460632324, 11.199742317199707, 12.060766220092773, 12.921791076660156, 13.782815933227539, 14.643840789794922, 15.504865646362305, 16.365890502929688, 17.22691535949707, 18.087940216064453, 18.948965072631836, 19.80998992919922, 20.6710147857666, 21.532039642333984, 22.393062591552734, 23.25408935546875, 24.115114212036133, 24.976139068603516, 25.8371639251709, 26.69818878173828, 27.559213638305664, 28.420238494873047, 29.281261444091797, 30.14228630065918]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 5.0, 7.0, 6.0, 6.0, 3.0, 10.0, 12.0, 14.0, 18.0, 13.0, 19.0, 24.0, 27.0, 19.0, 36.0, 28.0, 33.0, 27.0, 46.0, 42.0, 34.0, 43.0, 40.0, 37.0, 39.0, 39.0, 31.0, 32.0, 33.0, 31.0, 28.0, 25.0, 29.0, 32.0, 23.0, 15.0, 17.0, 8.0, 12.0, 15.0, 9.0, 3.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-26.57605743408203, -25.684240341186523, -24.792423248291016, -23.900606155395508, -23.0087890625, -22.116971969604492, -21.225154876708984, -20.333337783813477, -19.44152069091797, -18.54970359802246, -17.657886505126953, -16.766069412231445, -15.874252319335938, -14.98243522644043, -14.090618133544922, -13.198801040649414, -12.306983947753906, -11.415166854858398, -10.52334976196289, -9.631532669067383, -8.739715576171875, -7.847898483276367, -6.956081390380859, -6.064264297485352, -5.172447204589844, -4.280630111694336, -3.388813018798828, -2.4969959259033203, -1.6051788330078125, -0.7133617401123047, 0.17845535278320312, 1.070272445678711, 1.9620895385742188, 2.8539066314697266, 3.7457237243652344, 4.637540817260742, 5.52935791015625, 6.421175003051758, 7.312992095947266, 8.204809188842773, 9.096626281738281, 9.988443374633789, 10.880260467529297, 11.772077560424805, 12.663894653320312, 13.55571174621582, 14.447528839111328, 15.339345932006836, 16.231163024902344, 17.12298011779785, 18.01479721069336, 18.906614303588867, 19.798431396484375, 20.690248489379883, 21.58206558227539, 22.4738826751709, 23.365699768066406, 24.257516860961914, 25.149333953857422, 26.04115104675293, 26.932968139648438, 27.824785232543945, 28.716602325439453, 29.60841941833496, 30.50023651123047]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 6.0, 9.0, 16.0, 33.0, 33.0, 52.0, 71.0, 129.0, 227.0, 370.0, 627.0, 1079.0, 1779.0, 3070.0, 5161.0, 8674.0, 14130.0, 22316.0, 34371.0, 51025.0, 71536.0, 93356.0, 111857.0, 123451.0, 121004.0, 106865.0, 86716.0, 65296.0, 45232.0, 30193.0, 19361.0, 12114.0, 7407.0, 4511.0, 2633.0, 1525.0, 893.0, 551.0, 346.0, 205.0, 113.0, 78.0, 47.0, 35.0, 21.0, 15.0, 8.0, 4.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.640625, -19.871826171875, -19.10302734375, -18.334228515625, -17.5654296875, -16.796630859375, -16.02783203125, -15.259033203125, -14.490234375, -13.721435546875, -12.95263671875, -12.183837890625, -11.4150390625, -10.646240234375, -9.87744140625, -9.108642578125, -8.33984375, -7.571044921875, -6.80224609375, -6.033447265625, -5.2646484375, -4.495849609375, -3.72705078125, -2.958251953125, -2.189453125, -1.420654296875, -0.65185546875, 0.116943359375, 0.8857421875, 1.654541015625, 2.42333984375, 3.192138671875, 3.9609375, 4.729736328125, 5.49853515625, 6.267333984375, 7.0361328125, 7.804931640625, 8.57373046875, 9.342529296875, 10.111328125, 10.880126953125, 11.64892578125, 12.417724609375, 13.1865234375, 13.955322265625, 14.72412109375, 15.492919921875, 16.26171875, 17.030517578125, 17.79931640625, 18.568115234375, 19.3369140625, 20.105712890625, 20.87451171875, 21.643310546875, 22.412109375, 23.180908203125, 23.94970703125, 24.718505859375, 25.4873046875, 26.256103515625, 27.02490234375, 27.793701171875, 28.5625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 4.0, 9.0, 6.0, 3.0, 7.0, 6.0, 16.0, 15.0, 16.0, 17.0, 17.0, 25.0, 30.0, 20.0, 26.0, 32.0, 35.0, 26.0, 47.0, 41.0, 31.0, 44.0, 41.0, 44.0, 33.0, 45.0, 30.0, 25.0, 35.0, 24.0, 34.0, 31.0, 31.0, 25.0, 23.0, 18.0, 15.0, 5.0, 14.0, 13.0, 7.0, 8.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0], "bins": [-25.5625, -24.72900390625, -23.8955078125, -23.06201171875, -22.228515625, -21.39501953125, -20.5615234375, -19.72802734375, -18.89453125, -18.06103515625, -17.2275390625, -16.39404296875, -15.560546875, -14.72705078125, -13.8935546875, -13.06005859375, -12.2265625, -11.39306640625, -10.5595703125, -9.72607421875, -8.892578125, -8.05908203125, -7.2255859375, -6.39208984375, -5.55859375, -4.72509765625, -3.8916015625, -3.05810546875, -2.224609375, -1.39111328125, -0.5576171875, 0.27587890625, 1.109375, 1.94287109375, 2.7763671875, 3.60986328125, 4.443359375, 5.27685546875, 6.1103515625, 6.94384765625, 7.77734375, 8.61083984375, 9.4443359375, 10.27783203125, 11.111328125, 11.94482421875, 12.7783203125, 13.61181640625, 14.4453125, 15.27880859375, 16.1123046875, 16.94580078125, 17.779296875, 18.61279296875, 19.4462890625, 20.27978515625, 21.11328125, 21.94677734375, 22.7802734375, 23.61376953125, 24.447265625, 25.28076171875, 26.1142578125, 26.94775390625, 27.78125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 8.0, 7.0, 8.0, 21.0, 24.0, 40.0, 51.0, 98.0, 173.0, 303.0, 564.0, 1047.0, 1874.0, 3359.0, 6462.0, 11597.0, 21770.0, 38322.0, 64255.0, 98621.0, 134199.0, 156467.0, 153735.0, 127637.0, 91900.0, 58634.0, 34844.0, 19350.0, 10622.0, 5699.0, 3016.0, 1651.0, 943.0, 519.0, 298.0, 177.0, 107.0, 52.0, 34.0, 28.0, 19.0, 8.0, 4.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.8125, -31.7841796875, -30.755859375, -29.7275390625, -28.69921875, -27.6708984375, -26.642578125, -25.6142578125, -24.5859375, -23.5576171875, -22.529296875, -21.5009765625, -20.47265625, -19.4443359375, -18.416015625, -17.3876953125, -16.359375, -15.3310546875, -14.302734375, -13.2744140625, -12.24609375, -11.2177734375, -10.189453125, -9.1611328125, -8.1328125, -7.1044921875, -6.076171875, -5.0478515625, -4.01953125, -2.9912109375, -1.962890625, -0.9345703125, 0.09375, 1.1220703125, 2.150390625, 3.1787109375, 4.20703125, 5.2353515625, 6.263671875, 7.2919921875, 8.3203125, 9.3486328125, 10.376953125, 11.4052734375, 12.43359375, 13.4619140625, 14.490234375, 15.5185546875, 16.546875, 17.5751953125, 18.603515625, 19.6318359375, 20.66015625, 21.6884765625, 22.716796875, 23.7451171875, 24.7734375, 25.8017578125, 26.830078125, 27.8583984375, 28.88671875, 29.9150390625, 30.943359375, 31.9716796875, 33.0]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 8.0, 5.0, 11.0, 22.0, 17.0, 19.0, 22.0, 27.0, 20.0, 27.0, 25.0, 42.0, 38.0, 34.0, 45.0, 37.0, 49.0, 54.0, 42.0, 50.0, 46.0, 37.0, 40.0, 42.0, 38.0, 34.0, 16.0, 31.0, 20.0, 20.0, 13.0, 8.0, 15.0, 8.0, 9.0, 9.0, 3.0, 1.0, 5.0, 4.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.28125, -17.653564453125, -17.02587890625, -16.398193359375, -15.7705078125, -15.142822265625, -14.51513671875, -13.887451171875, -13.259765625, -12.632080078125, -12.00439453125, -11.376708984375, -10.7490234375, -10.121337890625, -9.49365234375, -8.865966796875, -8.23828125, -7.610595703125, -6.98291015625, -6.355224609375, -5.7275390625, -5.099853515625, -4.47216796875, -3.844482421875, -3.216796875, -2.589111328125, -1.96142578125, -1.333740234375, -0.7060546875, -0.078369140625, 0.54931640625, 1.177001953125, 1.8046875, 2.432373046875, 3.06005859375, 3.687744140625, 4.3154296875, 4.943115234375, 5.57080078125, 6.198486328125, 6.826171875, 7.453857421875, 8.08154296875, 8.709228515625, 9.3369140625, 9.964599609375, 10.59228515625, 11.219970703125, 11.84765625, 12.475341796875, 13.10302734375, 13.730712890625, 14.3583984375, 14.986083984375, 15.61376953125, 16.241455078125, 16.869140625, 17.496826171875, 18.12451171875, 18.752197265625, 19.3798828125, 20.007568359375, 20.63525390625, 21.262939453125, 21.890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 4.0, 3.0, 5.0, 8.0, 16.0, 20.0, 36.0, 40.0, 75.0, 112.0, 174.0, 298.0, 608.0, 1070.0, 2254.0, 4961.0, 11598.0, 29128.0, 75173.0, 179362.0, 287956.0, 247854.0, 124961.0, 49158.0, 19059.0, 7741.0, 3381.0, 1592.0, 778.0, 454.0, 253.0, 151.0, 105.0, 53.0, 32.0, 26.0, 17.0, 13.0, 9.0, 9.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.5, -22.782958984375, -22.06591796875, -21.348876953125, -20.6318359375, -19.914794921875, -19.19775390625, -18.480712890625, -17.763671875, -17.046630859375, -16.32958984375, -15.612548828125, -14.8955078125, -14.178466796875, -13.46142578125, -12.744384765625, -12.02734375, -11.310302734375, -10.59326171875, -9.876220703125, -9.1591796875, -8.442138671875, -7.72509765625, -7.008056640625, -6.291015625, -5.573974609375, -4.85693359375, -4.139892578125, -3.4228515625, -2.705810546875, -1.98876953125, -1.271728515625, -0.5546875, 0.162353515625, 0.87939453125, 1.596435546875, 2.3134765625, 3.030517578125, 3.74755859375, 4.464599609375, 5.181640625, 5.898681640625, 6.61572265625, 7.332763671875, 8.0498046875, 8.766845703125, 9.48388671875, 10.200927734375, 10.91796875, 11.635009765625, 12.35205078125, 13.069091796875, 13.7861328125, 14.503173828125, 15.22021484375, 15.937255859375, 16.654296875, 17.371337890625, 18.08837890625, 18.805419921875, 19.5224609375, 20.239501953125, 20.95654296875, 21.673583984375, 22.390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 5.0, 4.0, 5.0, 5.0, 6.0, 13.0, 9.0, 22.0, 19.0, 24.0, 28.0, 38.0, 34.0, 27.0, 40.0, 46.0, 39.0, 39.0, 58.0, 47.0, 46.0, 45.0, 45.0, 49.0, 36.0, 36.0, 30.0, 25.0, 23.0, 25.0, 29.0, 19.0, 14.0, 10.0, 10.0, 7.0, 6.0, 6.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.001071929931640625, -0.0010370910167694092, -0.0010022521018981934, -0.0009674131870269775, -0.0009325742721557617, -0.0008977353572845459, -0.0008628964424133301, -0.0008280575275421143, -0.0007932186126708984, -0.0007583796977996826, -0.0007235407829284668, -0.000688701868057251, -0.0006538629531860352, -0.0006190240383148193, -0.0005841851234436035, -0.0005493462085723877, -0.0005145072937011719, -0.00047966837882995605, -0.00044482946395874023, -0.0004099905490875244, -0.0003751516342163086, -0.0003403127193450928, -0.00030547380447387695, -0.00027063488960266113, -0.0002357959747314453, -0.0002009570598602295, -0.00016611814498901367, -0.00013127923011779785, -9.644031524658203e-05, -6.160140037536621e-05, -2.676248550415039e-05, 8.07642936706543e-06, 4.291534423828125e-05, 7.775425910949707e-05, 0.00011259317398071289, 0.0001474320888519287, 0.00018227100372314453, 0.00021710991859436035, 0.00025194883346557617, 0.000286787748336792, 0.0003216266632080078, 0.00035646557807922363, 0.00039130449295043945, 0.0004261434078216553, 0.0004609823226928711, 0.0004958212375640869, 0.0005306601524353027, 0.0005654990673065186, 0.0006003379821777344, 0.0006351768970489502, 0.000670015811920166, 0.0007048547267913818, 0.0007396936416625977, 0.0007745325565338135, 0.0008093714714050293, 0.0008442103862762451, 0.0008790493011474609, 0.0009138882160186768, 0.0009487271308898926, 0.0009835660457611084, 0.0010184049606323242, 0.00105324387550354, 0.0010880827903747559, 0.0011229217052459717, 0.0011577606201171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 12.0, 17.0, 22.0, 36.0, 48.0, 58.0, 107.0, 139.0, 207.0, 266.0, 441.0, 642.0, 859.0, 1271.0, 1948.0, 3043.0, 4371.0, 6954.0, 10436.0, 16362.0, 24804.0, 37423.0, 55015.0, 76248.0, 99323.0, 118410.0, 125708.0, 119251.0, 100804.0, 77365.0, 55533.0, 37996.0, 25242.0, 16731.0, 10713.0, 6936.0, 4640.0, 2958.0, 2013.0, 1389.0, 906.0, 613.0, 408.0, 301.0, 180.0, 133.0, 87.0, 68.0, 41.0, 27.0, 19.0, 15.0, 13.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.2734375, -8.9696044921875, -8.665771484375, -8.3619384765625, -8.05810546875, -7.7542724609375, -7.450439453125, -7.1466064453125, -6.8427734375, -6.5389404296875, -6.235107421875, -5.9312744140625, -5.62744140625, -5.3236083984375, -5.019775390625, -4.7159423828125, -4.412109375, -4.1082763671875, -3.804443359375, -3.5006103515625, -3.19677734375, -2.8929443359375, -2.589111328125, -2.2852783203125, -1.9814453125, -1.6776123046875, -1.373779296875, -1.0699462890625, -0.76611328125, -0.4622802734375, -0.158447265625, 0.1453857421875, 0.44921875, 0.7530517578125, 1.056884765625, 1.3607177734375, 1.66455078125, 1.9683837890625, 2.272216796875, 2.5760498046875, 2.8798828125, 3.1837158203125, 3.487548828125, 3.7913818359375, 4.09521484375, 4.3990478515625, 4.702880859375, 5.0067138671875, 5.310546875, 5.6143798828125, 5.918212890625, 6.2220458984375, 6.52587890625, 6.8297119140625, 7.133544921875, 7.4373779296875, 7.7412109375, 8.0450439453125, 8.348876953125, 8.6527099609375, 8.95654296875, 9.2603759765625, 9.564208984375, 9.8680419921875, 10.171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 1.0, 4.0, 10.0, 11.0, 11.0, 7.0, 22.0, 27.0, 20.0, 23.0, 22.0, 35.0, 35.0, 47.0, 47.0, 56.0, 65.0, 58.0, 44.0, 63.0, 50.0, 55.0, 48.0, 30.0, 47.0, 27.0, 17.0, 22.0, 18.0, 13.0, 15.0, 4.0, 9.0, 3.0, 10.0, 2.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.10546875, -4.94921875, -4.79296875, -4.63671875, -4.48046875, -4.32421875, -4.16796875, -4.01171875, -3.85546875, -3.69921875, -3.54296875, -3.38671875, -3.23046875, -3.07421875, -2.91796875, -2.76171875, -2.60546875, -2.44921875, -2.29296875, -2.13671875, -1.98046875, -1.82421875, -1.66796875, -1.51171875, -1.35546875, -1.19921875, -1.04296875, -0.88671875, -0.73046875, -0.57421875, -0.41796875, -0.26171875, -0.10546875, 0.05078125, 0.20703125, 0.36328125, 0.51953125, 0.67578125, 0.83203125, 0.98828125, 1.14453125, 1.30078125, 1.45703125, 1.61328125, 1.76953125, 1.92578125, 2.08203125, 2.23828125, 2.39453125, 2.55078125, 2.70703125, 2.86328125, 3.01953125, 3.17578125, 3.33203125, 3.48828125, 3.64453125, 3.80078125, 3.95703125, 4.11328125, 4.26953125, 4.42578125, 4.58203125, 4.73828125, 4.89453125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 10.0, 10.0, 6.0, 10.0, 15.0, 13.0, 22.0, 16.0, 23.0, 33.0, 37.0, 21.0, 29.0, 39.0, 34.0, 41.0, 30.0, 37.0, 39.0, 43.0, 44.0, 37.0, 32.0, 32.0, 40.0, 26.0, 30.0, 35.0, 38.0, 24.0, 17.0, 25.0, 16.0, 17.0, 15.0, 7.0, 8.0, 5.0, 2.0, 8.0, 6.0, 5.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.53798484802246, -23.73561668395996, -22.93324851989746, -22.130878448486328, -21.328510284423828, -20.526142120361328, -19.723773956298828, -18.921405792236328, -18.119037628173828, -17.316669464111328, -16.514301300048828, -15.711932182312012, -14.909563064575195, -14.107194900512695, -13.304826736450195, -12.502458572387695, -11.700088500976562, -10.897720336914062, -10.095351219177246, -9.292983055114746, -8.49061393737793, -7.68824577331543, -6.88587760925293, -6.0835089683532715, -5.281140327453613, -4.478771686553955, -3.676403284072876, -2.874034881591797, -2.0716662406921387, -1.2692975997924805, -0.46692943572998047, 0.33543920516967773, 1.1378097534179688, 1.9401782751083374, 2.742546796798706, 3.544915199279785, 4.347283840179443, 5.149652481079102, 5.952020645141602, 6.75438928604126, 7.556757926940918, 8.359126091003418, 9.161495208740234, 9.963863372802734, 10.766231536865234, 11.56860065460205, 12.37096881866455, 13.173337936401367, 13.975706100463867, 14.778074264526367, 15.580443382263184, 16.3828125, 17.1851806640625, 17.987548828125, 18.7899169921875, 19.59228515625, 20.3946533203125, 21.197021484375, 21.9993896484375, 22.8017578125, 23.604127883911133, 24.406496047973633, 25.208864212036133, 26.011232376098633, 26.813602447509766]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 2.0, 7.0, 6.0, 8.0, 8.0, 14.0, 18.0, 15.0, 14.0, 23.0, 26.0, 19.0, 24.0, 32.0, 27.0, 28.0, 46.0, 35.0, 49.0, 37.0, 36.0, 38.0, 39.0, 39.0, 44.0, 42.0, 38.0, 44.0, 32.0, 31.0, 24.0, 26.0, 22.0, 12.0, 17.0, 10.0, 19.0, 5.0, 5.0, 8.0, 6.0, 11.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-29.367952346801758, -28.423612594604492, -27.479272842407227, -26.534934997558594, -25.590595245361328, -24.646255493164062, -23.701915740966797, -22.75757598876953, -21.813236236572266, -20.868896484375, -19.924556732177734, -18.98021697998047, -18.035879135131836, -17.09153938293457, -16.147199630737305, -15.202859878540039, -14.258522033691406, -13.31418228149414, -12.369843482971191, -11.425503730773926, -10.481164932250977, -9.536825180053711, -8.592485427856445, -7.648146152496338, -6.7038068771362305, -5.759467601776123, -4.815128326416016, -3.87078857421875, -2.9264492988586426, -1.9821100234985352, -1.0377702713012695, -0.09343099594116211, 0.8509063720703125, 1.7952457666397095, 2.7395851612091064, 3.683924674987793, 4.6282639503479, 5.572603225708008, 6.516942977905273, 7.461282253265381, 8.405621528625488, 9.349961280822754, 10.294300079345703, 11.238639831542969, 12.182979583740234, 13.127318382263184, 14.07165813446045, 15.015996932983398, 15.960336685180664, 16.90467643737793, 17.849016189575195, 18.793354034423828, 19.737693786621094, 20.68203353881836, 21.626373291015625, 22.57071304321289, 23.515052795410156, 24.459392547607422, 25.403732299804688, 26.348072052001953, 27.292409896850586, 28.23674964904785, 29.181089401245117, 30.125429153442383, 31.069766998291016]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [3.0, 5.0, 6.0, 8.0, 14.0, 20.0, 32.0, 45.0, 94.0, 155.0, 243.0, 434.0, 622.0, 1079.0, 1727.0, 2867.0, 4564.0, 7634.0, 11909.0, 18935.0, 30597.0, 48404.0, 75706.0, 115644.0, 172381.0, 245769.0, 332018.0, 413289.0, 472904.0, 486253.0, 450528.0, 378725.0, 292919.0, 211883.0, 146957.0, 97261.0, 63464.0, 40596.0, 25500.0, 15995.0, 10175.0, 6375.0, 4065.0, 2422.0, 1529.0, 954.0, 620.0, 371.0, 246.0, 137.0, 78.0, 58.0, 24.0, 26.0, 13.0, 10.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.453125, -18.7890625, -18.125, -17.4609375, -16.796875, -16.1328125, -15.46875, -14.8046875, -14.140625, -13.4765625, -12.8125, -12.1484375, -11.484375, -10.8203125, -10.15625, -9.4921875, -8.828125, -8.1640625, -7.5, -6.8359375, -6.171875, -5.5078125, -4.84375, -4.1796875, -3.515625, -2.8515625, -2.1875, -1.5234375, -0.859375, -0.1953125, 0.46875, 1.1328125, 1.796875, 2.4609375, 3.125, 3.7890625, 4.453125, 5.1171875, 5.78125, 6.4453125, 7.109375, 7.7734375, 8.4375, 9.1015625, 9.765625, 10.4296875, 11.09375, 11.7578125, 12.421875, 13.0859375, 13.75, 14.4140625, 15.078125, 15.7421875, 16.40625, 17.0703125, 17.734375, 18.3984375, 19.0625, 19.7265625, 20.390625, 21.0546875, 21.71875, 22.3828125, 23.046875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 8.0, 4.0, 4.0, 7.0, 9.0, 5.0, 16.0, 15.0, 18.0, 16.0, 18.0, 23.0, 23.0, 23.0, 27.0, 31.0, 30.0, 44.0, 35.0, 39.0, 40.0, 42.0, 31.0, 35.0, 41.0, 48.0, 39.0, 39.0, 38.0, 33.0, 37.0, 21.0, 39.0, 14.0, 14.0, 13.0, 16.0, 18.0, 9.0, 5.0, 8.0, 10.0, 4.0, 6.0, 2.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-25.828125, -25.010009765625, -24.19189453125, -23.373779296875, -22.5556640625, -21.737548828125, -20.91943359375, -20.101318359375, -19.283203125, -18.465087890625, -17.64697265625, -16.828857421875, -16.0107421875, -15.192626953125, -14.37451171875, -13.556396484375, -12.73828125, -11.920166015625, -11.10205078125, -10.283935546875, -9.4658203125, -8.647705078125, -7.82958984375, -7.011474609375, -6.193359375, -5.375244140625, -4.55712890625, -3.739013671875, -2.9208984375, -2.102783203125, -1.28466796875, -0.466552734375, 0.3515625, 1.169677734375, 1.98779296875, 2.805908203125, 3.6240234375, 4.442138671875, 5.26025390625, 6.078369140625, 6.896484375, 7.714599609375, 8.53271484375, 9.350830078125, 10.1689453125, 10.987060546875, 11.80517578125, 12.623291015625, 13.44140625, 14.259521484375, 15.07763671875, 15.895751953125, 16.7138671875, 17.531982421875, 18.35009765625, 19.168212890625, 19.986328125, 20.804443359375, 21.62255859375, 22.440673828125, 23.2587890625, 24.076904296875, 24.89501953125, 25.713134765625, 26.53125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 13.0, 15.0, 29.0, 43.0, 54.0, 101.0, 202.0, 319.0, 455.0, 764.0, 1194.0, 1815.0, 2957.0, 4817.0, 7563.0, 11780.0, 17837.0, 27354.0, 41352.0, 61123.0, 89111.0, 126481.0, 173623.0, 229938.0, 290603.0, 348406.0, 393284.0, 412053.0, 400801.0, 363880.0, 308116.0, 247138.0, 189834.0, 139400.0, 99577.0, 68748.0, 46463.0, 30895.0, 19994.0, 12974.0, 8470.0, 5538.0, 3367.0, 2151.0, 1371.0, 871.0, 487.0, 368.0, 211.0, 121.0, 81.0, 56.0, 31.0, 28.0, 16.0, 8.0, 4.0, 6.0, 3.0], "bins": [-20.90625, -20.265869140625, -19.62548828125, -18.985107421875, -18.3447265625, -17.704345703125, -17.06396484375, -16.423583984375, -15.783203125, -15.142822265625, -14.50244140625, -13.862060546875, -13.2216796875, -12.581298828125, -11.94091796875, -11.300537109375, -10.66015625, -10.019775390625, -9.37939453125, -8.739013671875, -8.0986328125, -7.458251953125, -6.81787109375, -6.177490234375, -5.537109375, -4.896728515625, -4.25634765625, -3.615966796875, -2.9755859375, -2.335205078125, -1.69482421875, -1.054443359375, -0.4140625, 0.226318359375, 0.86669921875, 1.507080078125, 2.1474609375, 2.787841796875, 3.42822265625, 4.068603515625, 4.708984375, 5.349365234375, 5.98974609375, 6.630126953125, 7.2705078125, 7.910888671875, 8.55126953125, 9.191650390625, 9.83203125, 10.472412109375, 11.11279296875, 11.753173828125, 12.3935546875, 13.033935546875, 13.67431640625, 14.314697265625, 14.955078125, 15.595458984375, 16.23583984375, 16.876220703125, 17.5166015625, 18.156982421875, 18.79736328125, 19.437744140625, 20.078125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 4.0, 12.0, 17.0, 16.0, 15.0, 20.0, 26.0, 42.0, 42.0, 59.0, 50.0, 62.0, 85.0, 108.0, 115.0, 129.0, 147.0, 141.0, 168.0, 170.0, 168.0, 212.0, 192.0, 199.0, 177.0, 195.0, 173.0, 173.0, 154.0, 143.0, 124.0, 134.0, 108.0, 89.0, 68.0, 75.0, 54.0, 38.0, 41.0, 29.0, 23.0, 18.0, 15.0, 4.0, 10.0, 7.0, 6.0, 6.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.3515625, -10.0076904296875, -9.663818359375, -9.3199462890625, -8.97607421875, -8.6322021484375, -8.288330078125, -7.9444580078125, -7.6005859375, -7.2567138671875, -6.912841796875, -6.5689697265625, -6.22509765625, -5.8812255859375, -5.537353515625, -5.1934814453125, -4.849609375, -4.5057373046875, -4.161865234375, -3.8179931640625, -3.47412109375, -3.1302490234375, -2.786376953125, -2.4425048828125, -2.0986328125, -1.7547607421875, -1.410888671875, -1.0670166015625, -0.72314453125, -0.3792724609375, -0.035400390625, 0.3084716796875, 0.65234375, 0.9962158203125, 1.340087890625, 1.6839599609375, 2.02783203125, 2.3717041015625, 2.715576171875, 3.0594482421875, 3.4033203125, 3.7471923828125, 4.091064453125, 4.4349365234375, 4.77880859375, 5.1226806640625, 5.466552734375, 5.8104248046875, 6.154296875, 6.4981689453125, 6.842041015625, 7.1859130859375, 7.52978515625, 7.8736572265625, 8.217529296875, 8.5614013671875, 8.9052734375, 9.2491455078125, 9.593017578125, 9.9368896484375, 10.28076171875, 10.6246337890625, 10.968505859375, 11.3123779296875, 11.65625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 3.0, 10.0, 3.0, 7.0, 8.0, 10.0, 16.0, 12.0, 19.0, 27.0, 22.0, 35.0, 33.0, 26.0, 31.0, 31.0, 29.0, 49.0, 34.0, 32.0, 44.0, 34.0, 46.0, 36.0, 38.0, 43.0, 29.0, 29.0, 31.0, 22.0, 27.0, 17.0, 22.0, 21.0, 20.0, 20.0, 14.0, 13.0, 11.0, 9.0, 10.0, 5.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.437240600585938, -23.615877151489258, -22.794513702392578, -21.9731502532959, -21.15178680419922, -20.330421447753906, -19.50905990600586, -18.687694549560547, -17.866331100463867, -17.044967651367188, -16.223604202270508, -15.402240753173828, -14.580876350402832, -13.759512901306152, -12.938149452209473, -12.116785049438477, -11.295422554016113, -10.474059104919434, -9.652695655822754, -8.831331253051758, -8.009967803955078, -7.188604354858398, -6.367240905761719, -5.545876979827881, -4.724513530731201, -3.9031498432159424, -3.0817861557006836, -2.260422706604004, -1.4390590190887451, -0.6176953315734863, 0.20366811752319336, 1.0250320434570312, 1.846395492553711, 2.6677591800689697, 3.4891228675842285, 4.310486316680908, 5.131850242614746, 5.953213691711426, 6.7745771408081055, 7.595941066741943, 8.417304992675781, 9.238668441772461, 10.06003189086914, 10.88139533996582, 11.702759742736816, 12.524123191833496, 13.345486640930176, 14.166851043701172, 14.988213539123535, 15.809576988220215, 16.63094139099121, 17.45230484008789, 18.27366828918457, 19.09503173828125, 19.91639518737793, 20.73775863647461, 21.55912208557129, 22.38048553466797, 23.20184898376465, 24.023212432861328, 24.844575881958008, 25.665939331054688, 26.4873046875, 27.30866813659668, 28.13003158569336]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 8.0, 8.0, 17.0, 11.0, 15.0, 20.0, 26.0, 20.0, 26.0, 15.0, 31.0, 31.0, 28.0, 31.0, 38.0, 36.0, 39.0, 43.0, 42.0, 38.0, 42.0, 39.0, 42.0, 44.0, 35.0, 29.0, 24.0, 44.0, 21.0, 29.0, 14.0, 15.0, 17.0, 18.0, 7.0, 10.0, 7.0, 9.0, 9.0, 7.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0], "bins": [-32.672080993652344, -31.711727142333984, -30.751371383666992, -29.791015625, -28.83066177368164, -27.87030792236328, -26.90995216369629, -25.949596405029297, -24.989242553710938, -24.028888702392578, -23.068532943725586, -22.108177185058594, -21.147823333740234, -20.187469482421875, -19.227113723754883, -18.26675796508789, -17.30640411376953, -16.346050262451172, -15.38569450378418, -14.425339698791504, -13.464984893798828, -12.504630088806152, -11.544275283813477, -10.5839204788208, -9.623565673828125, -8.66321086883545, -7.702856063842773, -6.742501258850098, -5.782146453857422, -4.821791648864746, -3.8614368438720703, -2.9010820388793945, -1.940725326538086, -0.9803705215454102, -0.020015716552734375, 0.9403390884399414, 1.9006938934326172, 2.861048698425293, 3.8214035034179688, 4.7817583084106445, 5.74211311340332, 6.702467918395996, 7.662822723388672, 8.623177528381348, 9.583532333374023, 10.5438871383667, 11.504241943359375, 12.46459674835205, 13.424951553344727, 14.385306358337402, 15.345661163330078, 16.306015014648438, 17.26637077331543, 18.226726531982422, 19.18708038330078, 20.14743423461914, 21.107789993286133, 22.068145751953125, 23.028499603271484, 23.988853454589844, 24.949209213256836, 25.909564971923828, 26.869918823242188, 27.830272674560547, 28.79062843322754]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 12.0, 17.0, 31.0, 27.0, 42.0, 101.0, 155.0, 252.0, 398.0, 624.0, 959.0, 1490.0, 2442.0, 3955.0, 6150.0, 9253.0, 13943.0, 21093.0, 29706.0, 41433.0, 55192.0, 70207.0, 85181.0, 95777.0, 101429.0, 100276.0, 93204.0, 80332.0, 65464.0, 50881.0, 37789.0, 26646.0, 18753.0, 12426.0, 8275.0, 5328.0, 3465.0, 2213.0, 1357.0, 826.0, 548.0, 325.0, 218.0, 126.0, 83.0, 64.0, 36.0, 16.0, 13.0, 11.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.484375, -12.0924072265625, -11.700439453125, -11.3084716796875, -10.91650390625, -10.5245361328125, -10.132568359375, -9.7406005859375, -9.3486328125, -8.9566650390625, -8.564697265625, -8.1727294921875, -7.78076171875, -7.3887939453125, -6.996826171875, -6.6048583984375, -6.212890625, -5.8209228515625, -5.428955078125, -5.0369873046875, -4.64501953125, -4.2530517578125, -3.861083984375, -3.4691162109375, -3.0771484375, -2.6851806640625, -2.293212890625, -1.9012451171875, -1.50927734375, -1.1173095703125, -0.725341796875, -0.3333740234375, 0.05859375, 0.4505615234375, 0.842529296875, 1.2344970703125, 1.62646484375, 2.0184326171875, 2.410400390625, 2.8023681640625, 3.1943359375, 3.5863037109375, 3.978271484375, 4.3702392578125, 4.76220703125, 5.1541748046875, 5.546142578125, 5.9381103515625, 6.330078125, 6.7220458984375, 7.114013671875, 7.5059814453125, 7.89794921875, 8.2899169921875, 8.681884765625, 9.0738525390625, 9.4658203125, 9.8577880859375, 10.249755859375, 10.6417236328125, 11.03369140625, 11.4256591796875, 11.817626953125, 12.2095947265625, 12.6015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 7.0, 14.0, 11.0, 12.0, 19.0, 15.0, 27.0, 20.0, 26.0, 16.0, 30.0, 33.0, 30.0, 30.0, 39.0, 31.0, 44.0, 45.0, 40.0, 42.0, 37.0, 36.0, 49.0, 40.0, 30.0, 30.0, 24.0, 44.0, 22.0, 25.0, 18.0, 13.0, 19.0, 15.0, 10.0, 9.0, 7.0, 9.0, 7.0, 8.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0], "bins": [-33.1875, -32.213623046875, -31.23974609375, -30.265869140625, -29.2919921875, -28.318115234375, -27.34423828125, -26.370361328125, -25.396484375, -24.422607421875, -23.44873046875, -22.474853515625, -21.5009765625, -20.527099609375, -19.55322265625, -18.579345703125, -17.60546875, -16.631591796875, -15.65771484375, -14.683837890625, -13.7099609375, -12.736083984375, -11.76220703125, -10.788330078125, -9.814453125, -8.840576171875, -7.86669921875, -6.892822265625, -5.9189453125, -4.945068359375, -3.97119140625, -2.997314453125, -2.0234375, -1.049560546875, -0.07568359375, 0.898193359375, 1.8720703125, 2.845947265625, 3.81982421875, 4.793701171875, 5.767578125, 6.741455078125, 7.71533203125, 8.689208984375, 9.6630859375, 10.636962890625, 11.61083984375, 12.584716796875, 13.55859375, 14.532470703125, 15.50634765625, 16.480224609375, 17.4541015625, 18.427978515625, 19.40185546875, 20.375732421875, 21.349609375, 22.323486328125, 23.29736328125, 24.271240234375, 25.2451171875, 26.218994140625, 27.19287109375, 28.166748046875, 29.140625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 5.0, 4.0, 8.0, 15.0, 24.0, 35.0, 52.0, 57.0, 79.0, 138.0, 178.0, 225.0, 364.0, 512.0, 719.0, 1011.0, 1449.0, 2012.0, 2807.0, 3810.0, 5203.0, 7425.0, 10504.0, 15220.0, 22478.0, 50332.0, 697550.0, 141392.0, 26057.0, 17335.0, 11811.0, 8472.0, 6174.0, 4334.0, 3267.0, 2188.0, 1622.0, 1098.0, 819.0, 525.0, 358.0, 272.0, 174.0, 138.0, 87.0, 61.0, 37.0, 37.0, 25.0, 17.0, 17.0, 13.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-22.71875, -21.953125, -21.1875, -20.421875, -19.65625, -18.890625, -18.125, -17.359375, -16.59375, -15.828125, -15.0625, -14.296875, -13.53125, -12.765625, -12.0, -11.234375, -10.46875, -9.703125, -8.9375, -8.171875, -7.40625, -6.640625, -5.875, -5.109375, -4.34375, -3.578125, -2.8125, -2.046875, -1.28125, -0.515625, 0.25, 1.015625, 1.78125, 2.546875, 3.3125, 4.078125, 4.84375, 5.609375, 6.375, 7.140625, 7.90625, 8.671875, 9.4375, 10.203125, 10.96875, 11.734375, 12.5, 13.265625, 14.03125, 14.796875, 15.5625, 16.328125, 17.09375, 17.859375, 18.625, 19.390625, 20.15625, 20.921875, 21.6875, 22.453125, 23.21875, 23.984375, 24.75, 25.515625, 26.28125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 3.0, 9.0, 6.0, 7.0, 14.0, 16.0, 18.0, 20.0, 26.0, 24.0, 28.0, 21.0, 31.0, 32.0, 36.0, 37.0, 50.0, 38.0, 52.0, 42.0, 41.0, 39.0, 39.0, 38.0, 37.0, 28.0, 34.0, 32.0, 25.0, 27.0, 21.0, 27.0, 18.0, 17.0, 16.0, 9.0, 10.0, 7.0, 3.0, 5.0, 6.0, 1.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.015625, -25.239501953125, -24.46337890625, -23.687255859375, -22.9111328125, -22.135009765625, -21.35888671875, -20.582763671875, -19.806640625, -19.030517578125, -18.25439453125, -17.478271484375, -16.7021484375, -15.926025390625, -15.14990234375, -14.373779296875, -13.59765625, -12.821533203125, -12.04541015625, -11.269287109375, -10.4931640625, -9.717041015625, -8.94091796875, -8.164794921875, -7.388671875, -6.612548828125, -5.83642578125, -5.060302734375, -4.2841796875, -3.508056640625, -2.73193359375, -1.955810546875, -1.1796875, -0.403564453125, 0.37255859375, 1.148681640625, 1.9248046875, 2.700927734375, 3.47705078125, 4.253173828125, 5.029296875, 5.805419921875, 6.58154296875, 7.357666015625, 8.1337890625, 8.909912109375, 9.68603515625, 10.462158203125, 11.23828125, 12.014404296875, 12.79052734375, 13.566650390625, 14.3427734375, 15.118896484375, 15.89501953125, 16.671142578125, 17.447265625, 18.223388671875, 18.99951171875, 19.775634765625, 20.5517578125, 21.327880859375, 22.10400390625, 22.880126953125, 23.65625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 7.0, 7.0, 5.0, 15.0, 17.0, 29.0, 33.0, 61.0, 81.0, 119.0, 178.0, 264.0, 396.0, 626.0, 995.0, 1580.0, 2662.0, 4509.0, 7827.0, 14427.0, 27845.0, 185090.0, 718093.0, 40987.0, 18184.0, 9945.0, 5665.0, 3359.0, 2041.0, 1233.0, 736.0, 504.0, 332.0, 207.0, 156.0, 113.0, 65.0, 50.0, 36.0, 24.0, 15.0, 9.0, 13.0, 6.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.48046875, -3.37237548828125, -3.2642822265625, -3.15618896484375, -3.048095703125, -2.94000244140625, -2.8319091796875, -2.72381591796875, -2.61572265625, -2.50762939453125, -2.3995361328125, -2.29144287109375, -2.183349609375, -2.07525634765625, -1.9671630859375, -1.85906982421875, -1.7509765625, -1.64288330078125, -1.5347900390625, -1.42669677734375, -1.318603515625, -1.21051025390625, -1.1024169921875, -0.99432373046875, -0.88623046875, -0.77813720703125, -0.6700439453125, -0.56195068359375, -0.453857421875, -0.34576416015625, -0.2376708984375, -0.12957763671875, -0.021484375, 0.08660888671875, 0.1947021484375, 0.30279541015625, 0.410888671875, 0.51898193359375, 0.6270751953125, 0.73516845703125, 0.84326171875, 0.95135498046875, 1.0594482421875, 1.16754150390625, 1.275634765625, 1.38372802734375, 1.4918212890625, 1.59991455078125, 1.7080078125, 1.81610107421875, 1.9241943359375, 2.03228759765625, 2.140380859375, 2.24847412109375, 2.3565673828125, 2.46466064453125, 2.57275390625, 2.68084716796875, 2.7889404296875, 2.89703369140625, 3.005126953125, 3.11322021484375, 3.2213134765625, 3.32940673828125, 3.4375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 8.0, 11.0, 14.0, 10.0, 16.0, 18.0, 15.0, 29.0, 33.0, 42.0, 41.0, 47.0, 63.0, 63.0, 70.0, 62.0, 76.0, 50.0, 53.0, 44.0, 43.0, 40.0, 32.0, 22.0, 15.0, 14.0, 19.0, 10.0, 14.0, 6.0, 5.0, 0.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0009069442749023438, -0.0008811578154563904, -0.000855371356010437, -0.0008295848965644836, -0.0008037984371185303, -0.0007780119776725769, -0.0007522255182266235, -0.0007264390587806702, -0.0007006525993347168, -0.0006748661398887634, -0.0006490796804428101, -0.0006232932209968567, -0.0005975067615509033, -0.00057172030210495, -0.0005459338426589966, -0.0005201473832130432, -0.0004943609237670898, -0.0004685744643211365, -0.0004427880048751831, -0.00041700154542922974, -0.00039121508598327637, -0.000365428626537323, -0.00033964216709136963, -0.00031385570764541626, -0.0002880692481994629, -0.0002622827887535095, -0.00023649632930755615, -0.00021070986986160278, -0.00018492341041564941, -0.00015913695096969604, -0.00013335049152374268, -0.0001075640320777893, -8.177757263183594e-05, -5.599111318588257e-05, -3.02046537399292e-05, -4.41819429397583e-06, 2.136826515197754e-05, 4.715472459793091e-05, 7.294118404388428e-05, 9.872764348983765e-05, 0.00012451410293579102, 0.00015030056238174438, 0.00017608702182769775, 0.00020187348127365112, 0.0002276599407196045, 0.00025344640016555786, 0.00027923285961151123, 0.0003050193190574646, 0.00033080577850341797, 0.00035659223794937134, 0.0003823786973953247, 0.0004081651568412781, 0.00043395161628723145, 0.0004597380757331848, 0.0004855245351791382, 0.0005113109946250916, 0.0005370974540710449, 0.0005628839135169983, 0.0005886703729629517, 0.000614456832408905, 0.0006402432918548584, 0.0006660297513008118, 0.0006918162107467651, 0.0007176026701927185, 0.0007433891296386719]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 3.0, 10.0, 13.0, 17.0, 35.0, 34.0, 75.0, 95.0, 114.0, 174.0, 290.0, 386.0, 590.0, 791.0, 1178.0, 1726.0, 2630.0, 3992.0, 6271.0, 10221.0, 17631.0, 31343.0, 55264.0, 97434.0, 151737.0, 190671.0, 176140.0, 124327.0, 73818.0, 41640.0, 23513.0, 13335.0, 7971.0, 5115.0, 3193.0, 2118.0, 1483.0, 947.0, 690.0, 478.0, 322.0, 253.0, 164.0, 99.0, 75.0, 58.0, 33.0, 24.0, 17.0, 8.0, 7.0, 4.0, 4.0, 0.0, 2.0], "bins": [-1.6279296875, -1.581085205078125, -1.53424072265625, -1.487396240234375, -1.4405517578125, -1.393707275390625, -1.34686279296875, -1.300018310546875, -1.253173828125, -1.206329345703125, -1.15948486328125, -1.112640380859375, -1.0657958984375, -1.018951416015625, -0.97210693359375, -0.925262451171875, -0.87841796875, -0.831573486328125, -0.78472900390625, -0.737884521484375, -0.6910400390625, -0.644195556640625, -0.59735107421875, -0.550506591796875, -0.503662109375, -0.456817626953125, -0.40997314453125, -0.363128662109375, -0.3162841796875, -0.269439697265625, -0.22259521484375, -0.175750732421875, -0.12890625, -0.082061767578125, -0.03521728515625, 0.011627197265625, 0.0584716796875, 0.105316162109375, 0.15216064453125, 0.199005126953125, 0.245849609375, 0.292694091796875, 0.33953857421875, 0.386383056640625, 0.4332275390625, 0.480072021484375, 0.52691650390625, 0.573760986328125, 0.62060546875, 0.667449951171875, 0.71429443359375, 0.761138916015625, 0.8079833984375, 0.854827880859375, 0.90167236328125, 0.948516845703125, 0.995361328125, 1.042205810546875, 1.08905029296875, 1.135894775390625, 1.1827392578125, 1.229583740234375, 1.27642822265625, 1.323272705078125, 1.3701171875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 7.0, 8.0, 13.0, 13.0, 13.0, 10.0, 21.0, 28.0, 26.0, 22.0, 42.0, 45.0, 57.0, 66.0, 66.0, 50.0, 66.0, 68.0, 49.0, 48.0, 46.0, 45.0, 30.0, 28.0, 21.0, 14.0, 20.0, 15.0, 4.0, 10.0, 7.0, 6.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5263671875, -0.5099639892578125, -0.493560791015625, -0.4771575927734375, -0.46075439453125, -0.4443511962890625, -0.427947998046875, -0.4115447998046875, -0.3951416015625, -0.3787384033203125, -0.362335205078125, -0.3459320068359375, -0.32952880859375, -0.3131256103515625, -0.296722412109375, -0.2803192138671875, -0.263916015625, -0.2475128173828125, -0.231109619140625, -0.2147064208984375, -0.19830322265625, -0.1819000244140625, -0.165496826171875, -0.1490936279296875, -0.1326904296875, -0.1162872314453125, -0.099884033203125, -0.0834808349609375, -0.06707763671875, -0.0506744384765625, -0.034271240234375, -0.0178680419921875, -0.00146484375, 0.0149383544921875, 0.031341552734375, 0.0477447509765625, 0.06414794921875, 0.0805511474609375, 0.096954345703125, 0.1133575439453125, 0.1297607421875, 0.1461639404296875, 0.162567138671875, 0.1789703369140625, 0.19537353515625, 0.2117767333984375, 0.228179931640625, 0.2445831298828125, 0.260986328125, 0.2773895263671875, 0.293792724609375, 0.3101959228515625, 0.32659912109375, 0.3430023193359375, 0.359405517578125, 0.3758087158203125, 0.3922119140625, 0.4086151123046875, 0.425018310546875, 0.4414215087890625, 0.45782470703125, 0.4742279052734375, 0.490631103515625, 0.5070343017578125, 0.5234375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 5.0, 1.0, 4.0, 13.0, 18.0, 12.0, 11.0, 20.0, 19.0, 34.0, 22.0, 30.0, 30.0, 24.0, 33.0, 33.0, 41.0, 46.0, 45.0, 33.0, 42.0, 38.0, 46.0, 52.0, 28.0, 40.0, 30.0, 28.0, 31.0, 27.0, 14.0, 20.0, 15.0, 24.0, 19.0, 15.0, 8.0, 9.0, 12.0, 10.0, 6.0, 3.0, 3.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.495849609375, -23.61009979248047, -22.72435188293457, -21.83860206604004, -20.952852249145508, -20.06710433959961, -19.181354522705078, -18.295604705810547, -17.409854888916016, -16.524105072021484, -15.63835620880127, -14.752607345581055, -13.866857528686523, -12.981108665466309, -12.095359802246094, -11.209609985351562, -10.323861122131348, -9.438112258911133, -8.552362442016602, -7.666613578796387, -6.7808637619018555, -5.895114898681641, -5.009365558624268, -4.1236162185668945, -3.2378668785095215, -2.3521175384521484, -1.466368317604065, -0.5806190967559814, 0.3051302433013916, 1.1908793449401855, 2.0766286849975586, 2.9623780250549316, 3.8481273651123047, 4.733876705169678, 5.619626045227051, 6.505374908447266, 7.391124725341797, 8.276873588562012, 9.162622451782227, 10.048372268676758, 10.934122085571289, 11.819870948791504, 12.705620765686035, 13.59136962890625, 14.477119445800781, 15.362868309020996, 16.24861717224121, 17.134366989135742, 18.02011489868164, 18.905864715576172, 19.79161262512207, 20.6773624420166, 21.563112258911133, 22.44886016845703, 23.334609985351562, 24.220359802246094, 25.106109619140625, 25.991859436035156, 26.877607345581055, 27.763357162475586, 28.649106979370117, 29.534854888916016, 30.420604705810547, 31.306354522705078, 32.19210433959961]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 5.0, 7.0, 13.0, 12.0, 14.0, 17.0, 19.0, 25.0, 20.0, 24.0, 20.0, 27.0, 36.0, 26.0, 36.0, 36.0, 29.0, 45.0, 45.0, 41.0, 36.0, 42.0, 39.0, 42.0, 46.0, 30.0, 30.0, 22.0, 39.0, 25.0, 27.0, 17.0, 12.0, 18.0, 18.0, 9.0, 9.0, 5.0, 10.0, 7.0, 8.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 5.0, 0.0, 1.0], "bins": [-33.08607864379883, -32.11357498168945, -31.141069412231445, -30.16856575012207, -29.196060180664062, -28.223556518554688, -27.251052856445312, -26.278549194335938, -25.30604362487793, -24.333539962768555, -23.361034393310547, -22.388530731201172, -21.416027069091797, -20.44352149963379, -19.471017837524414, -18.498512268066406, -17.52600860595703, -16.553504943847656, -15.580999374389648, -14.608495712280273, -13.635991096496582, -12.66348648071289, -11.690982818603516, -10.718478202819824, -9.745973587036133, -8.773468971252441, -7.800964832305908, -6.828460693359375, -5.855956077575684, -4.883451461791992, -3.910947322845459, -2.938443183898926, -1.9659385681152344, -0.9934341907501221, -0.020929813385009766, 0.9515745639801025, 1.9240789413452148, 2.8965835571289062, 3.8690876960754395, 4.841591835021973, 5.814096450805664, 6.7866010665893555, 7.759105205535889, 8.731609344482422, 9.704113960266113, 10.676618576049805, 11.64912223815918, 12.621626853942871, 13.594131469726562, 14.566636085510254, 15.539140701293945, 16.51164436340332, 17.484149932861328, 18.456653594970703, 19.429157257080078, 20.401660919189453, 21.37416648864746, 22.346670150756836, 23.319175720214844, 24.29167938232422, 25.264183044433594, 26.2366886138916, 27.209192276000977, 28.181697845458984, 29.15420150756836]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 3.0, 5.0, 13.0, 15.0, 36.0, 60.0, 70.0, 117.0, 217.0, 328.0, 552.0, 1101.0, 1847.0, 3214.0, 5610.0, 9628.0, 16717.0, 27584.0, 44538.0, 66618.0, 93802.0, 119877.0, 135920.0, 135679.0, 118341.0, 92601.0, 65435.0, 43051.0, 27012.0, 16189.0, 9449.0, 5575.0, 3138.0, 1742.0, 1009.0, 560.0, 338.0, 208.0, 122.0, 77.0, 52.0, 42.0, 21.0, 10.0, 10.0, 9.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.28125, -28.365478515625, -27.44970703125, -26.533935546875, -25.6181640625, -24.702392578125, -23.78662109375, -22.870849609375, -21.955078125, -21.039306640625, -20.12353515625, -19.207763671875, -18.2919921875, -17.376220703125, -16.46044921875, -15.544677734375, -14.62890625, -13.713134765625, -12.79736328125, -11.881591796875, -10.9658203125, -10.050048828125, -9.13427734375, -8.218505859375, -7.302734375, -6.386962890625, -5.47119140625, -4.555419921875, -3.6396484375, -2.723876953125, -1.80810546875, -0.892333984375, 0.0234375, 0.939208984375, 1.85498046875, 2.770751953125, 3.6865234375, 4.602294921875, 5.51806640625, 6.433837890625, 7.349609375, 8.265380859375, 9.18115234375, 10.096923828125, 11.0126953125, 11.928466796875, 12.84423828125, 13.760009765625, 14.67578125, 15.591552734375, 16.50732421875, 17.423095703125, 18.3388671875, 19.254638671875, 20.17041015625, 21.086181640625, 22.001953125, 22.917724609375, 23.83349609375, 24.749267578125, 25.6650390625, 26.580810546875, 27.49658203125, 28.412353515625, 29.328125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 5.0, 5.0, 16.0, 12.0, 11.0, 21.0, 20.0, 20.0, 23.0, 25.0, 22.0, 27.0, 31.0, 30.0, 39.0, 31.0, 32.0, 46.0, 40.0, 44.0, 37.0, 37.0, 43.0, 50.0, 31.0, 36.0, 26.0, 30.0, 35.0, 26.0, 29.0, 10.0, 17.0, 18.0, 14.0, 9.0, 9.0, 6.0, 9.0, 10.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-31.0, -30.0859375, -29.171875, -28.2578125, -27.34375, -26.4296875, -25.515625, -24.6015625, -23.6875, -22.7734375, -21.859375, -20.9453125, -20.03125, -19.1171875, -18.203125, -17.2890625, -16.375, -15.4609375, -14.546875, -13.6328125, -12.71875, -11.8046875, -10.890625, -9.9765625, -9.0625, -8.1484375, -7.234375, -6.3203125, -5.40625, -4.4921875, -3.578125, -2.6640625, -1.75, -0.8359375, 0.078125, 0.9921875, 1.90625, 2.8203125, 3.734375, 4.6484375, 5.5625, 6.4765625, 7.390625, 8.3046875, 9.21875, 10.1328125, 11.046875, 11.9609375, 12.875, 13.7890625, 14.703125, 15.6171875, 16.53125, 17.4453125, 18.359375, 19.2734375, 20.1875, 21.1015625, 22.015625, 22.9296875, 23.84375, 24.7578125, 25.671875, 26.5859375, 27.5]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 7.0, 10.0, 19.0, 25.0, 28.0, 57.0, 71.0, 118.0, 176.0, 240.0, 390.0, 607.0, 946.0, 1409.0, 2170.0, 3246.0, 4885.0, 7582.0, 11302.0, 16631.0, 24413.0, 34329.0, 47216.0, 62497.0, 78910.0, 93914.0, 103638.0, 105581.0, 99967.0, 87410.0, 71824.0, 55959.0, 41121.0, 29203.0, 20741.0, 13961.0, 9566.0, 6294.0, 4147.0, 2763.0, 1785.0, 1160.0, 777.0, 489.0, 354.0, 239.0, 124.0, 78.0, 76.0, 41.0, 23.0, 17.0, 11.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.375, -21.65966796875, -20.9443359375, -20.22900390625, -19.513671875, -18.79833984375, -18.0830078125, -17.36767578125, -16.65234375, -15.93701171875, -15.2216796875, -14.50634765625, -13.791015625, -13.07568359375, -12.3603515625, -11.64501953125, -10.9296875, -10.21435546875, -9.4990234375, -8.78369140625, -8.068359375, -7.35302734375, -6.6376953125, -5.92236328125, -5.20703125, -4.49169921875, -3.7763671875, -3.06103515625, -2.345703125, -1.63037109375, -0.9150390625, -0.19970703125, 0.515625, 1.23095703125, 1.9462890625, 2.66162109375, 3.376953125, 4.09228515625, 4.8076171875, 5.52294921875, 6.23828125, 6.95361328125, 7.6689453125, 8.38427734375, 9.099609375, 9.81494140625, 10.5302734375, 11.24560546875, 11.9609375, 12.67626953125, 13.3916015625, 14.10693359375, 14.822265625, 15.53759765625, 16.2529296875, 16.96826171875, 17.68359375, 18.39892578125, 19.1142578125, 19.82958984375, 20.544921875, 21.26025390625, 21.9755859375, 22.69091796875, 23.40625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 2.0, 5.0, 7.0, 5.0, 10.0, 12.0, 13.0, 12.0, 21.0, 18.0, 23.0, 26.0, 32.0, 25.0, 32.0, 38.0, 38.0, 34.0, 46.0, 34.0, 36.0, 36.0, 40.0, 41.0, 36.0, 27.0, 36.0, 47.0, 32.0, 19.0, 27.0, 24.0, 18.0, 23.0, 22.0, 19.0, 12.0, 13.0, 12.0, 8.0, 9.0, 9.0, 5.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.875, -19.28564453125, -18.6962890625, -18.10693359375, -17.517578125, -16.92822265625, -16.3388671875, -15.74951171875, -15.16015625, -14.57080078125, -13.9814453125, -13.39208984375, -12.802734375, -12.21337890625, -11.6240234375, -11.03466796875, -10.4453125, -9.85595703125, -9.2666015625, -8.67724609375, -8.087890625, -7.49853515625, -6.9091796875, -6.31982421875, -5.73046875, -5.14111328125, -4.5517578125, -3.96240234375, -3.373046875, -2.78369140625, -2.1943359375, -1.60498046875, -1.015625, -0.42626953125, 0.1630859375, 0.75244140625, 1.341796875, 1.93115234375, 2.5205078125, 3.10986328125, 3.69921875, 4.28857421875, 4.8779296875, 5.46728515625, 6.056640625, 6.64599609375, 7.2353515625, 7.82470703125, 8.4140625, 9.00341796875, 9.5927734375, 10.18212890625, 10.771484375, 11.36083984375, 11.9501953125, 12.53955078125, 13.12890625, 13.71826171875, 14.3076171875, 14.89697265625, 15.486328125, 16.07568359375, 16.6650390625, 17.25439453125, 17.84375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 12.0, 13.0, 13.0, 25.0, 34.0, 51.0, 82.0, 112.0, 177.0, 272.0, 478.0, 744.0, 1377.0, 2535.0, 4704.0, 8721.0, 16041.0, 29430.0, 51882.0, 85827.0, 127815.0, 162759.0, 169157.0, 142548.0, 100425.0, 62787.0, 36462.0, 20119.0, 10902.0, 5793.0, 3028.0, 1728.0, 957.0, 580.0, 342.0, 210.0, 139.0, 85.0, 58.0, 44.0, 29.0, 17.0, 8.0, 12.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.8359375, -11.4681396484375, -11.100341796875, -10.7325439453125, -10.36474609375, -9.9969482421875, -9.629150390625, -9.2613525390625, -8.8935546875, -8.5257568359375, -8.157958984375, -7.7901611328125, -7.42236328125, -7.0545654296875, -6.686767578125, -6.3189697265625, -5.951171875, -5.5833740234375, -5.215576171875, -4.8477783203125, -4.47998046875, -4.1121826171875, -3.744384765625, -3.3765869140625, -3.0087890625, -2.6409912109375, -2.273193359375, -1.9053955078125, -1.53759765625, -1.1697998046875, -0.802001953125, -0.4342041015625, -0.06640625, 0.3013916015625, 0.669189453125, 1.0369873046875, 1.40478515625, 1.7725830078125, 2.140380859375, 2.5081787109375, 2.8759765625, 3.2437744140625, 3.611572265625, 3.9793701171875, 4.34716796875, 4.7149658203125, 5.082763671875, 5.4505615234375, 5.818359375, 6.1861572265625, 6.553955078125, 6.9217529296875, 7.28955078125, 7.6573486328125, 8.025146484375, 8.3929443359375, 8.7607421875, 9.1285400390625, 9.496337890625, 9.8641357421875, 10.23193359375, 10.5997314453125, 10.967529296875, 11.3353271484375, 11.703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 10.0, 11.0, 12.0, 14.0, 9.0, 17.0, 19.0, 24.0, 38.0, 47.0, 34.0, 55.0, 49.0, 72.0, 59.0, 55.0, 70.0, 55.0, 40.0, 65.0, 46.0, 45.0, 26.0, 25.0, 16.0, 21.0, 18.0, 7.0, 9.0, 7.0, 3.0, 4.0, 6.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012149810791015625, -0.0011740028858184814, -0.0011330246925354004, -0.0010920464992523193, -0.0010510683059692383, -0.0010100901126861572, -0.0009691119194030762, -0.0009281337261199951, -0.0008871555328369141, -0.000846177339553833, -0.000805199146270752, -0.0007642209529876709, -0.0007232427597045898, -0.0006822645664215088, -0.0006412863731384277, -0.0006003081798553467, -0.0005593299865722656, -0.0005183517932891846, -0.0004773736000061035, -0.00043639540672302246, -0.0003954172134399414, -0.00035443902015686035, -0.0003134608268737793, -0.00027248263359069824, -0.0002315044403076172, -0.00019052624702453613, -0.00014954805374145508, -0.00010856986045837402, -6.759166717529297e-05, -2.6613473892211914e-05, 1.436471939086914e-05, 5.5342912673950195e-05, 9.632110595703125e-05, 0.0001372992992401123, 0.00017827749252319336, 0.00021925568580627441, 0.00026023387908935547, 0.0003012120723724365, 0.0003421902656555176, 0.00038316845893859863, 0.0004241466522216797, 0.00046512484550476074, 0.0005061030387878418, 0.0005470812320709229, 0.0005880594253540039, 0.000629037618637085, 0.000670015811920166, 0.0007109940052032471, 0.0007519721984863281, 0.0007929503917694092, 0.0008339285850524902, 0.0008749067783355713, 0.0009158849716186523, 0.0009568631649017334, 0.0009978413581848145, 0.0010388195514678955, 0.0010797977447509766, 0.0011207759380340576, 0.0011617541313171387, 0.0012027323246002197, 0.0012437105178833008, 0.0012846887111663818, 0.0013256669044494629, 0.001366645097732544, 0.001407623291015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 12.0, 8.0, 11.0, 26.0, 29.0, 65.0, 77.0, 99.0, 155.0, 206.0, 338.0, 472.0, 710.0, 1113.0, 1888.0, 3052.0, 4895.0, 8224.0, 13859.0, 23284.0, 37976.0, 61103.0, 89485.0, 120689.0, 141677.0, 145579.0, 125825.0, 95790.0, 65330.0, 42039.0, 25839.0, 15357.0, 9120.0, 5336.0, 3340.0, 1997.0, 1194.0, 750.0, 537.0, 344.0, 232.0, 162.0, 93.0, 84.0, 59.0, 34.0, 25.0, 16.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-10.5859375, -10.256103515625, -9.92626953125, -9.596435546875, -9.2666015625, -8.936767578125, -8.60693359375, -8.277099609375, -7.947265625, -7.617431640625, -7.28759765625, -6.957763671875, -6.6279296875, -6.298095703125, -5.96826171875, -5.638427734375, -5.30859375, -4.978759765625, -4.64892578125, -4.319091796875, -3.9892578125, -3.659423828125, -3.32958984375, -2.999755859375, -2.669921875, -2.340087890625, -2.01025390625, -1.680419921875, -1.3505859375, -1.020751953125, -0.69091796875, -0.361083984375, -0.03125, 0.298583984375, 0.62841796875, 0.958251953125, 1.2880859375, 1.617919921875, 1.94775390625, 2.277587890625, 2.607421875, 2.937255859375, 3.26708984375, 3.596923828125, 3.9267578125, 4.256591796875, 4.58642578125, 4.916259765625, 5.24609375, 5.575927734375, 5.90576171875, 6.235595703125, 6.5654296875, 6.895263671875, 7.22509765625, 7.554931640625, 7.884765625, 8.214599609375, 8.54443359375, 8.874267578125, 9.2041015625, 9.533935546875, 9.86376953125, 10.193603515625, 10.5234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 10.0, 14.0, 25.0, 18.0, 24.0, 26.0, 38.0, 41.0, 50.0, 63.0, 74.0, 79.0, 72.0, 70.0, 79.0, 56.0, 55.0, 45.0, 38.0, 31.0, 25.0, 13.0, 11.0, 11.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.94140625, -6.73858642578125, -6.5357666015625, -6.33294677734375, -6.130126953125, -5.92730712890625, -5.7244873046875, -5.52166748046875, -5.31884765625, -5.11602783203125, -4.9132080078125, -4.71038818359375, -4.507568359375, -4.30474853515625, -4.1019287109375, -3.89910888671875, -3.6962890625, -3.49346923828125, -3.2906494140625, -3.08782958984375, -2.885009765625, -2.68218994140625, -2.4793701171875, -2.27655029296875, -2.07373046875, -1.87091064453125, -1.6680908203125, -1.46527099609375, -1.262451171875, -1.05963134765625, -0.8568115234375, -0.65399169921875, -0.451171875, -0.24835205078125, -0.0455322265625, 0.15728759765625, 0.360107421875, 0.56292724609375, 0.7657470703125, 0.96856689453125, 1.17138671875, 1.37420654296875, 1.5770263671875, 1.77984619140625, 1.982666015625, 2.18548583984375, 2.3883056640625, 2.59112548828125, 2.7939453125, 2.99676513671875, 3.1995849609375, 3.40240478515625, 3.605224609375, 3.80804443359375, 4.0108642578125, 4.21368408203125, 4.41650390625, 4.61932373046875, 4.8221435546875, 5.02496337890625, 5.227783203125, 5.43060302734375, 5.6334228515625, 5.83624267578125, 6.0390625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 9.0, 10.0, 12.0, 11.0, 11.0, 14.0, 16.0, 27.0, 22.0, 25.0, 29.0, 27.0, 31.0, 35.0, 40.0, 47.0, 40.0, 38.0, 31.0, 50.0, 47.0, 36.0, 36.0, 39.0, 41.0, 28.0, 34.0, 30.0, 23.0, 17.0, 22.0, 15.0, 25.0, 14.0, 13.0, 11.0, 8.0, 9.0, 6.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.10675048828125, -24.247634887695312, -23.388521194458008, -22.52940559387207, -21.670291900634766, -20.811176300048828, -19.95206069946289, -19.092947006225586, -18.23383140563965, -17.37471580505371, -16.515602111816406, -15.656486511230469, -14.797371864318848, -13.938257217407227, -13.079142570495605, -12.220027923583984, -11.360913276672363, -10.501798629760742, -9.642683982849121, -8.7835693359375, -7.9244537353515625, -7.065339088439941, -6.20622444152832, -5.347109317779541, -4.48799467086792, -3.6288797855377197, -2.7697649002075195, -1.9106502532958984, -1.0515353679656982, -0.19242048263549805, 0.666694164276123, 1.5258092880249023, 2.3849239349365234, 3.2440388202667236, 4.103153705596924, 4.962268352508545, 5.821383476257324, 6.680498123168945, 7.539612770080566, 8.398727416992188, 9.257843017578125, 10.116957664489746, 10.976072311401367, 11.835187911987305, 12.694302558898926, 13.553417205810547, 14.412531852722168, 15.271646499633789, 16.130760192871094, 16.98987579345703, 17.848989486694336, 18.708105087280273, 19.567218780517578, 20.426334381103516, 21.285449981689453, 22.144563674926758, 23.003679275512695, 23.862794876098633, 24.721908569335938, 25.581024169921875, 26.44013786315918, 27.299253463745117, 28.158367156982422, 29.01748275756836, 29.876598358154297]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 8.0, 9.0, 13.0, 8.0, 16.0, 20.0, 19.0, 28.0, 19.0, 26.0, 26.0, 27.0, 30.0, 32.0, 32.0, 41.0, 36.0, 37.0, 34.0, 36.0, 46.0, 43.0, 43.0, 29.0, 37.0, 35.0, 34.0, 31.0, 25.0, 30.0, 19.0, 18.0, 19.0, 13.0, 20.0, 13.0, 7.0, 8.0, 13.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.841938018798828, -25.89006805419922, -24.93819808959961, -23.986326217651367, -23.034456253051758, -22.08258628845215, -21.130714416503906, -20.178844451904297, -19.226974487304688, -18.275104522705078, -17.32323455810547, -16.371362686157227, -15.419492721557617, -14.467622756958008, -13.515751838684082, -12.563880920410156, -11.612010955810547, -10.660140991210938, -9.708270072937012, -8.756399154663086, -7.804529190063477, -6.852658748626709, -5.900788307189941, -4.948917865753174, -3.9970474243164062, -3.0451769828796387, -2.093306541442871, -1.1414361000061035, -0.18956565856933594, 0.7623047828674316, 1.7141752243041992, 2.666045665740967, 3.6179161071777344, 4.569786548614502, 5.5216569900512695, 6.473527431488037, 7.425397872924805, 8.377267837524414, 9.32913875579834, 10.281009674072266, 11.232879638671875, 12.184749603271484, 13.13662052154541, 14.088491439819336, 15.040361404418945, 15.992231369018555, 16.944103240966797, 17.895973205566406, 18.847843170166016, 19.799713134765625, 20.751583099365234, 21.703454971313477, 22.655324935913086, 23.607194900512695, 24.559066772460938, 25.510936737060547, 26.462806701660156, 27.414676666259766, 28.366546630859375, 29.318418502807617, 30.270288467407227, 31.222158432006836, 32.17403030395508, 33.12590026855469, 34.0777702331543]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 14.0, 41.0, 50.0, 99.0, 181.0, 258.0, 458.0, 708.0, 1263.0, 2124.0, 3454.0, 6047.0, 10052.0, 17102.0, 28946.0, 48003.0, 77611.0, 124342.0, 190400.0, 277349.0, 377387.0, 468581.0, 522389.0, 514131.0, 450282.0, 354589.0, 256136.0, 173516.0, 111813.0, 70187.0, 42586.0, 25914.0, 15561.0, 9095.0, 5625.0, 3249.0, 1934.0, 1111.0, 695.0, 391.0, 250.0, 151.0, 78.0, 54.0, 25.0, 21.0, 15.0, 7.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.125, -22.421875, -21.71875, -21.015625, -20.3125, -19.609375, -18.90625, -18.203125, -17.5, -16.796875, -16.09375, -15.390625, -14.6875, -13.984375, -13.28125, -12.578125, -11.875, -11.171875, -10.46875, -9.765625, -9.0625, -8.359375, -7.65625, -6.953125, -6.25, -5.546875, -4.84375, -4.140625, -3.4375, -2.734375, -2.03125, -1.328125, -0.625, 0.078125, 0.78125, 1.484375, 2.1875, 2.890625, 3.59375, 4.296875, 5.0, 5.703125, 6.40625, 7.109375, 7.8125, 8.515625, 9.21875, 9.921875, 10.625, 11.328125, 12.03125, 12.734375, 13.4375, 14.140625, 14.84375, 15.546875, 16.25, 16.953125, 17.65625, 18.359375, 19.0625, 19.765625, 20.46875, 21.171875, 21.875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [5.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 11.0, 8.0, 12.0, 5.0, 9.0, 19.0, 19.0, 19.0, 26.0, 13.0, 22.0, 31.0, 29.0, 25.0, 35.0, 28.0, 36.0, 36.0, 34.0, 38.0, 33.0, 40.0, 49.0, 39.0, 37.0, 30.0, 38.0, 27.0, 38.0, 22.0, 36.0, 19.0, 19.0, 21.0, 11.0, 21.0, 18.0, 8.0, 9.0, 8.0, 7.0, 5.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.3125, -21.51123046875, -20.7099609375, -19.90869140625, -19.107421875, -18.30615234375, -17.5048828125, -16.70361328125, -15.90234375, -15.10107421875, -14.2998046875, -13.49853515625, -12.697265625, -11.89599609375, -11.0947265625, -10.29345703125, -9.4921875, -8.69091796875, -7.8896484375, -7.08837890625, -6.287109375, -5.48583984375, -4.6845703125, -3.88330078125, -3.08203125, -2.28076171875, -1.4794921875, -0.67822265625, 0.123046875, 0.92431640625, 1.7255859375, 2.52685546875, 3.328125, 4.12939453125, 4.9306640625, 5.73193359375, 6.533203125, 7.33447265625, 8.1357421875, 8.93701171875, 9.73828125, 10.53955078125, 11.3408203125, 12.14208984375, 12.943359375, 13.74462890625, 14.5458984375, 15.34716796875, 16.1484375, 16.94970703125, 17.7509765625, 18.55224609375, 19.353515625, 20.15478515625, 20.9560546875, 21.75732421875, 22.55859375, 23.35986328125, 24.1611328125, 24.96240234375, 25.763671875, 26.56494140625, 27.3662109375, 28.16748046875, 28.96875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 4.0, 8.0, 16.0, 8.0, 26.0, 46.0, 82.0, 130.0, 238.0, 375.0, 643.0, 1025.0, 1838.0, 2946.0, 4932.0, 8180.0, 13271.0, 21419.0, 34253.0, 53480.0, 82495.0, 122386.0, 176020.0, 241281.0, 313753.0, 382555.0, 431427.0, 450527.0, 429431.0, 376445.0, 307043.0, 234932.0, 170246.0, 117269.0, 78809.0, 51558.0, 32753.0, 20308.0, 12716.0, 7623.0, 4660.0, 2899.0, 1640.0, 1048.0, 585.0, 381.0, 241.0, 151.0, 72.0, 48.0, 40.0, 8.0, 14.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-21.9375, -21.239990234375, -20.54248046875, -19.844970703125, -19.1474609375, -18.449951171875, -17.75244140625, -17.054931640625, -16.357421875, -15.659912109375, -14.96240234375, -14.264892578125, -13.5673828125, -12.869873046875, -12.17236328125, -11.474853515625, -10.77734375, -10.079833984375, -9.38232421875, -8.684814453125, -7.9873046875, -7.289794921875, -6.59228515625, -5.894775390625, -5.197265625, -4.499755859375, -3.80224609375, -3.104736328125, -2.4072265625, -1.709716796875, -1.01220703125, -0.314697265625, 0.3828125, 1.080322265625, 1.77783203125, 2.475341796875, 3.1728515625, 3.870361328125, 4.56787109375, 5.265380859375, 5.962890625, 6.660400390625, 7.35791015625, 8.055419921875, 8.7529296875, 9.450439453125, 10.14794921875, 10.845458984375, 11.54296875, 12.240478515625, 12.93798828125, 13.635498046875, 14.3330078125, 15.030517578125, 15.72802734375, 16.425537109375, 17.123046875, 17.820556640625, 18.51806640625, 19.215576171875, 19.9130859375, 20.610595703125, 21.30810546875, 22.005615234375, 22.703125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 3.0, 12.0, 24.0, 25.0, 30.0, 31.0, 49.0, 59.0, 80.0, 98.0, 118.0, 121.0, 141.0, 177.0, 178.0, 224.0, 218.0, 237.0, 232.0, 223.0, 240.0, 236.0, 230.0, 201.0, 170.0, 140.0, 124.0, 107.0, 72.0, 64.0, 53.0, 41.0, 33.0, 24.0, 17.0, 13.0, 7.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.75, -13.317138671875, -12.88427734375, -12.451416015625, -12.0185546875, -11.585693359375, -11.15283203125, -10.719970703125, -10.287109375, -9.854248046875, -9.42138671875, -8.988525390625, -8.5556640625, -8.122802734375, -7.68994140625, -7.257080078125, -6.82421875, -6.391357421875, -5.95849609375, -5.525634765625, -5.0927734375, -4.659912109375, -4.22705078125, -3.794189453125, -3.361328125, -2.928466796875, -2.49560546875, -2.062744140625, -1.6298828125, -1.197021484375, -0.76416015625, -0.331298828125, 0.1015625, 0.534423828125, 0.96728515625, 1.400146484375, 1.8330078125, 2.265869140625, 2.69873046875, 3.131591796875, 3.564453125, 3.997314453125, 4.43017578125, 4.863037109375, 5.2958984375, 5.728759765625, 6.16162109375, 6.594482421875, 7.02734375, 7.460205078125, 7.89306640625, 8.325927734375, 8.7587890625, 9.191650390625, 9.62451171875, 10.057373046875, 10.490234375, 10.923095703125, 11.35595703125, 11.788818359375, 12.2216796875, 12.654541015625, 13.08740234375, 13.520263671875, 13.953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 6.0, 0.0, 3.0, 7.0, 6.0, 15.0, 10.0, 15.0, 12.0, 17.0, 18.0, 19.0, 15.0, 26.0, 33.0, 27.0, 41.0, 36.0, 34.0, 41.0, 42.0, 38.0, 41.0, 44.0, 48.0, 38.0, 29.0, 40.0, 29.0, 33.0, 23.0, 29.0, 30.0, 28.0, 17.0, 16.0, 20.0, 19.0, 10.0, 9.0, 7.0, 11.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.271831512451172, -25.450593948364258, -24.629358291625977, -23.808120727539062, -22.98688316345215, -22.165645599365234, -21.344409942626953, -20.52317237854004, -19.701934814453125, -18.88069725036621, -18.05946159362793, -17.238224029541016, -16.4169864654541, -15.595749855041504, -14.774513244628906, -13.953275680541992, -13.132039070129395, -12.310802459716797, -11.489564895629883, -10.668328285217285, -9.847090721130371, -9.025854110717773, -8.20461654663086, -7.383379936218262, -6.562142848968506, -5.74090576171875, -4.919668674468994, -4.098431587219238, -3.2771947383880615, -2.4559578895568848, -1.634720802307129, -0.813483715057373, 0.0077533721923828125, 0.8289903998374939, 1.650227427482605, 2.4714643955230713, 3.292701482772827, 4.113938331604004, 4.93517541885376, 5.756412506103516, 6.5776495933532715, 7.398886680603027, 8.220123291015625, 9.041360855102539, 9.862597465515137, 10.683834075927734, 11.505071640014648, 12.326309204101562, 13.14754581451416, 13.968782424926758, 14.790019989013672, 15.61125659942627, 16.432493209838867, 17.25373077392578, 18.074968338012695, 18.89620590209961, 19.71744155883789, 20.538679122924805, 21.359914779663086, 22.18115234375, 23.002389907836914, 23.823627471923828, 24.64486312866211, 25.466100692749023, 26.287338256835938]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 9.0, 10.0, 8.0, 15.0, 18.0, 23.0, 26.0, 21.0, 21.0, 23.0, 27.0, 33.0, 41.0, 31.0, 35.0, 27.0, 35.0, 38.0, 43.0, 35.0, 43.0, 41.0, 36.0, 42.0, 41.0, 27.0, 37.0, 30.0, 24.0, 28.0, 21.0, 20.0, 20.0, 10.0, 13.0, 12.0, 9.0, 4.0, 11.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.024250030517578, -24.063556671142578, -23.102863311767578, -22.142169952392578, -21.181476593017578, -20.220783233642578, -19.260089874267578, -18.299396514892578, -17.338703155517578, -16.378009796142578, -15.417316436767578, -14.456623077392578, -13.495929718017578, -12.535236358642578, -11.574542045593262, -10.613848686218262, -9.653154373168945, -8.692461013793945, -7.731767654418945, -6.771073818206787, -5.810380458831787, -4.849687099456787, -3.888993263244629, -2.928299903869629, -1.967606544494629, -1.0069130659103394, -0.046219587326049805, 0.9144740104675293, 1.8751673698425293, 2.8358607292175293, 3.7965545654296875, 4.7572479248046875, 5.7179412841796875, 6.6786346435546875, 7.6393280029296875, 8.600021362304688, 9.560714721679688, 10.521408081054688, 11.482102394104004, 12.442795753479004, 13.403489112854004, 14.364182472229004, 15.324875831604004, 16.28557014465332, 17.24626350402832, 18.20695686340332, 19.16765022277832, 20.12834358215332, 21.08903694152832, 22.04973030090332, 23.01042366027832, 23.97111701965332, 24.93181037902832, 25.89250373840332, 26.853199005126953, 27.813892364501953, 28.774585723876953, 29.735279083251953, 30.695972442626953, 31.656665802001953, 32.61735916137695, 33.57805252075195, 34.53874588012695, 35.49943923950195, 36.46013259887695]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 2.0, 5.0, 11.0, 21.0, 29.0, 43.0, 53.0, 104.0, 178.0, 286.0, 386.0, 662.0, 928.0, 1513.0, 2376.0, 3531.0, 5274.0, 8198.0, 11993.0, 17554.0, 25352.0, 35644.0, 48321.0, 63151.0, 77870.0, 91875.0, 101140.0, 102985.0, 97348.0, 85665.0, 71177.0, 56525.0, 41933.0, 30549.0, 21433.0, 14760.0, 10150.0, 6706.0, 4499.0, 2951.0, 1913.0, 1243.0, 807.0, 497.0, 310.0, 239.0, 122.0, 81.0, 58.0, 45.0, 15.0, 12.0, 15.0, 8.0, 4.0, 3.0, 3.0, 2.0], "bins": [-9.921875, -9.6236572265625, -9.325439453125, -9.0272216796875, -8.72900390625, -8.4307861328125, -8.132568359375, -7.8343505859375, -7.5361328125, -7.2379150390625, -6.939697265625, -6.6414794921875, -6.34326171875, -6.0450439453125, -5.746826171875, -5.4486083984375, -5.150390625, -4.8521728515625, -4.553955078125, -4.2557373046875, -3.95751953125, -3.6593017578125, -3.361083984375, -3.0628662109375, -2.7646484375, -2.4664306640625, -2.168212890625, -1.8699951171875, -1.57177734375, -1.2735595703125, -0.975341796875, -0.6771240234375, -0.37890625, -0.0806884765625, 0.217529296875, 0.5157470703125, 0.81396484375, 1.1121826171875, 1.410400390625, 1.7086181640625, 2.0068359375, 2.3050537109375, 2.603271484375, 2.9014892578125, 3.19970703125, 3.4979248046875, 3.796142578125, 4.0943603515625, 4.392578125, 4.6907958984375, 4.989013671875, 5.2872314453125, 5.58544921875, 5.8836669921875, 6.181884765625, 6.4801025390625, 6.7783203125, 7.0765380859375, 7.374755859375, 7.6729736328125, 7.97119140625, 8.2694091796875, 8.567626953125, 8.8658447265625, 9.1640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 9.0, 9.0, 10.0, 13.0, 17.0, 23.0, 27.0, 22.0, 19.0, 25.0, 25.0, 37.0, 41.0, 28.0, 36.0, 24.0, 39.0, 37.0, 41.0, 36.0, 44.0, 38.0, 38.0, 40.0, 42.0, 26.0, 37.0, 30.0, 25.0, 30.0, 20.0, 19.0, 21.0, 10.0, 14.0, 10.0, 11.0, 4.0, 9.0, 7.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.359375, -24.387939453125, -23.41650390625, -22.445068359375, -21.4736328125, -20.502197265625, -19.53076171875, -18.559326171875, -17.587890625, -16.616455078125, -15.64501953125, -14.673583984375, -13.7021484375, -12.730712890625, -11.75927734375, -10.787841796875, -9.81640625, -8.844970703125, -7.87353515625, -6.902099609375, -5.9306640625, -4.959228515625, -3.98779296875, -3.016357421875, -2.044921875, -1.073486328125, -0.10205078125, 0.869384765625, 1.8408203125, 2.812255859375, 3.78369140625, 4.755126953125, 5.7265625, 6.697998046875, 7.66943359375, 8.640869140625, 9.6123046875, 10.583740234375, 11.55517578125, 12.526611328125, 13.498046875, 14.469482421875, 15.44091796875, 16.412353515625, 17.3837890625, 18.355224609375, 19.32666015625, 20.298095703125, 21.26953125, 22.240966796875, 23.21240234375, 24.183837890625, 25.1552734375, 26.126708984375, 27.09814453125, 28.069580078125, 29.041015625, 30.012451171875, 30.98388671875, 31.955322265625, 32.9267578125, 33.898193359375, 34.86962890625, 35.841064453125, 36.8125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 12.0, 21.0, 29.0, 44.0, 60.0, 90.0, 150.0, 195.0, 351.0, 552.0, 800.0, 1242.0, 2001.0, 3132.0, 4882.0, 7403.0, 11819.0, 19232.0, 33873.0, 618931.0, 267039.0, 29918.0, 17109.0, 10698.0, 6664.0, 4378.0, 2823.0, 1859.0, 1157.0, 728.0, 475.0, 322.0, 194.0, 121.0, 73.0, 66.0, 35.0, 18.0, 15.0, 14.0, 9.0, 7.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.234375, -26.352783203125, -25.47119140625, -24.589599609375, -23.7080078125, -22.826416015625, -21.94482421875, -21.063232421875, -20.181640625, -19.300048828125, -18.41845703125, -17.536865234375, -16.6552734375, -15.773681640625, -14.89208984375, -14.010498046875, -13.12890625, -12.247314453125, -11.36572265625, -10.484130859375, -9.6025390625, -8.720947265625, -7.83935546875, -6.957763671875, -6.076171875, -5.194580078125, -4.31298828125, -3.431396484375, -2.5498046875, -1.668212890625, -0.78662109375, 0.094970703125, 0.9765625, 1.858154296875, 2.73974609375, 3.621337890625, 4.5029296875, 5.384521484375, 6.26611328125, 7.147705078125, 8.029296875, 8.910888671875, 9.79248046875, 10.674072265625, 11.5556640625, 12.437255859375, 13.31884765625, 14.200439453125, 15.08203125, 15.963623046875, 16.84521484375, 17.726806640625, 18.6083984375, 19.489990234375, 20.37158203125, 21.253173828125, 22.134765625, 23.016357421875, 23.89794921875, 24.779541015625, 25.6611328125, 26.542724609375, 27.42431640625, 28.305908203125, 29.1875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 12.0, 10.0, 16.0, 12.0, 17.0, 11.0, 32.0, 25.0, 26.0, 34.0, 34.0, 38.0, 40.0, 37.0, 36.0, 38.0, 47.0, 40.0, 52.0, 37.0, 34.0, 26.0, 36.0, 41.0, 38.0, 29.0, 25.0, 30.0, 25.0, 19.0, 21.0, 14.0, 13.0, 7.0, 13.0, 14.0, 5.0, 5.0, 6.0, 0.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.015625, -22.314208984375, -21.61279296875, -20.911376953125, -20.2099609375, -19.508544921875, -18.80712890625, -18.105712890625, -17.404296875, -16.702880859375, -16.00146484375, -15.300048828125, -14.5986328125, -13.897216796875, -13.19580078125, -12.494384765625, -11.79296875, -11.091552734375, -10.39013671875, -9.688720703125, -8.9873046875, -8.285888671875, -7.58447265625, -6.883056640625, -6.181640625, -5.480224609375, -4.77880859375, -4.077392578125, -3.3759765625, -2.674560546875, -1.97314453125, -1.271728515625, -0.5703125, 0.131103515625, 0.83251953125, 1.533935546875, 2.2353515625, 2.936767578125, 3.63818359375, 4.339599609375, 5.041015625, 5.742431640625, 6.44384765625, 7.145263671875, 7.8466796875, 8.548095703125, 9.24951171875, 9.950927734375, 10.65234375, 11.353759765625, 12.05517578125, 12.756591796875, 13.4580078125, 14.159423828125, 14.86083984375, 15.562255859375, 16.263671875, 16.965087890625, 17.66650390625, 18.367919921875, 19.0693359375, 19.770751953125, 20.47216796875, 21.173583984375, 21.875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 5.0, 5.0, 11.0, 21.0, 19.0, 39.0, 37.0, 60.0, 70.0, 99.0, 137.0, 200.0, 273.0, 401.0, 560.0, 841.0, 1250.0, 1785.0, 2749.0, 4136.0, 6164.0, 9768.0, 15615.0, 27392.0, 143622.0, 727701.0, 48177.0, 21069.0, 12500.0, 8014.0, 5289.0, 3523.0, 2231.0, 1517.0, 924.0, 701.0, 482.0, 349.0, 216.0, 154.0, 125.0, 83.0, 58.0, 48.0, 36.0, 33.0, 17.0, 16.0, 10.0, 5.0, 1.0, 9.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-2.044921875, -1.981597900390625, -1.91827392578125, -1.854949951171875, -1.7916259765625, -1.728302001953125, -1.66497802734375, -1.601654052734375, -1.538330078125, -1.475006103515625, -1.41168212890625, -1.348358154296875, -1.2850341796875, -1.221710205078125, -1.15838623046875, -1.095062255859375, -1.03173828125, -0.968414306640625, -0.90509033203125, -0.841766357421875, -0.7784423828125, -0.715118408203125, -0.65179443359375, -0.588470458984375, -0.525146484375, -0.461822509765625, -0.39849853515625, -0.335174560546875, -0.2718505859375, -0.208526611328125, -0.14520263671875, -0.081878662109375, -0.0185546875, 0.044769287109375, 0.10809326171875, 0.171417236328125, 0.2347412109375, 0.298065185546875, 0.36138916015625, 0.424713134765625, 0.488037109375, 0.551361083984375, 0.61468505859375, 0.678009033203125, 0.7413330078125, 0.804656982421875, 0.86798095703125, 0.931304931640625, 0.99462890625, 1.057952880859375, 1.12127685546875, 1.184600830078125, 1.2479248046875, 1.311248779296875, 1.37457275390625, 1.437896728515625, 1.501220703125, 1.564544677734375, 1.62786865234375, 1.691192626953125, 1.7545166015625, 1.817840576171875, 1.88116455078125, 1.944488525390625, 2.0078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 8.0, 5.0, 8.0, 12.0, 14.0, 20.0, 32.0, 40.0, 37.0, 46.0, 50.0, 65.0, 99.0, 76.0, 84.0, 84.0, 60.0, 58.0, 46.0, 28.0, 24.0, 20.0, 12.0, 10.0, 12.0, 10.0, 4.0, 6.0, 7.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004992485046386719, -0.00048423558473587036, -0.00046922266483306885, -0.00045420974493026733, -0.0004391968250274658, -0.0004241839051246643, -0.0004091709852218628, -0.0003941580653190613, -0.00037914514541625977, -0.00036413222551345825, -0.00034911930561065674, -0.0003341063857078552, -0.0003190934658050537, -0.0003040805459022522, -0.0002890676259994507, -0.00027405470609664917, -0.00025904178619384766, -0.00024402886629104614, -0.00022901594638824463, -0.00021400302648544312, -0.0001989901065826416, -0.0001839771866798401, -0.00016896426677703857, -0.00015395134687423706, -0.00013893842697143555, -0.00012392550706863403, -0.00010891258716583252, -9.3899667263031e-05, -7.888674736022949e-05, -6.387382745742798e-05, -4.8860907554626465e-05, -3.384798765182495e-05, -1.8835067749023438e-05, -3.822147846221924e-06, 1.119077205657959e-05, 2.6203691959381104e-05, 4.121661186218262e-05, 5.622953176498413e-05, 7.124245166778564e-05, 8.625537157058716e-05, 0.00010126829147338867, 0.00011628121137619019, 0.0001312941312789917, 0.0001463070511817932, 0.00016131997108459473, 0.00017633289098739624, 0.00019134581089019775, 0.00020635873079299927, 0.00022137165069580078, 0.0002363845705986023, 0.0002513974905014038, 0.0002664104104042053, 0.00028142333030700684, 0.00029643625020980835, 0.00031144917011260986, 0.0003264620900154114, 0.0003414750099182129, 0.0003564879298210144, 0.0003715008497238159, 0.00038651376962661743, 0.00040152668952941895, 0.00041653960943222046, 0.00043155252933502197, 0.0004465654492378235, 0.000461578369140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 9.0, 4.0, 12.0, 15.0, 26.0, 39.0, 45.0, 79.0, 101.0, 146.0, 250.0, 394.0, 668.0, 1076.0, 1859.0, 3205.0, 5735.0, 10454.0, 18946.0, 34130.0, 58885.0, 94553.0, 136058.0, 162919.0, 161939.0, 132529.0, 92603.0, 57568.0, 32875.0, 18218.0, 9983.0, 5541.0, 3161.0, 1763.0, 1030.0, 625.0, 345.0, 267.0, 161.0, 112.0, 64.0, 53.0, 37.0, 23.0, 17.0, 12.0, 8.0, 8.0, 7.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.345703125, -1.307220458984375, -1.26873779296875, -1.230255126953125, -1.1917724609375, -1.153289794921875, -1.11480712890625, -1.076324462890625, -1.037841796875, -0.999359130859375, -0.96087646484375, -0.922393798828125, -0.8839111328125, -0.845428466796875, -0.80694580078125, -0.768463134765625, -0.72998046875, -0.691497802734375, -0.65301513671875, -0.614532470703125, -0.5760498046875, -0.537567138671875, -0.49908447265625, -0.460601806640625, -0.422119140625, -0.383636474609375, -0.34515380859375, -0.306671142578125, -0.2681884765625, -0.229705810546875, -0.19122314453125, -0.152740478515625, -0.1142578125, -0.075775146484375, -0.03729248046875, 0.001190185546875, 0.0396728515625, 0.078155517578125, 0.11663818359375, 0.155120849609375, 0.193603515625, 0.232086181640625, 0.27056884765625, 0.309051513671875, 0.3475341796875, 0.386016845703125, 0.42449951171875, 0.462982177734375, 0.50146484375, 0.539947509765625, 0.57843017578125, 0.616912841796875, 0.6553955078125, 0.693878173828125, 0.73236083984375, 0.770843505859375, 0.809326171875, 0.847808837890625, 0.88629150390625, 0.924774169921875, 0.9632568359375, 1.001739501953125, 1.04022216796875, 1.078704833984375, 1.1171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 3.0, 2.0, 3.0, 5.0, 8.0, 6.0, 19.0, 22.0, 9.0, 16.0, 22.0, 25.0, 27.0, 24.0, 34.0, 43.0, 39.0, 43.0, 47.0, 49.0, 55.0, 46.0, 49.0, 42.0, 53.0, 39.0, 48.0, 31.0, 32.0, 29.0, 22.0, 9.0, 14.0, 15.0, 13.0, 9.0, 11.0, 10.0, 5.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.476806640625, -0.46414947509765625, -0.4514923095703125, -0.43883514404296875, -0.426177978515625, -0.41352081298828125, -0.4008636474609375, -0.38820648193359375, -0.37554931640625, -0.36289215087890625, -0.3502349853515625, -0.33757781982421875, -0.324920654296875, -0.31226348876953125, -0.2996063232421875, -0.28694915771484375, -0.2742919921875, -0.26163482666015625, -0.2489776611328125, -0.23632049560546875, -0.223663330078125, -0.21100616455078125, -0.1983489990234375, -0.18569183349609375, -0.17303466796875, -0.16037750244140625, -0.1477203369140625, -0.13506317138671875, -0.122406005859375, -0.10974884033203125, -0.0970916748046875, -0.08443450927734375, -0.07177734375, -0.05912017822265625, -0.0464630126953125, -0.03380584716796875, -0.021148681640625, -0.00849151611328125, 0.0041656494140625, 0.01682281494140625, 0.02947998046875, 0.04213714599609375, 0.0547943115234375, 0.06745147705078125, 0.080108642578125, 0.09276580810546875, 0.1054229736328125, 0.11808013916015625, 0.1307373046875, 0.14339447021484375, 0.1560516357421875, 0.16870880126953125, 0.181365966796875, 0.19402313232421875, 0.2066802978515625, 0.21933746337890625, 0.23199462890625, 0.24465179443359375, 0.2573089599609375, 0.26996612548828125, 0.282623291015625, 0.29528045654296875, 0.3079376220703125, 0.32059478759765625, 0.333251953125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 16.0, 12.0, 11.0, 19.0, 15.0, 13.0, 16.0, 23.0, 30.0, 32.0, 38.0, 35.0, 28.0, 48.0, 45.0, 41.0, 38.0, 43.0, 42.0, 46.0, 38.0, 36.0, 40.0, 29.0, 36.0, 24.0, 26.0, 29.0, 15.0, 12.0, 18.0, 13.0, 19.0, 17.0, 6.0, 7.0, 8.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.57131576538086, -26.71919059753418, -25.8670654296875, -25.01494026184082, -24.16281509399414, -23.31068992614746, -22.45856475830078, -21.60643768310547, -20.754314422607422, -19.902189254760742, -19.050064086914062, -18.197938919067383, -17.345813751220703, -16.493688583374023, -15.641562461853027, -14.789437294006348, -13.937311172485352, -13.085186004638672, -12.233060836791992, -11.380935668945312, -10.528810501098633, -9.676685333251953, -8.824559211730957, -7.972434043884277, -7.120308876037598, -6.268183708190918, -5.416058540344238, -4.5639328956604, -3.7118077278137207, -2.859682559967041, -2.007556915283203, -1.1554317474365234, -0.30330467224121094, 0.5488206148147583, 1.4009459018707275, 2.2530713081359863, 3.105196475982666, 3.9573216438293457, 4.809447288513184, 5.661572456359863, 6.513697624206543, 7.365822792053223, 8.217947959899902, 9.070074081420898, 9.922199249267578, 10.774324417114258, 11.626449584960938, 12.478574752807617, 13.330699920654297, 14.182825088500977, 15.034950256347656, 15.887075424194336, 16.739200592041016, 17.591325759887695, 18.443450927734375, 19.295578002929688, 20.147701263427734, 20.999826431274414, 21.851951599121094, 22.704076766967773, 23.556201934814453, 24.408327102661133, 25.260452270507812, 26.112579345703125, 26.964704513549805]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 9.0, 11.0, 8.0, 15.0, 18.0, 23.0, 24.0, 21.0, 22.0, 26.0, 25.0, 38.0, 38.0, 26.0, 30.0, 42.0, 32.0, 34.0, 33.0, 45.0, 42.0, 33.0, 43.0, 31.0, 50.0, 27.0, 34.0, 29.0, 27.0, 22.0, 24.0, 18.0, 23.0, 14.0, 10.0, 8.0, 11.0, 9.0, 7.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.958290100097656, -24.000320434570312, -23.04235076904297, -22.084381103515625, -21.12641143798828, -20.168441772460938, -19.210472106933594, -18.25250244140625, -17.294532775878906, -16.336563110351562, -15.378593444824219, -14.420623779296875, -13.462654113769531, -12.504684448242188, -11.546713829040527, -10.588744163513184, -9.630773544311523, -8.67280387878418, -7.714834213256836, -6.756864070892334, -5.79889440536499, -4.8409247398376465, -3.8829545974731445, -2.924984931945801, -1.967015266418457, -1.0090454816818237, -0.05107569694519043, 0.9068942070007324, 1.8648638725280762, 2.82283353805542, 3.780803680419922, 4.738773345947266, 5.696743011474609, 6.654712677001953, 7.612682342529297, 8.57065200805664, 9.528621673583984, 10.486591339111328, 11.444561958312988, 12.402531623840332, 13.360501289367676, 14.31847095489502, 15.276440620422363, 16.234411239624023, 17.192380905151367, 18.15035057067871, 19.108320236206055, 20.0662899017334, 21.024259567260742, 21.982229232788086, 22.94019889831543, 23.898168563842773, 24.856138229370117, 25.81410789489746, 26.772079467773438, 27.73004913330078, 28.688018798828125, 29.64598846435547, 30.603958129882812, 31.561927795410156, 32.5198974609375, 33.477867126464844, 34.43583679199219, 35.39380645751953, 36.351776123046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 7.0, 9.0, 22.0, 21.0, 26.0, 32.0, 58.0, 80.0, 125.0, 165.0, 284.0, 453.0, 687.0, 1149.0, 1846.0, 2969.0, 4958.0, 7939.0, 13113.0, 21287.0, 32904.0, 49464.0, 70019.0, 92088.0, 112129.0, 123278.0, 122300.0, 109002.0, 88531.0, 66079.0, 46133.0, 30500.0, 19577.0, 12094.0, 7421.0, 4548.0, 2667.0, 1664.0, 1095.0, 626.0, 387.0, 267.0, 178.0, 113.0, 86.0, 54.0, 42.0, 28.0, 22.0, 7.0, 13.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-25.71875, -24.912841796875, -24.10693359375, -23.301025390625, -22.4951171875, -21.689208984375, -20.88330078125, -20.077392578125, -19.271484375, -18.465576171875, -17.65966796875, -16.853759765625, -16.0478515625, -15.241943359375, -14.43603515625, -13.630126953125, -12.82421875, -12.018310546875, -11.21240234375, -10.406494140625, -9.6005859375, -8.794677734375, -7.98876953125, -7.182861328125, -6.376953125, -5.571044921875, -4.76513671875, -3.959228515625, -3.1533203125, -2.347412109375, -1.54150390625, -0.735595703125, 0.0703125, 0.876220703125, 1.68212890625, 2.488037109375, 3.2939453125, 4.099853515625, 4.90576171875, 5.711669921875, 6.517578125, 7.323486328125, 8.12939453125, 8.935302734375, 9.7412109375, 10.547119140625, 11.35302734375, 12.158935546875, 12.96484375, 13.770751953125, 14.57666015625, 15.382568359375, 16.1884765625, 16.994384765625, 17.80029296875, 18.606201171875, 19.412109375, 20.218017578125, 21.02392578125, 21.829833984375, 22.6357421875, 23.441650390625, 24.24755859375, 25.053466796875, 25.859375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 6.0, 3.0, 5.0, 8.0, 10.0, 7.0, 12.0, 23.0, 19.0, 22.0, 23.0, 26.0, 21.0, 27.0, 35.0, 38.0, 29.0, 27.0, 43.0, 36.0, 26.0, 40.0, 45.0, 36.0, 38.0, 41.0, 32.0, 44.0, 36.0, 27.0, 35.0, 23.0, 25.0, 21.0, 17.0, 28.0, 10.0, 15.0, 8.0, 13.0, 7.0, 5.0, 10.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.78125, -22.875, -21.96875, -21.0625, -20.15625, -19.25, -18.34375, -17.4375, -16.53125, -15.625, -14.71875, -13.8125, -12.90625, -12.0, -11.09375, -10.1875, -9.28125, -8.375, -7.46875, -6.5625, -5.65625, -4.75, -3.84375, -2.9375, -2.03125, -1.125, -0.21875, 0.6875, 1.59375, 2.5, 3.40625, 4.3125, 5.21875, 6.125, 7.03125, 7.9375, 8.84375, 9.75, 10.65625, 11.5625, 12.46875, 13.375, 14.28125, 15.1875, 16.09375, 17.0, 17.90625, 18.8125, 19.71875, 20.625, 21.53125, 22.4375, 23.34375, 24.25, 25.15625, 26.0625, 26.96875, 27.875, 28.78125, 29.6875, 30.59375, 31.5, 32.40625, 33.3125, 34.21875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 6.0, 7.0, 20.0, 22.0, 30.0, 53.0, 87.0, 136.0, 220.0, 361.0, 565.0, 1016.0, 1510.0, 2546.0, 4249.0, 6859.0, 11014.0, 17661.0, 26856.0, 39783.0, 57608.0, 77126.0, 96313.0, 110797.0, 116512.0, 112037.0, 99161.0, 80786.0, 61021.0, 43530.0, 29701.0, 19203.0, 12181.0, 7557.0, 4721.0, 2829.0, 1714.0, 1068.0, 662.0, 400.0, 240.0, 147.0, 106.0, 53.0, 34.0, 25.0, 13.0, 7.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.546875, -22.8017578125, -22.056640625, -21.3115234375, -20.56640625, -19.8212890625, -19.076171875, -18.3310546875, -17.5859375, -16.8408203125, -16.095703125, -15.3505859375, -14.60546875, -13.8603515625, -13.115234375, -12.3701171875, -11.625, -10.8798828125, -10.134765625, -9.3896484375, -8.64453125, -7.8994140625, -7.154296875, -6.4091796875, -5.6640625, -4.9189453125, -4.173828125, -3.4287109375, -2.68359375, -1.9384765625, -1.193359375, -0.4482421875, 0.296875, 1.0419921875, 1.787109375, 2.5322265625, 3.27734375, 4.0224609375, 4.767578125, 5.5126953125, 6.2578125, 7.0029296875, 7.748046875, 8.4931640625, 9.23828125, 9.9833984375, 10.728515625, 11.4736328125, 12.21875, 12.9638671875, 13.708984375, 14.4541015625, 15.19921875, 15.9443359375, 16.689453125, 17.4345703125, 18.1796875, 18.9248046875, 19.669921875, 20.4150390625, 21.16015625, 21.9052734375, 22.650390625, 23.3955078125, 24.140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 11.0, 6.0, 7.0, 17.0, 10.0, 15.0, 24.0, 29.0, 36.0, 35.0, 36.0, 30.0, 47.0, 56.0, 43.0, 52.0, 45.0, 42.0, 41.0, 38.0, 46.0, 42.0, 36.0, 50.0, 24.0, 24.0, 27.0, 36.0, 21.0, 15.0, 11.0, 7.0, 6.0, 4.0, 7.0, 3.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.125, -18.447265625, -17.76953125, -17.091796875, -16.4140625, -15.736328125, -15.05859375, -14.380859375, -13.703125, -13.025390625, -12.34765625, -11.669921875, -10.9921875, -10.314453125, -9.63671875, -8.958984375, -8.28125, -7.603515625, -6.92578125, -6.248046875, -5.5703125, -4.892578125, -4.21484375, -3.537109375, -2.859375, -2.181640625, -1.50390625, -0.826171875, -0.1484375, 0.529296875, 1.20703125, 1.884765625, 2.5625, 3.240234375, 3.91796875, 4.595703125, 5.2734375, 5.951171875, 6.62890625, 7.306640625, 7.984375, 8.662109375, 9.33984375, 10.017578125, 10.6953125, 11.373046875, 12.05078125, 12.728515625, 13.40625, 14.083984375, 14.76171875, 15.439453125, 16.1171875, 16.794921875, 17.47265625, 18.150390625, 18.828125, 19.505859375, 20.18359375, 20.861328125, 21.5390625, 22.216796875, 22.89453125, 23.572265625, 24.25]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 8.0, 23.0, 40.0, 34.0, 54.0, 107.0, 128.0, 213.0, 349.0, 550.0, 1010.0, 2117.0, 4768.0, 13761.0, 45120.0, 143263.0, 308149.0, 311170.0, 147198.0, 46752.0, 14093.0, 4880.0, 2076.0, 982.0, 625.0, 357.0, 209.0, 132.0, 119.0, 81.0, 54.0, 35.0, 27.0, 17.0, 8.0, 13.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-30.984375, -30.1240234375, -29.263671875, -28.4033203125, -27.54296875, -26.6826171875, -25.822265625, -24.9619140625, -24.1015625, -23.2412109375, -22.380859375, -21.5205078125, -20.66015625, -19.7998046875, -18.939453125, -18.0791015625, -17.21875, -16.3583984375, -15.498046875, -14.6376953125, -13.77734375, -12.9169921875, -12.056640625, -11.1962890625, -10.3359375, -9.4755859375, -8.615234375, -7.7548828125, -6.89453125, -6.0341796875, -5.173828125, -4.3134765625, -3.453125, -2.5927734375, -1.732421875, -0.8720703125, -0.01171875, 0.8486328125, 1.708984375, 2.5693359375, 3.4296875, 4.2900390625, 5.150390625, 6.0107421875, 6.87109375, 7.7314453125, 8.591796875, 9.4521484375, 10.3125, 11.1728515625, 12.033203125, 12.8935546875, 13.75390625, 14.6142578125, 15.474609375, 16.3349609375, 17.1953125, 18.0556640625, 18.916015625, 19.7763671875, 20.63671875, 21.4970703125, 22.357421875, 23.2177734375, 24.078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 7.0, 9.0, 10.0, 9.0, 14.0, 11.0, 15.0, 21.0, 28.0, 40.0, 35.0, 50.0, 51.0, 48.0, 58.0, 45.0, 54.0, 65.0, 64.0, 64.0, 50.0, 41.0, 28.0, 32.0, 27.0, 25.0, 21.0, 12.0, 19.0, 9.0, 9.0, 5.0, 6.0, 2.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0016613006591796875, -0.0016154050827026367, -0.001569509506225586, -0.0015236139297485352, -0.0014777183532714844, -0.0014318227767944336, -0.0013859272003173828, -0.001340031623840332, -0.0012941360473632812, -0.0012482404708862305, -0.0012023448944091797, -0.001156449317932129, -0.0011105537414550781, -0.0010646581649780273, -0.0010187625885009766, -0.0009728670120239258, -0.000926971435546875, -0.0008810758590698242, -0.0008351802825927734, -0.0007892847061157227, -0.0007433891296386719, -0.0006974935531616211, -0.0006515979766845703, -0.0006057024002075195, -0.0005598068237304688, -0.000513911247253418, -0.0004680156707763672, -0.0004221200942993164, -0.0003762245178222656, -0.00033032894134521484, -0.00028443336486816406, -0.00023853778839111328, -0.0001926422119140625, -0.00014674663543701172, -0.00010085105895996094, -5.4955482482910156e-05, -9.059906005859375e-06, 3.6835670471191406e-05, 8.273124694824219e-05, 0.00012862682342529297, 0.00017452239990234375, 0.00022041797637939453, 0.0002663135528564453, 0.0003122091293334961, 0.0003581047058105469, 0.00040400028228759766, 0.00044989585876464844, 0.0004957914352416992, 0.00054168701171875, 0.0005875825881958008, 0.0006334781646728516, 0.0006793737411499023, 0.0007252693176269531, 0.0007711648941040039, 0.0008170604705810547, 0.0008629560470581055, 0.0009088516235351562, 0.000954747200012207, 0.0010006427764892578, 0.0010465383529663086, 0.0010924339294433594, 0.0011383295059204102, 0.001184225082397461, 0.0012301206588745117, 0.0012760162353515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 11.0, 16.0, 18.0, 32.0, 37.0, 62.0, 78.0, 85.0, 178.0, 214.0, 370.0, 532.0, 1060.0, 2221.0, 5253.0, 15065.0, 45207.0, 126667.0, 257472.0, 296093.0, 183979.0, 74232.0, 24596.0, 8262.0, 3289.0, 1475.0, 737.0, 426.0, 253.0, 179.0, 132.0, 85.0, 63.0, 50.0, 23.0, 27.0, 18.0, 18.0, 6.0, 4.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.59375, -23.83056640625, -23.0673828125, -22.30419921875, -21.541015625, -20.77783203125, -20.0146484375, -19.25146484375, -18.48828125, -17.72509765625, -16.9619140625, -16.19873046875, -15.435546875, -14.67236328125, -13.9091796875, -13.14599609375, -12.3828125, -11.61962890625, -10.8564453125, -10.09326171875, -9.330078125, -8.56689453125, -7.8037109375, -7.04052734375, -6.27734375, -5.51416015625, -4.7509765625, -3.98779296875, -3.224609375, -2.46142578125, -1.6982421875, -0.93505859375, -0.171875, 0.59130859375, 1.3544921875, 2.11767578125, 2.880859375, 3.64404296875, 4.4072265625, 5.17041015625, 5.93359375, 6.69677734375, 7.4599609375, 8.22314453125, 8.986328125, 9.74951171875, 10.5126953125, 11.27587890625, 12.0390625, 12.80224609375, 13.5654296875, 14.32861328125, 15.091796875, 15.85498046875, 16.6181640625, 17.38134765625, 18.14453125, 18.90771484375, 19.6708984375, 20.43408203125, 21.197265625, 21.96044921875, 22.7236328125, 23.48681640625, 24.25]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 8.0, 18.0, 29.0, 35.0, 54.0, 59.0, 85.0, 85.0, 103.0, 78.0, 95.0, 73.0, 71.0, 65.0, 38.0, 30.0, 21.0, 17.0, 11.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.0625, -5.778564453125, -5.49462890625, -5.210693359375, -4.9267578125, -4.642822265625, -4.35888671875, -4.074951171875, -3.791015625, -3.507080078125, -3.22314453125, -2.939208984375, -2.6552734375, -2.371337890625, -2.08740234375, -1.803466796875, -1.51953125, -1.235595703125, -0.95166015625, -0.667724609375, -0.3837890625, -0.099853515625, 0.18408203125, 0.468017578125, 0.751953125, 1.035888671875, 1.31982421875, 1.603759765625, 1.8876953125, 2.171630859375, 2.45556640625, 2.739501953125, 3.0234375, 3.307373046875, 3.59130859375, 3.875244140625, 4.1591796875, 4.443115234375, 4.72705078125, 5.010986328125, 5.294921875, 5.578857421875, 5.86279296875, 6.146728515625, 6.4306640625, 6.714599609375, 6.99853515625, 7.282470703125, 7.56640625, 7.850341796875, 8.13427734375, 8.418212890625, 8.7021484375, 8.986083984375, 9.27001953125, 9.553955078125, 9.837890625, 10.121826171875, 10.40576171875, 10.689697265625, 10.9736328125, 11.257568359375, 11.54150390625, 11.825439453125, 12.109375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 5.0, 2.0, 4.0, 9.0, 12.0, 9.0, 27.0, 19.0, 15.0, 25.0, 29.0, 40.0, 28.0, 35.0, 44.0, 44.0, 48.0, 42.0, 48.0, 55.0, 67.0, 27.0, 54.0, 41.0, 39.0, 38.0, 33.0, 22.0, 22.0, 13.0, 22.0, 14.0, 13.0, 13.0, 13.0, 10.0, 7.0, 7.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.35939598083496, -23.42682456970215, -22.494253158569336, -21.561681747436523, -20.629112243652344, -19.69654083251953, -18.76396942138672, -17.831398010253906, -16.898826599121094, -15.966255187988281, -15.033683776855469, -14.101113319396973, -13.16854190826416, -12.235970497131348, -11.303400039672852, -10.370828628540039, -9.438257217407227, -8.505685806274414, -7.57311487197876, -6.6405439376831055, -5.707972526550293, -4.7754011154174805, -3.842830181121826, -2.910259246826172, -1.9776878356933594, -1.045116662979126, -0.11254549026489258, 0.8200256824493408, 1.7525968551635742, 2.6851682662963867, 3.617739200592041, 4.550310134887695, 5.482883453369141, 6.415454864501953, 7.348025798797607, 8.280596733093262, 9.213168144226074, 10.145739555358887, 11.078310012817383, 12.010881423950195, 12.943452835083008, 13.87602424621582, 14.808595657348633, 15.741166114807129, 16.673736572265625, 17.606307983398438, 18.53887939453125, 19.471450805664062, 20.404022216796875, 21.336593627929688, 22.2691650390625, 23.201736450195312, 24.134307861328125, 25.066879272460938, 25.999448776245117, 26.93202018737793, 27.864591598510742, 28.797163009643555, 29.729734420776367, 30.66230583190918, 31.59487533569336, 32.52744674682617, 33.460018157958984, 34.3925895690918, 35.32516098022461]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 6.0, 12.0, 14.0, 12.0, 10.0, 20.0, 20.0, 26.0, 28.0, 35.0, 32.0, 27.0, 32.0, 38.0, 37.0, 32.0, 43.0, 47.0, 42.0, 48.0, 35.0, 40.0, 34.0, 46.0, 32.0, 32.0, 33.0, 33.0, 16.0, 23.0, 24.0, 19.0, 17.0, 10.0, 10.0, 3.0, 7.0, 5.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.959009170532227, -25.94156265258789, -24.924118041992188, -23.90667152404785, -22.889225006103516, -21.87177848815918, -20.854331970214844, -19.83688735961914, -18.819440841674805, -17.80199432373047, -16.784549713134766, -15.76710319519043, -14.749656677246094, -13.732210159301758, -12.714764595031738, -11.697319030761719, -10.679872512817383, -9.662425994873047, -8.644980430603027, -7.62753438949585, -6.610088348388672, -5.592642307281494, -4.575196266174316, -3.5577502250671387, -2.540304183959961, -1.5228581428527832, -0.5054121017456055, 0.5120339393615723, 1.52947998046875, 2.5469260215759277, 3.5643720626831055, 4.581818103790283, 5.599262237548828, 6.616708278656006, 7.634154319763184, 8.651599884033203, 9.669046401977539, 10.686492919921875, 11.703938484191895, 12.721384048461914, 13.73883056640625, 14.756277084350586, 15.773722648620605, 16.791168212890625, 17.80861473083496, 18.826061248779297, 19.843505859375, 20.860952377319336, 21.878398895263672, 22.895845413208008, 23.913291931152344, 24.930736541748047, 25.948183059692383, 26.96562957763672, 27.983074188232422, 29.000520706176758, 30.017967224121094, 31.03541374206543, 32.052860260009766, 33.07030487060547, 34.08775329589844, 35.10519790649414, 36.122642517089844, 37.14009094238281, 38.157535552978516]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 14.0, 30.0, 28.0, 105.0, 160.0, 369.0, 619.0, 1328.0, 2467.0, 4666.0, 8951.0, 17189.0, 32310.0, 60135.0, 107740.0, 184072.0, 294970.0, 432022.0, 555511.0, 614662.0, 579756.0, 470220.0, 331251.0, 212252.0, 126489.0, 71944.0, 39580.0, 21530.0, 11372.0, 5869.0, 3079.0, 1688.0, 883.0, 484.0, 229.0, 123.0, 82.0, 44.0, 29.0, 20.0, 7.0, 5.0, 0.0, 4.0, 2.0], "bins": [-32.46875, -31.628662109375, -30.78857421875, -29.948486328125, -29.1083984375, -28.268310546875, -27.42822265625, -26.588134765625, -25.748046875, -24.907958984375, -24.06787109375, -23.227783203125, -22.3876953125, -21.547607421875, -20.70751953125, -19.867431640625, -19.02734375, -18.187255859375, -17.34716796875, -16.507080078125, -15.6669921875, -14.826904296875, -13.98681640625, -13.146728515625, -12.306640625, -11.466552734375, -10.62646484375, -9.786376953125, -8.9462890625, -8.106201171875, -7.26611328125, -6.426025390625, -5.5859375, -4.745849609375, -3.90576171875, -3.065673828125, -2.2255859375, -1.385498046875, -0.54541015625, 0.294677734375, 1.134765625, 1.974853515625, 2.81494140625, 3.655029296875, 4.4951171875, 5.335205078125, 6.17529296875, 7.015380859375, 7.85546875, 8.695556640625, 9.53564453125, 10.375732421875, 11.2158203125, 12.055908203125, 12.89599609375, 13.736083984375, 14.576171875, 15.416259765625, 16.25634765625, 17.096435546875, 17.9365234375, 18.776611328125, 19.61669921875, 20.456787109375, 21.296875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 6.0, 5.0, 16.0, 7.0, 14.0, 18.0, 19.0, 17.0, 33.0, 35.0, 24.0, 34.0, 26.0, 39.0, 32.0, 38.0, 38.0, 37.0, 52.0, 39.0, 37.0, 41.0, 42.0, 38.0, 35.0, 40.0, 32.0, 31.0, 25.0, 22.0, 21.0, 23.0, 18.0, 17.0, 8.0, 10.0, 2.0, 6.0, 9.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.0625, -22.17919921875, -21.2958984375, -20.41259765625, -19.529296875, -18.64599609375, -17.7626953125, -16.87939453125, -15.99609375, -15.11279296875, -14.2294921875, -13.34619140625, -12.462890625, -11.57958984375, -10.6962890625, -9.81298828125, -8.9296875, -8.04638671875, -7.1630859375, -6.27978515625, -5.396484375, -4.51318359375, -3.6298828125, -2.74658203125, -1.86328125, -0.97998046875, -0.0966796875, 0.78662109375, 1.669921875, 2.55322265625, 3.4365234375, 4.31982421875, 5.203125, 6.08642578125, 6.9697265625, 7.85302734375, 8.736328125, 9.61962890625, 10.5029296875, 11.38623046875, 12.26953125, 13.15283203125, 14.0361328125, 14.91943359375, 15.802734375, 16.68603515625, 17.5693359375, 18.45263671875, 19.3359375, 20.21923828125, 21.1025390625, 21.98583984375, 22.869140625, 23.75244140625, 24.6357421875, 25.51904296875, 26.40234375, 27.28564453125, 28.1689453125, 29.05224609375, 29.935546875, 30.81884765625, 31.7021484375, 32.58544921875, 33.46875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 10.0, 14.0, 31.0, 49.0, 122.0, 179.0, 303.0, 506.0, 859.0, 1540.0, 2595.0, 4234.0, 7011.0, 11582.0, 18833.0, 30727.0, 48609.0, 75441.0, 112061.0, 163805.0, 226164.0, 297436.0, 367285.0, 422619.0, 446963.0, 433793.0, 389725.0, 324624.0, 251985.0, 185977.0, 129857.0, 87626.0, 57256.0, 36717.0, 22802.0, 13851.0, 8447.0, 5175.0, 3044.0, 1886.0, 1057.0, 608.0, 364.0, 213.0, 122.0, 75.0, 53.0, 24.0, 19.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.0625, -21.3662109375, -20.669921875, -19.9736328125, -19.27734375, -18.5810546875, -17.884765625, -17.1884765625, -16.4921875, -15.7958984375, -15.099609375, -14.4033203125, -13.70703125, -13.0107421875, -12.314453125, -11.6181640625, -10.921875, -10.2255859375, -9.529296875, -8.8330078125, -8.13671875, -7.4404296875, -6.744140625, -6.0478515625, -5.3515625, -4.6552734375, -3.958984375, -3.2626953125, -2.56640625, -1.8701171875, -1.173828125, -0.4775390625, 0.21875, 0.9150390625, 1.611328125, 2.3076171875, 3.00390625, 3.7001953125, 4.396484375, 5.0927734375, 5.7890625, 6.4853515625, 7.181640625, 7.8779296875, 8.57421875, 9.2705078125, 9.966796875, 10.6630859375, 11.359375, 12.0556640625, 12.751953125, 13.4482421875, 14.14453125, 14.8408203125, 15.537109375, 16.2333984375, 16.9296875, 17.6259765625, 18.322265625, 19.0185546875, 19.71484375, 20.4111328125, 21.107421875, 21.8037109375, 22.5]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 1.0, 2.0, 4.0, 9.0, 7.0, 6.0, 27.0, 20.0, 32.0, 31.0, 42.0, 36.0, 80.0, 68.0, 84.0, 105.0, 119.0, 148.0, 151.0, 176.0, 194.0, 195.0, 207.0, 223.0, 200.0, 213.0, 204.0, 202.0, 170.0, 161.0, 140.0, 131.0, 112.0, 101.0, 110.0, 84.0, 51.0, 56.0, 29.0, 34.0, 25.0, 22.0, 12.0, 20.0, 13.0, 8.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6171875, -12.2391357421875, -11.861083984375, -11.4830322265625, -11.10498046875, -10.7269287109375, -10.348876953125, -9.9708251953125, -9.5927734375, -9.2147216796875, -8.836669921875, -8.4586181640625, -8.08056640625, -7.7025146484375, -7.324462890625, -6.9464111328125, -6.568359375, -6.1903076171875, -5.812255859375, -5.4342041015625, -5.05615234375, -4.6781005859375, -4.300048828125, -3.9219970703125, -3.5439453125, -3.1658935546875, -2.787841796875, -2.4097900390625, -2.03173828125, -1.6536865234375, -1.275634765625, -0.8975830078125, -0.51953125, -0.1414794921875, 0.236572265625, 0.6146240234375, 0.99267578125, 1.3707275390625, 1.748779296875, 2.1268310546875, 2.5048828125, 2.8829345703125, 3.260986328125, 3.6390380859375, 4.01708984375, 4.3951416015625, 4.773193359375, 5.1512451171875, 5.529296875, 5.9073486328125, 6.285400390625, 6.6634521484375, 7.04150390625, 7.4195556640625, 7.797607421875, 8.1756591796875, 8.5537109375, 8.9317626953125, 9.309814453125, 9.6878662109375, 10.06591796875, 10.4439697265625, 10.822021484375, 11.2000732421875, 11.578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 8.0, 6.0, 6.0, 12.0, 9.0, 22.0, 21.0, 20.0, 21.0, 26.0, 34.0, 34.0, 37.0, 36.0, 32.0, 38.0, 44.0, 48.0, 43.0, 42.0, 33.0, 46.0, 46.0, 28.0, 30.0, 29.0, 30.0, 12.0, 22.0, 22.0, 27.0, 12.0, 19.0, 11.0, 14.0, 8.0, 10.0, 14.0, 5.0, 7.0, 4.0, 4.0, 9.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.50648307800293, -23.714515686035156, -22.92254638671875, -22.130578994750977, -21.338611602783203, -20.54664421081543, -19.754674911499023, -18.96270751953125, -18.170740127563477, -17.378772735595703, -16.586803436279297, -15.794836044311523, -15.00286865234375, -14.21090030670166, -13.41893196105957, -12.626964569091797, -11.834996223449707, -11.043027877807617, -10.251060485839844, -9.459092140197754, -8.66712474822998, -7.875156402587891, -7.083188533782959, -6.291220664978027, -5.499252796173096, -4.707284927368164, -3.9153170585632324, -3.1233489513397217, -2.33138108253479, -1.5394132137298584, -0.7474451065063477, 0.044522762298583984, 0.8364906311035156, 1.6284584999084473, 2.420426368713379, 3.2123944759368896, 4.004362106323242, 4.796330451965332, 5.588298320770264, 6.380266189575195, 7.172234058380127, 7.964201927185059, 8.756170272827148, 9.548137664794922, 10.340106010437012, 11.132073402404785, 11.924041748046875, 12.716009140014648, 13.507977485656738, 14.299945831298828, 15.091913223266602, 15.883881568908691, 16.67584991455078, 17.467817306518555, 18.259784698486328, 19.051753997802734, 19.843721389770508, 20.63568878173828, 21.427658081054688, 22.21962547302246, 23.011592864990234, 23.803560256958008, 24.595529556274414, 25.387496948242188, 26.17946434020996]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 7.0, 7.0, 7.0, 14.0, 16.0, 22.0, 10.0, 16.0, 20.0, 14.0, 27.0, 17.0, 34.0, 39.0, 34.0, 30.0, 39.0, 31.0, 28.0, 43.0, 50.0, 36.0, 38.0, 33.0, 38.0, 49.0, 29.0, 45.0, 29.0, 24.0, 24.0, 32.0, 15.0, 13.0, 15.0, 13.0, 16.0, 10.0, 7.0, 8.0, 4.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-31.261606216430664, -30.33831024169922, -29.415016174316406, -28.49172019958496, -27.56842613220215, -26.645130157470703, -25.72183609008789, -24.798540115356445, -23.875246047973633, -22.951950073242188, -22.028656005859375, -21.10536003112793, -20.182065963745117, -19.258769989013672, -18.33547592163086, -17.412179946899414, -16.48888397216797, -15.56558895111084, -14.642293930053711, -13.718998908996582, -12.795703887939453, -11.872407913208008, -10.949113845825195, -10.02581787109375, -9.102523803710938, -8.179228782653809, -7.25593376159668, -6.332638740539551, -5.409343719482422, -4.486048221588135, -3.562753200531006, -2.639458179473877, -1.7161636352539062, -0.7928685545921326, 0.1304265260696411, 1.0537216663360596, 1.9770166873931885, 2.9003119468688965, 3.8236069679260254, 4.746901988983154, 5.670197010040283, 6.593492031097412, 7.516787052154541, 8.440082550048828, 9.363377571105957, 10.286672592163086, 11.209967613220215, 12.133262634277344, 13.056557655334473, 13.979852676391602, 14.90314769744873, 15.82644271850586, 16.749738693237305, 17.673032760620117, 18.596328735351562, 19.519622802734375, 20.44291877746582, 21.366214752197266, 22.289508819580078, 23.212804794311523, 24.136098861694336, 25.05939483642578, 25.982688903808594, 26.90598487854004, 27.82927894592285]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 0.0, 5.0, 1.0, 6.0, 9.0, 21.0, 27.0, 47.0, 80.0, 129.0, 185.0, 350.0, 545.0, 916.0, 1428.0, 2236.0, 3707.0, 5798.0, 9111.0, 13752.0, 20406.0, 29354.0, 41098.0, 54730.0, 70183.0, 85122.0, 95155.0, 102479.0, 101093.0, 93717.0, 81521.0, 66587.0, 51478.0, 38009.0, 26742.0, 18498.0, 12173.0, 7993.0, 5204.0, 3289.0, 2046.0, 1325.0, 794.0, 454.0, 293.0, 166.0, 116.0, 77.0, 47.0, 29.0, 14.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.85302734375, -7.5810546875, -7.30908203125, -7.037109375, -6.76513671875, -6.4931640625, -6.22119140625, -5.94921875, -5.67724609375, -5.4052734375, -5.13330078125, -4.861328125, -4.58935546875, -4.3173828125, -4.04541015625, -3.7734375, -3.50146484375, -3.2294921875, -2.95751953125, -2.685546875, -2.41357421875, -2.1416015625, -1.86962890625, -1.59765625, -1.32568359375, -1.0537109375, -0.78173828125, -0.509765625, -0.23779296875, 0.0341796875, 0.30615234375, 0.578125, 0.85009765625, 1.1220703125, 1.39404296875, 1.666015625, 1.93798828125, 2.2099609375, 2.48193359375, 2.75390625, 3.02587890625, 3.2978515625, 3.56982421875, 3.841796875, 4.11376953125, 4.3857421875, 4.65771484375, 4.9296875, 5.20166015625, 5.4736328125, 5.74560546875, 6.017578125, 6.28955078125, 6.5615234375, 6.83349609375, 7.10546875, 7.37744140625, 7.6494140625, 7.92138671875, 8.193359375, 8.46533203125, 8.7373046875, 9.00927734375, 9.28125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 7.0, 7.0, 7.0, 14.0, 18.0, 20.0, 12.0, 13.0, 21.0, 14.0, 29.0, 16.0, 35.0, 36.0, 34.0, 31.0, 36.0, 34.0, 27.0, 41.0, 53.0, 40.0, 33.0, 35.0, 39.0, 48.0, 27.0, 45.0, 32.0, 23.0, 28.0, 28.0, 16.0, 13.0, 14.0, 12.0, 16.0, 11.0, 7.0, 8.0, 3.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-31.21875, -30.29150390625, -29.3642578125, -28.43701171875, -27.509765625, -26.58251953125, -25.6552734375, -24.72802734375, -23.80078125, -22.87353515625, -21.9462890625, -21.01904296875, -20.091796875, -19.16455078125, -18.2373046875, -17.31005859375, -16.3828125, -15.45556640625, -14.5283203125, -13.60107421875, -12.673828125, -11.74658203125, -10.8193359375, -9.89208984375, -8.96484375, -8.03759765625, -7.1103515625, -6.18310546875, -5.255859375, -4.32861328125, -3.4013671875, -2.47412109375, -1.546875, -0.61962890625, 0.3076171875, 1.23486328125, 2.162109375, 3.08935546875, 4.0166015625, 4.94384765625, 5.87109375, 6.79833984375, 7.7255859375, 8.65283203125, 9.580078125, 10.50732421875, 11.4345703125, 12.36181640625, 13.2890625, 14.21630859375, 15.1435546875, 16.07080078125, 16.998046875, 17.92529296875, 18.8525390625, 19.77978515625, 20.70703125, 21.63427734375, 22.5615234375, 23.48876953125, 24.416015625, 25.34326171875, 26.2705078125, 27.19775390625, 28.125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 10.0, 15.0, 21.0, 33.0, 62.0, 89.0, 142.0, 189.0, 311.0, 523.0, 873.0, 1320.0, 2159.0, 3508.0, 5757.0, 8922.0, 14705.0, 25572.0, 75338.0, 814052.0, 40477.0, 21018.0, 12672.0, 7763.0, 4864.0, 3079.0, 1958.0, 1213.0, 747.0, 471.0, 261.0, 162.0, 105.0, 63.0, 29.0, 27.0, 15.0, 18.0, 4.0, 5.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.703125, -29.7822265625, -28.861328125, -27.9404296875, -27.01953125, -26.0986328125, -25.177734375, -24.2568359375, -23.3359375, -22.4150390625, -21.494140625, -20.5732421875, -19.65234375, -18.7314453125, -17.810546875, -16.8896484375, -15.96875, -15.0478515625, -14.126953125, -13.2060546875, -12.28515625, -11.3642578125, -10.443359375, -9.5224609375, -8.6015625, -7.6806640625, -6.759765625, -5.8388671875, -4.91796875, -3.9970703125, -3.076171875, -2.1552734375, -1.234375, -0.3134765625, 0.607421875, 1.5283203125, 2.44921875, 3.3701171875, 4.291015625, 5.2119140625, 6.1328125, 7.0537109375, 7.974609375, 8.8955078125, 9.81640625, 10.7373046875, 11.658203125, 12.5791015625, 13.5, 14.4208984375, 15.341796875, 16.2626953125, 17.18359375, 18.1044921875, 19.025390625, 19.9462890625, 20.8671875, 21.7880859375, 22.708984375, 23.6298828125, 24.55078125, 25.4716796875, 26.392578125, 27.3134765625, 28.234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 5.0, 9.0, 10.0, 14.0, 15.0, 18.0, 18.0, 21.0, 27.0, 23.0, 27.0, 35.0, 41.0, 41.0, 37.0, 42.0, 40.0, 46.0, 45.0, 50.0, 43.0, 45.0, 38.0, 39.0, 38.0, 38.0, 27.0, 28.0, 28.0, 16.0, 24.0, 13.0, 14.0, 13.0, 5.0, 6.0, 3.0, 5.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.765625, -24.0263671875, -23.287109375, -22.5478515625, -21.80859375, -21.0693359375, -20.330078125, -19.5908203125, -18.8515625, -18.1123046875, -17.373046875, -16.6337890625, -15.89453125, -15.1552734375, -14.416015625, -13.6767578125, -12.9375, -12.1982421875, -11.458984375, -10.7197265625, -9.98046875, -9.2412109375, -8.501953125, -7.7626953125, -7.0234375, -6.2841796875, -5.544921875, -4.8056640625, -4.06640625, -3.3271484375, -2.587890625, -1.8486328125, -1.109375, -0.3701171875, 0.369140625, 1.1083984375, 1.84765625, 2.5869140625, 3.326171875, 4.0654296875, 4.8046875, 5.5439453125, 6.283203125, 7.0224609375, 7.76171875, 8.5009765625, 9.240234375, 9.9794921875, 10.71875, 11.4580078125, 12.197265625, 12.9365234375, 13.67578125, 14.4150390625, 15.154296875, 15.8935546875, 16.6328125, 17.3720703125, 18.111328125, 18.8505859375, 19.58984375, 20.3291015625, 21.068359375, 21.8076171875, 22.546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 8.0, 15.0, 28.0, 32.0, 74.0, 59.0, 110.0, 156.0, 259.0, 391.0, 678.0, 1100.0, 1723.0, 2762.0, 4738.0, 7915.0, 13512.0, 24379.0, 75956.0, 804961.0, 56194.0, 22403.0, 12406.0, 7333.0, 4377.0, 2617.0, 1618.0, 996.0, 616.0, 403.0, 239.0, 159.0, 95.0, 85.0, 47.0, 25.0, 23.0, 14.0, 14.0, 11.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.232421875, -2.1656494140625, -2.098876953125, -2.0321044921875, -1.96533203125, -1.8985595703125, -1.831787109375, -1.7650146484375, -1.6982421875, -1.6314697265625, -1.564697265625, -1.4979248046875, -1.43115234375, -1.3643798828125, -1.297607421875, -1.2308349609375, -1.1640625, -1.0972900390625, -1.030517578125, -0.9637451171875, -0.89697265625, -0.8302001953125, -0.763427734375, -0.6966552734375, -0.6298828125, -0.5631103515625, -0.496337890625, -0.4295654296875, -0.36279296875, -0.2960205078125, -0.229248046875, -0.1624755859375, -0.095703125, -0.0289306640625, 0.037841796875, 0.1046142578125, 0.17138671875, 0.2381591796875, 0.304931640625, 0.3717041015625, 0.4384765625, 0.5052490234375, 0.572021484375, 0.6387939453125, 0.70556640625, 0.7723388671875, 0.839111328125, 0.9058837890625, 0.97265625, 1.0394287109375, 1.106201171875, 1.1729736328125, 1.23974609375, 1.3065185546875, 1.373291015625, 1.4400634765625, 1.5068359375, 1.5736083984375, 1.640380859375, 1.7071533203125, 1.77392578125, 1.8406982421875, 1.907470703125, 1.9742431640625, 2.041015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 6.0, 5.0, 7.0, 7.0, 14.0, 16.0, 21.0, 16.0, 22.0, 27.0, 27.0, 53.0, 49.0, 63.0, 59.0, 54.0, 53.0, 67.0, 43.0, 52.0, 56.0, 44.0, 35.0, 43.0, 29.0, 19.0, 26.0, 19.0, 16.0, 13.0, 8.0, 6.0, 2.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00029659271240234375, -0.00028759241104125977, -0.0002785921096801758, -0.0002695918083190918, -0.0002605915069580078, -0.00025159120559692383, -0.00024259090423583984, -0.00023359060287475586, -0.00022459030151367188, -0.0002155900001525879, -0.0002065896987915039, -0.00019758939743041992, -0.00018858909606933594, -0.00017958879470825195, -0.00017058849334716797, -0.00016158819198608398, -0.000152587890625, -0.00014358758926391602, -0.00013458728790283203, -0.00012558698654174805, -0.00011658668518066406, -0.00010758638381958008, -9.85860824584961e-05, -8.958578109741211e-05, -8.058547973632812e-05, -7.158517837524414e-05, -6.258487701416016e-05, -5.358457565307617e-05, -4.458427429199219e-05, -3.55839729309082e-05, -2.658367156982422e-05, -1.7583370208740234e-05, -8.58306884765625e-06, 4.172325134277344e-07, 9.417533874511719e-06, 1.8417835235595703e-05, 2.7418136596679688e-05, 3.641843795776367e-05, 4.5418739318847656e-05, 5.441904067993164e-05, 6.341934204101562e-05, 7.241964340209961e-05, 8.14199447631836e-05, 9.042024612426758e-05, 9.942054748535156e-05, 0.00010842084884643555, 0.00011742115020751953, 0.00012642145156860352, 0.0001354217529296875, 0.00014442205429077148, 0.00015342235565185547, 0.00016242265701293945, 0.00017142295837402344, 0.00018042325973510742, 0.0001894235610961914, 0.0001984238624572754, 0.00020742416381835938, 0.00021642446517944336, 0.00022542476654052734, 0.00023442506790161133, 0.0002434253692626953, 0.0002524256706237793, 0.0002614259719848633, 0.00027042627334594727, 0.00027942657470703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 2.0, 15.0, 12.0, 19.0, 37.0, 68.0, 81.0, 127.0, 239.0, 326.0, 541.0, 842.0, 1297.0, 2161.0, 3351.0, 5727.0, 9316.0, 15786.0, 25619.0, 41143.0, 62719.0, 89589.0, 116459.0, 135683.0, 137695.0, 121176.0, 94915.0, 67181.0, 44691.0, 27947.0, 16998.0, 10488.0, 6352.0, 3790.0, 2258.0, 1412.0, 885.0, 589.0, 387.0, 228.0, 143.0, 86.0, 63.0, 47.0, 31.0, 12.0, 13.0, 9.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.1240234375, -1.090057373046875, -1.05609130859375, -1.022125244140625, -0.9881591796875, -0.954193115234375, -0.92022705078125, -0.886260986328125, -0.852294921875, -0.818328857421875, -0.78436279296875, -0.750396728515625, -0.7164306640625, -0.682464599609375, -0.64849853515625, -0.614532470703125, -0.58056640625, -0.546600341796875, -0.51263427734375, -0.478668212890625, -0.4447021484375, -0.410736083984375, -0.37677001953125, -0.342803955078125, -0.308837890625, -0.274871826171875, -0.24090576171875, -0.206939697265625, -0.1729736328125, -0.139007568359375, -0.10504150390625, -0.071075439453125, -0.037109375, -0.003143310546875, 0.03082275390625, 0.064788818359375, 0.0987548828125, 0.132720947265625, 0.16668701171875, 0.200653076171875, 0.234619140625, 0.268585205078125, 0.30255126953125, 0.336517333984375, 0.3704833984375, 0.404449462890625, 0.43841552734375, 0.472381591796875, 0.50634765625, 0.540313720703125, 0.57427978515625, 0.608245849609375, 0.6422119140625, 0.676177978515625, 0.71014404296875, 0.744110107421875, 0.778076171875, 0.812042236328125, 0.84600830078125, 0.879974365234375, 0.9139404296875, 0.947906494140625, 0.98187255859375, 1.015838623046875, 1.0498046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 7.0, 7.0, 13.0, 11.0, 8.0, 22.0, 16.0, 18.0, 30.0, 32.0, 28.0, 45.0, 30.0, 51.0, 40.0, 47.0, 41.0, 34.0, 48.0, 58.0, 49.0, 38.0, 45.0, 32.0, 33.0, 26.0, 26.0, 29.0, 20.0, 19.0, 12.0, 14.0, 10.0, 16.0, 9.0, 4.0, 12.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.40478515625, -0.3917884826660156, -0.37879180908203125, -0.3657951354980469, -0.3527984619140625, -0.3398017883300781, -0.32680511474609375, -0.3138084411621094, -0.300811767578125, -0.2878150939941406, -0.27481842041015625, -0.2618217468261719, -0.2488250732421875, -0.23582839965820312, -0.22283172607421875, -0.20983505249023438, -0.19683837890625, -0.18384170532226562, -0.17084503173828125, -0.15784835815429688, -0.1448516845703125, -0.13185501098632812, -0.11885833740234375, -0.10586166381835938, -0.092864990234375, -0.07986831665039062, -0.06687164306640625, -0.053874969482421875, -0.0408782958984375, -0.027881622314453125, -0.01488494873046875, -0.001888275146484375, 0.0111083984375, 0.024105072021484375, 0.03710174560546875, 0.050098419189453125, 0.0630950927734375, 0.07609176635742188, 0.08908843994140625, 0.10208511352539062, 0.115081787109375, 0.12807846069335938, 0.14107513427734375, 0.15407180786132812, 0.1670684814453125, 0.18006515502929688, 0.19306182861328125, 0.20605850219726562, 0.21905517578125, 0.23205184936523438, 0.24504852294921875, 0.2580451965332031, 0.2710418701171875, 0.2840385437011719, 0.29703521728515625, 0.3100318908691406, 0.323028564453125, 0.3360252380371094, 0.34902191162109375, 0.3620185852050781, 0.3750152587890625, 0.3880119323730469, 0.40100860595703125, 0.4140052795410156, 0.427001953125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 6.0, 7.0, 5.0, 15.0, 14.0, 15.0, 14.0, 27.0, 18.0, 25.0, 34.0, 33.0, 36.0, 37.0, 38.0, 30.0, 40.0, 53.0, 44.0, 41.0, 34.0, 42.0, 41.0, 36.0, 26.0, 28.0, 28.0, 26.0, 21.0, 18.0, 20.0, 20.0, 18.0, 16.0, 10.0, 12.0, 12.0, 10.0, 7.0, 8.0, 5.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.580408096313477, -23.788970947265625, -22.997535705566406, -22.206098556518555, -21.414661407470703, -20.623226165771484, -19.831789016723633, -19.04035186767578, -18.248916625976562, -17.45747947692871, -16.666044235229492, -15.87460708618164, -15.083169937133789, -14.291733741760254, -13.500297546386719, -12.708860397338867, -11.917423248291016, -11.12598705291748, -10.334549903869629, -9.543113708496094, -8.751676559448242, -7.960240364074707, -7.168804168701172, -6.3773674964904785, -5.585930824279785, -4.794494152069092, -4.003057479858398, -3.2116212844848633, -2.42018461227417, -1.6287479400634766, -0.8373117446899414, -0.04587507247924805, 0.7455615997314453, 1.5369981527328491, 2.328434705734253, 3.119871139526367, 3.9113078117370605, 4.702744483947754, 5.494180679321289, 6.285617351531982, 7.077054023742676, 7.868490695953369, 8.659927368164062, 9.451363563537598, 10.242799758911133, 11.034236907958984, 11.82567310333252, 12.617109298706055, 13.408546447753906, 14.199982643127441, 14.991419792175293, 15.782855987548828, 16.57429313659668, 17.36573028564453, 18.15716552734375, 18.9486026763916, 19.740039825439453, 20.531476974487305, 21.322912216186523, 22.114349365234375, 22.905786514282227, 23.697223663330078, 24.488658905029297, 25.28009605407715, 26.071531295776367]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 6.0, 6.0, 7.0, 6.0, 11.0, 18.0, 14.0, 19.0, 10.0, 16.0, 22.0, 21.0, 24.0, 20.0, 41.0, 33.0, 38.0, 32.0, 34.0, 28.0, 31.0, 50.0, 45.0, 42.0, 35.0, 34.0, 52.0, 31.0, 39.0, 35.0, 26.0, 25.0, 26.0, 25.0, 11.0, 18.0, 12.0, 18.0, 5.0, 10.0, 8.0, 6.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-30.796035766601562, -29.865793228149414, -28.935548782348633, -28.005306243896484, -27.075063705444336, -26.144821166992188, -25.214576721191406, -24.284334182739258, -23.35409164428711, -22.42384910583496, -21.49360466003418, -20.56336212158203, -19.633119583129883, -18.702877044677734, -17.772632598876953, -16.842390060424805, -15.91214656829834, -14.981903076171875, -14.051660537719727, -13.121417045593262, -12.191174507141113, -11.260931015014648, -10.3306884765625, -9.400444984436035, -8.47020149230957, -7.539958477020264, -6.609715461730957, -5.679471969604492, -4.749229431152344, -3.818985939025879, -2.8887429237365723, -1.9584999084472656, -1.0282573699951172, -0.09801429510116577, 0.8322287797927856, 1.7624719142913818, 2.6927149295806885, 3.622958183288574, 4.553201198577881, 5.4834442138671875, 6.413687229156494, 7.343930244445801, 8.274173736572266, 9.204416275024414, 10.134659767150879, 11.064903259277344, 11.995145797729492, 12.92538833618164, 13.855631828308105, 14.78587532043457, 15.716117858886719, 16.646360397338867, 17.57660484313965, 18.506847381591797, 19.437089920043945, 20.367332458496094, 21.297576904296875, 22.227819442749023, 23.158063888549805, 24.088306427001953, 25.0185489654541, 25.94879150390625, 26.87903594970703, 27.80927848815918, 28.739521026611328]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 8.0, 7.0, 13.0, 20.0, 22.0, 40.0, 63.0, 88.0, 144.0, 234.0, 443.0, 634.0, 1064.0, 1893.0, 3125.0, 5314.0, 8912.0, 14609.0, 23395.0, 35884.0, 52248.0, 71800.0, 92497.0, 108848.0, 118444.0, 116577.0, 105181.0, 87227.0, 66631.0, 48110.0, 32153.0, 20746.0, 12908.0, 7816.0, 4735.0, 2798.0, 1572.0, 871.0, 553.0, 311.0, 201.0, 159.0, 86.0, 55.0, 40.0, 33.0, 22.0, 12.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.734375, -22.965576171875, -22.19677734375, -21.427978515625, -20.6591796875, -19.890380859375, -19.12158203125, -18.352783203125, -17.583984375, -16.815185546875, -16.04638671875, -15.277587890625, -14.5087890625, -13.739990234375, -12.97119140625, -12.202392578125, -11.43359375, -10.664794921875, -9.89599609375, -9.127197265625, -8.3583984375, -7.589599609375, -6.82080078125, -6.052001953125, -5.283203125, -4.514404296875, -3.74560546875, -2.976806640625, -2.2080078125, -1.439208984375, -0.67041015625, 0.098388671875, 0.8671875, 1.635986328125, 2.40478515625, 3.173583984375, 3.9423828125, 4.711181640625, 5.47998046875, 6.248779296875, 7.017578125, 7.786376953125, 8.55517578125, 9.323974609375, 10.0927734375, 10.861572265625, 11.63037109375, 12.399169921875, 13.16796875, 13.936767578125, 14.70556640625, 15.474365234375, 16.2431640625, 17.011962890625, 17.78076171875, 18.549560546875, 19.318359375, 20.087158203125, 20.85595703125, 21.624755859375, 22.3935546875, 23.162353515625, 23.93115234375, 24.699951171875, 25.46875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 7.0, 4.0, 11.0, 3.0, 17.0, 11.0, 17.0, 21.0, 9.0, 19.0, 18.0, 26.0, 23.0, 22.0, 42.0, 30.0, 43.0, 29.0, 33.0, 26.0, 38.0, 51.0, 43.0, 37.0, 37.0, 34.0, 52.0, 30.0, 40.0, 32.0, 22.0, 27.0, 26.0, 22.0, 14.0, 15.0, 15.0, 15.0, 7.0, 8.0, 8.0, 4.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-29.25, -28.359130859375, -27.46826171875, -26.577392578125, -25.6865234375, -24.795654296875, -23.90478515625, -23.013916015625, -22.123046875, -21.232177734375, -20.34130859375, -19.450439453125, -18.5595703125, -17.668701171875, -16.77783203125, -15.886962890625, -14.99609375, -14.105224609375, -13.21435546875, -12.323486328125, -11.4326171875, -10.541748046875, -9.65087890625, -8.760009765625, -7.869140625, -6.978271484375, -6.08740234375, -5.196533203125, -4.3056640625, -3.414794921875, -2.52392578125, -1.633056640625, -0.7421875, 0.148681640625, 1.03955078125, 1.930419921875, 2.8212890625, 3.712158203125, 4.60302734375, 5.493896484375, 6.384765625, 7.275634765625, 8.16650390625, 9.057373046875, 9.9482421875, 10.839111328125, 11.72998046875, 12.620849609375, 13.51171875, 14.402587890625, 15.29345703125, 16.184326171875, 17.0751953125, 17.966064453125, 18.85693359375, 19.747802734375, 20.638671875, 21.529541015625, 22.42041015625, 23.311279296875, 24.2021484375, 25.093017578125, 25.98388671875, 26.874755859375, 27.765625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 4.0, 6.0, 13.0, 17.0, 24.0, 37.0, 65.0, 118.0, 163.0, 235.0, 401.0, 643.0, 1021.0, 1649.0, 2351.0, 3621.0, 5174.0, 7801.0, 11203.0, 16176.0, 22714.0, 31339.0, 40942.0, 53423.0, 65640.0, 77534.0, 87013.0, 92383.0, 91937.0, 87146.0, 77870.0, 66616.0, 53888.0, 42030.0, 31734.0, 23291.0, 16577.0, 11878.0, 8043.0, 5466.0, 3577.0, 2395.0, 1556.0, 999.0, 665.0, 430.0, 274.0, 202.0, 101.0, 65.0, 44.0, 25.0, 18.0, 13.0, 11.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.0625, -18.4482421875, -17.833984375, -17.2197265625, -16.60546875, -15.9912109375, -15.376953125, -14.7626953125, -14.1484375, -13.5341796875, -12.919921875, -12.3056640625, -11.69140625, -11.0771484375, -10.462890625, -9.8486328125, -9.234375, -8.6201171875, -8.005859375, -7.3916015625, -6.77734375, -6.1630859375, -5.548828125, -4.9345703125, -4.3203125, -3.7060546875, -3.091796875, -2.4775390625, -1.86328125, -1.2490234375, -0.634765625, -0.0205078125, 0.59375, 1.2080078125, 1.822265625, 2.4365234375, 3.05078125, 3.6650390625, 4.279296875, 4.8935546875, 5.5078125, 6.1220703125, 6.736328125, 7.3505859375, 7.96484375, 8.5791015625, 9.193359375, 9.8076171875, 10.421875, 11.0361328125, 11.650390625, 12.2646484375, 12.87890625, 13.4931640625, 14.107421875, 14.7216796875, 15.3359375, 15.9501953125, 16.564453125, 17.1787109375, 17.79296875, 18.4072265625, 19.021484375, 19.6357421875, 20.25]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 3.0, 5.0, 8.0, 8.0, 13.0, 11.0, 15.0, 22.0, 22.0, 14.0, 27.0, 27.0, 27.0, 37.0, 32.0, 41.0, 40.0, 37.0, 49.0, 54.0, 41.0, 51.0, 40.0, 43.0, 33.0, 36.0, 30.0, 25.0, 26.0, 29.0, 30.0, 16.0, 25.0, 24.0, 11.0, 11.0, 10.0, 7.0, 5.0, 4.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-21.4375, -20.835205078125, -20.23291015625, -19.630615234375, -19.0283203125, -18.426025390625, -17.82373046875, -17.221435546875, -16.619140625, -16.016845703125, -15.41455078125, -14.812255859375, -14.2099609375, -13.607666015625, -13.00537109375, -12.403076171875, -11.80078125, -11.198486328125, -10.59619140625, -9.993896484375, -9.3916015625, -8.789306640625, -8.18701171875, -7.584716796875, -6.982421875, -6.380126953125, -5.77783203125, -5.175537109375, -4.5732421875, -3.970947265625, -3.36865234375, -2.766357421875, -2.1640625, -1.561767578125, -0.95947265625, -0.357177734375, 0.2451171875, 0.847412109375, 1.44970703125, 2.052001953125, 2.654296875, 3.256591796875, 3.85888671875, 4.461181640625, 5.0634765625, 5.665771484375, 6.26806640625, 6.870361328125, 7.47265625, 8.074951171875, 8.67724609375, 9.279541015625, 9.8818359375, 10.484130859375, 11.08642578125, 11.688720703125, 12.291015625, 12.893310546875, 13.49560546875, 14.097900390625, 14.7001953125, 15.302490234375, 15.90478515625, 16.507080078125, 17.109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 6.0, 10.0, 13.0, 12.0, 26.0, 27.0, 62.0, 64.0, 105.0, 164.0, 238.0, 340.0, 524.0, 836.0, 1196.0, 1815.0, 2724.0, 4223.0, 6355.0, 9736.0, 14742.0, 22239.0, 32447.0, 46475.0, 63540.0, 82739.0, 99778.0, 110978.0, 112938.0, 104862.0, 90385.0, 71569.0, 52575.0, 37600.0, 25996.0, 17302.0, 11508.0, 7660.0, 5028.0, 3276.0, 2202.0, 1429.0, 937.0, 629.0, 401.0, 255.0, 187.0, 130.0, 77.0, 73.0, 45.0, 29.0, 13.0, 13.0, 10.0, 9.0, 7.0, 4.0, 4.0], "bins": [-8.84375, -8.577392578125, -8.31103515625, -8.044677734375, -7.7783203125, -7.511962890625, -7.24560546875, -6.979248046875, -6.712890625, -6.446533203125, -6.18017578125, -5.913818359375, -5.6474609375, -5.381103515625, -5.11474609375, -4.848388671875, -4.58203125, -4.315673828125, -4.04931640625, -3.782958984375, -3.5166015625, -3.250244140625, -2.98388671875, -2.717529296875, -2.451171875, -2.184814453125, -1.91845703125, -1.652099609375, -1.3857421875, -1.119384765625, -0.85302734375, -0.586669921875, -0.3203125, -0.053955078125, 0.21240234375, 0.478759765625, 0.7451171875, 1.011474609375, 1.27783203125, 1.544189453125, 1.810546875, 2.076904296875, 2.34326171875, 2.609619140625, 2.8759765625, 3.142333984375, 3.40869140625, 3.675048828125, 3.94140625, 4.207763671875, 4.47412109375, 4.740478515625, 5.0068359375, 5.273193359375, 5.53955078125, 5.805908203125, 6.072265625, 6.338623046875, 6.60498046875, 6.871337890625, 7.1376953125, 7.404052734375, 7.67041015625, 7.936767578125, 8.203125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 9.0, 7.0, 3.0, 8.0, 17.0, 10.0, 22.0, 25.0, 18.0, 29.0, 36.0, 40.0, 43.0, 43.0, 49.0, 54.0, 51.0, 40.0, 52.0, 38.0, 47.0, 41.0, 47.0, 38.0, 35.0, 29.0, 21.0, 30.0, 19.0, 11.0, 25.0, 11.0, 6.0, 11.0, 4.0, 4.0, 3.0, 8.0, 1.0, 6.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00122833251953125, -0.0011920034885406494, -0.0011556744575500488, -0.0011193454265594482, -0.0010830163955688477, -0.001046687364578247, -0.0010103583335876465, -0.0009740293025970459, -0.0009377002716064453, -0.0009013712406158447, -0.0008650422096252441, -0.0008287131786346436, -0.000792384147644043, -0.0007560551166534424, -0.0007197260856628418, -0.0006833970546722412, -0.0006470680236816406, -0.00061073899269104, -0.0005744099617004395, -0.0005380809307098389, -0.0005017518997192383, -0.0004654228687286377, -0.0004290938377380371, -0.0003927648067474365, -0.00035643577575683594, -0.00032010674476623535, -0.00028377771377563477, -0.0002474486827850342, -0.0002111196517944336, -0.000174790620803833, -0.00013846158981323242, -0.00010213255882263184, -6.580352783203125e-05, -2.9474496841430664e-05, 6.854534149169922e-06, 4.318356513977051e-05, 7.95125961303711e-05, 0.00011584162712097168, 0.00015217065811157227, 0.00018849968910217285, 0.00022482872009277344, 0.000261157751083374, 0.0002974867820739746, 0.0003338158130645752, 0.0003701448440551758, 0.00040647387504577637, 0.00044280290603637695, 0.00047913193702697754, 0.0005154609680175781, 0.0005517899990081787, 0.0005881190299987793, 0.0006244480609893799, 0.0006607770919799805, 0.0006971061229705811, 0.0007334351539611816, 0.0007697641849517822, 0.0008060932159423828, 0.0008424222469329834, 0.000878751277923584, 0.0009150803089141846, 0.0009514093399047852, 0.0009877383708953857, 0.0010240674018859863, 0.001060396432876587, 0.0010967254638671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 6.0, 10.0, 20.0, 35.0, 57.0, 97.0, 134.0, 245.0, 399.0, 623.0, 1070.0, 1654.0, 2775.0, 4563.0, 7291.0, 11522.0, 18153.0, 27809.0, 40453.0, 56843.0, 76262.0, 94356.0, 109052.0, 115398.0, 111028.0, 98355.0, 80353.0, 61291.0, 43898.0, 30367.0, 20155.0, 12867.0, 8276.0, 5130.0, 3157.0, 1897.0, 1168.0, 700.0, 428.0, 253.0, 169.0, 93.0, 53.0, 35.0, 24.0, 16.0, 8.0, 2.0, 7.0, 0.0, 1.0, 2.0], "bins": [-9.7890625, -9.51422119140625, -9.2393798828125, -8.96453857421875, -8.689697265625, -8.41485595703125, -8.1400146484375, -7.86517333984375, -7.59033203125, -7.31549072265625, -7.0406494140625, -6.76580810546875, -6.490966796875, -6.21612548828125, -5.9412841796875, -5.66644287109375, -5.3916015625, -5.11676025390625, -4.8419189453125, -4.56707763671875, -4.292236328125, -4.01739501953125, -3.7425537109375, -3.46771240234375, -3.19287109375, -2.91802978515625, -2.6431884765625, -2.36834716796875, -2.093505859375, -1.81866455078125, -1.5438232421875, -1.26898193359375, -0.994140625, -0.71929931640625, -0.4444580078125, -0.16961669921875, 0.105224609375, 0.38006591796875, 0.6549072265625, 0.92974853515625, 1.20458984375, 1.47943115234375, 1.7542724609375, 2.02911376953125, 2.303955078125, 2.57879638671875, 2.8536376953125, 3.12847900390625, 3.4033203125, 3.67816162109375, 3.9530029296875, 4.22784423828125, 4.502685546875, 4.77752685546875, 5.0523681640625, 5.32720947265625, 5.60205078125, 5.87689208984375, 6.1517333984375, 6.42657470703125, 6.701416015625, 6.97625732421875, 7.2510986328125, 7.52593994140625, 7.80078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 7.0, 2.0, 7.0, 6.0, 8.0, 9.0, 14.0, 21.0, 15.0, 21.0, 19.0, 32.0, 32.0, 36.0, 38.0, 42.0, 43.0, 48.0, 43.0, 54.0, 52.0, 55.0, 45.0, 53.0, 55.0, 29.0, 45.0, 23.0, 26.0, 15.0, 17.0, 22.0, 12.0, 12.0, 9.0, 6.0, 3.0, 3.0, 2.0, 5.0, 2.0, 9.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.19140625, -4.05523681640625, -3.9190673828125, -3.78289794921875, -3.646728515625, -3.51055908203125, -3.3743896484375, -3.23822021484375, -3.10205078125, -2.96588134765625, -2.8297119140625, -2.69354248046875, -2.557373046875, -2.42120361328125, -2.2850341796875, -2.14886474609375, -2.0126953125, -1.87652587890625, -1.7403564453125, -1.60418701171875, -1.468017578125, -1.33184814453125, -1.1956787109375, -1.05950927734375, -0.92333984375, -0.78717041015625, -0.6510009765625, -0.51483154296875, -0.378662109375, -0.24249267578125, -0.1063232421875, 0.02984619140625, 0.166015625, 0.30218505859375, 0.4383544921875, 0.57452392578125, 0.710693359375, 0.84686279296875, 0.9830322265625, 1.11920166015625, 1.25537109375, 1.39154052734375, 1.5277099609375, 1.66387939453125, 1.800048828125, 1.93621826171875, 2.0723876953125, 2.20855712890625, 2.3447265625, 2.48089599609375, 2.6170654296875, 2.75323486328125, 2.889404296875, 3.02557373046875, 3.1617431640625, 3.29791259765625, 3.43408203125, 3.57025146484375, 3.7064208984375, 3.84259033203125, 3.978759765625, 4.11492919921875, 4.2510986328125, 4.38726806640625, 4.5234375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 4.0, 5.0, 11.0, 7.0, 3.0, 20.0, 16.0, 17.0, 19.0, 17.0, 26.0, 31.0, 30.0, 35.0, 35.0, 37.0, 38.0, 31.0, 42.0, 43.0, 45.0, 51.0, 50.0, 41.0, 45.0, 27.0, 40.0, 24.0, 23.0, 36.0, 28.0, 10.0, 16.0, 15.0, 12.0, 11.0, 14.0, 11.0, 11.0, 6.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.628761291503906, -26.781553268432617, -25.934343338012695, -25.087135314941406, -24.239925384521484, -23.392717361450195, -22.545509338378906, -21.698299407958984, -20.851089477539062, -20.003881454467773, -19.15667152404785, -18.309463500976562, -17.46225357055664, -16.61504554748535, -15.767836570739746, -14.92062759399414, -14.073419570922852, -13.226210594177246, -12.37900161743164, -11.531793594360352, -10.68458366394043, -9.83737564086914, -8.990166664123535, -8.14295768737793, -7.295748710632324, -6.448539733886719, -5.601330757141113, -4.754122257232666, -3.9069132804870605, -3.059704303741455, -2.212495803833008, -1.3652868270874023, -0.5180759429931641, 0.32913291454315186, 1.1763417720794678, 2.023550510406494, 2.8707594871520996, 3.717968463897705, 4.565176963806152, 5.412385940551758, 6.259594917297363, 7.106803894042969, 7.954012870788574, 8.80122184753418, 9.648429870605469, 10.49563980102539, 11.34284782409668, 12.190056800842285, 13.03726577758789, 13.884474754333496, 14.731683731079102, 15.57889175415039, 16.426101684570312, 17.2733097076416, 18.12051773071289, 18.967727661132812, 19.814937591552734, 20.662145614624023, 21.509355545043945, 22.356563568115234, 23.203773498535156, 24.050981521606445, 24.898189544677734, 25.745399475097656, 26.592607498168945]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 7.0, 8.0, 5.0, 10.0, 11.0, 13.0, 18.0, 19.0, 22.0, 21.0, 16.0, 29.0, 30.0, 33.0, 23.0, 37.0, 39.0, 43.0, 43.0, 33.0, 40.0, 31.0, 41.0, 41.0, 40.0, 31.0, 36.0, 38.0, 30.0, 26.0, 28.0, 34.0, 14.0, 14.0, 16.0, 11.0, 14.0, 12.0, 11.0, 7.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.764745712280273, -28.830656051635742, -27.89656639099121, -26.96247673034668, -26.02838897705078, -25.09429931640625, -24.16020965576172, -23.226119995117188, -22.292030334472656, -21.357940673828125, -20.423851013183594, -19.489761352539062, -18.55567169189453, -17.62158203125, -16.6874942779541, -15.75340461730957, -14.819314956665039, -13.885225296020508, -12.951135635375977, -12.017046928405762, -11.08295726776123, -10.1488676071167, -9.214778900146484, -8.280689239501953, -7.346599578857422, -6.412509918212891, -5.478420734405518, -4.5443315505981445, -3.6102418899536133, -2.676152229309082, -1.742063045501709, -0.8079738616943359, 0.12611770629882812, 1.0602071285247803, 1.9942965507507324, 2.9283859729766846, 3.8624753952026367, 4.796565055847168, 5.730654239654541, 6.664743423461914, 7.598833084106445, 8.532922744750977, 9.467012405395508, 10.401101112365723, 11.335190773010254, 12.269280433654785, 13.203369140625, 14.137458801269531, 15.071548461914062, 16.005638122558594, 16.939727783203125, 17.873817443847656, 18.807907104492188, 19.74199676513672, 20.676084518432617, 21.61017417907715, 22.54426383972168, 23.47835350036621, 24.412443161010742, 25.346532821655273, 26.280620574951172, 27.214710235595703, 28.148799896240234, 29.082889556884766, 30.016979217529297]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 8.0, 13.0, 30.0, 44.0, 84.0, 130.0, 210.0, 397.0, 632.0, 1080.0, 1737.0, 2916.0, 4900.0, 8017.0, 13355.0, 21775.0, 34928.0, 56198.0, 87434.0, 133166.0, 193867.0, 271529.0, 353335.0, 427493.0, 472617.0, 472669.0, 430510.0, 357569.0, 274745.0, 197425.0, 135854.0, 89588.0, 57210.0, 36232.0, 22308.0, 13651.0, 8264.0, 4988.0, 3003.0, 1808.0, 1030.0, 650.0, 383.0, 207.0, 114.0, 67.0, 44.0, 24.0, 15.0, 16.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.0625, -20.40478515625, -19.7470703125, -19.08935546875, -18.431640625, -17.77392578125, -17.1162109375, -16.45849609375, -15.80078125, -15.14306640625, -14.4853515625, -13.82763671875, -13.169921875, -12.51220703125, -11.8544921875, -11.19677734375, -10.5390625, -9.88134765625, -9.2236328125, -8.56591796875, -7.908203125, -7.25048828125, -6.5927734375, -5.93505859375, -5.27734375, -4.61962890625, -3.9619140625, -3.30419921875, -2.646484375, -1.98876953125, -1.3310546875, -0.67333984375, -0.015625, 0.64208984375, 1.2998046875, 1.95751953125, 2.615234375, 3.27294921875, 3.9306640625, 4.58837890625, 5.24609375, 5.90380859375, 6.5615234375, 7.21923828125, 7.876953125, 8.53466796875, 9.1923828125, 9.85009765625, 10.5078125, 11.16552734375, 11.8232421875, 12.48095703125, 13.138671875, 13.79638671875, 14.4541015625, 15.11181640625, 15.76953125, 16.42724609375, 17.0849609375, 17.74267578125, 18.400390625, 19.05810546875, 19.7158203125, 20.37353515625, 21.03125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 7.0, 10.0, 5.0, 11.0, 10.0, 12.0, 19.0, 19.0, 21.0, 19.0, 19.0, 22.0, 34.0, 31.0, 23.0, 34.0, 44.0, 36.0, 44.0, 35.0, 45.0, 35.0, 31.0, 35.0, 51.0, 28.0, 29.0, 44.0, 31.0, 30.0, 31.0, 23.0, 23.0, 11.0, 14.0, 14.0, 10.0, 19.0, 7.0, 11.0, 3.0, 6.0, 2.0, 6.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-26.015625, -25.201416015625, -24.38720703125, -23.572998046875, -22.7587890625, -21.944580078125, -21.13037109375, -20.316162109375, -19.501953125, -18.687744140625, -17.87353515625, -17.059326171875, -16.2451171875, -15.430908203125, -14.61669921875, -13.802490234375, -12.98828125, -12.174072265625, -11.35986328125, -10.545654296875, -9.7314453125, -8.917236328125, -8.10302734375, -7.288818359375, -6.474609375, -5.660400390625, -4.84619140625, -4.031982421875, -3.2177734375, -2.403564453125, -1.58935546875, -0.775146484375, 0.0390625, 0.853271484375, 1.66748046875, 2.481689453125, 3.2958984375, 4.110107421875, 4.92431640625, 5.738525390625, 6.552734375, 7.366943359375, 8.18115234375, 8.995361328125, 9.8095703125, 10.623779296875, 11.43798828125, 12.252197265625, 13.06640625, 13.880615234375, 14.69482421875, 15.509033203125, 16.3232421875, 17.137451171875, 17.95166015625, 18.765869140625, 19.580078125, 20.394287109375, 21.20849609375, 22.022705078125, 22.8369140625, 23.651123046875, 24.46533203125, 25.279541015625, 26.09375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 20.0, 25.0, 54.0, 76.0, 143.0, 231.0, 402.0, 655.0, 1154.0, 1975.0, 3346.0, 5519.0, 9072.0, 15003.0, 23880.0, 37452.0, 58011.0, 87649.0, 128097.0, 179854.0, 242047.0, 310599.0, 371804.0, 415509.0, 431050.0, 412445.0, 369045.0, 306511.0, 238996.0, 177742.0, 125792.0, 85945.0, 56954.0, 36751.0, 23614.0, 14559.0, 8925.0, 5368.0, 3342.0, 1908.0, 1114.0, 667.0, 435.0, 216.0, 130.0, 91.0, 45.0, 29.0, 12.0, 11.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-21.8125, -21.140869140625, -20.46923828125, -19.797607421875, -19.1259765625, -18.454345703125, -17.78271484375, -17.111083984375, -16.439453125, -15.767822265625, -15.09619140625, -14.424560546875, -13.7529296875, -13.081298828125, -12.40966796875, -11.738037109375, -11.06640625, -10.394775390625, -9.72314453125, -9.051513671875, -8.3798828125, -7.708251953125, -7.03662109375, -6.364990234375, -5.693359375, -5.021728515625, -4.35009765625, -3.678466796875, -3.0068359375, -2.335205078125, -1.66357421875, -0.991943359375, -0.3203125, 0.351318359375, 1.02294921875, 1.694580078125, 2.3662109375, 3.037841796875, 3.70947265625, 4.381103515625, 5.052734375, 5.724365234375, 6.39599609375, 7.067626953125, 7.7392578125, 8.410888671875, 9.08251953125, 9.754150390625, 10.42578125, 11.097412109375, 11.76904296875, 12.440673828125, 13.1123046875, 13.783935546875, 14.45556640625, 15.127197265625, 15.798828125, 16.470458984375, 17.14208984375, 17.813720703125, 18.4853515625, 19.156982421875, 19.82861328125, 20.500244140625, 21.171875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 10.0, 4.0, 7.0, 10.0, 20.0, 21.0, 30.0, 30.0, 43.0, 54.0, 77.0, 69.0, 89.0, 103.0, 126.0, 117.0, 131.0, 159.0, 170.0, 170.0, 183.0, 183.0, 194.0, 188.0, 201.0, 210.0, 165.0, 204.0, 164.0, 143.0, 110.0, 126.0, 85.0, 80.0, 74.0, 80.0, 53.0, 43.0, 38.0, 21.0, 22.0, 18.0, 12.0, 13.0, 12.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.8203125, -11.4708251953125, -11.121337890625, -10.7718505859375, -10.42236328125, -10.0728759765625, -9.723388671875, -9.3739013671875, -9.0244140625, -8.6749267578125, -8.325439453125, -7.9759521484375, -7.62646484375, -7.2769775390625, -6.927490234375, -6.5780029296875, -6.228515625, -5.8790283203125, -5.529541015625, -5.1800537109375, -4.83056640625, -4.4810791015625, -4.131591796875, -3.7821044921875, -3.4326171875, -3.0831298828125, -2.733642578125, -2.3841552734375, -2.03466796875, -1.6851806640625, -1.335693359375, -0.9862060546875, -0.63671875, -0.2872314453125, 0.062255859375, 0.4117431640625, 0.76123046875, 1.1107177734375, 1.460205078125, 1.8096923828125, 2.1591796875, 2.5086669921875, 2.858154296875, 3.2076416015625, 3.55712890625, 3.9066162109375, 4.256103515625, 4.6055908203125, 4.955078125, 5.3045654296875, 5.654052734375, 6.0035400390625, 6.35302734375, 6.7025146484375, 7.052001953125, 7.4014892578125, 7.7509765625, 8.1004638671875, 8.449951171875, 8.7994384765625, 9.14892578125, 9.4984130859375, 9.847900390625, 10.1973876953125, 10.546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 3.0, 4.0, 5.0, 7.0, 8.0, 13.0, 14.0, 12.0, 17.0, 23.0, 23.0, 37.0, 25.0, 34.0, 28.0, 41.0, 39.0, 33.0, 45.0, 41.0, 46.0, 42.0, 40.0, 56.0, 31.0, 31.0, 36.0, 35.0, 28.0, 19.0, 35.0, 24.0, 26.0, 18.0, 12.0, 13.0, 18.0, 8.0, 4.0, 8.0, 12.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.142011642456055, -27.26846694946289, -26.394922256469727, -25.521377563476562, -24.6478328704834, -23.774288177490234, -22.900741577148438, -22.027196884155273, -21.15365219116211, -20.280107498168945, -19.40656280517578, -18.533018112182617, -17.659473419189453, -16.785926818847656, -15.912383079528809, -15.038837432861328, -14.16529369354248, -13.291749000549316, -12.418204307556152, -11.544658660888672, -10.671113967895508, -9.797569274902344, -8.92402458190918, -8.050479888916016, -7.176934719085693, -6.303390026092529, -5.429844856262207, -4.556300163269043, -3.6827552318573, -2.8092103004455566, -1.9356656074523926, -1.0621204376220703, -0.18857574462890625, 0.6849691271781921, 1.5585139989852905, 2.432058811187744, 3.3056037425994873, 4.1791486740112305, 5.0526933670043945, 5.926238536834717, 6.799783229827881, 7.673327922821045, 8.546873092651367, 9.420417785644531, 10.293962478637695, 11.16750717163086, 12.041051864624023, 12.914597511291504, 13.788142204284668, 14.661686897277832, 15.535231590270996, 16.408777236938477, 17.28232192993164, 18.155866622924805, 19.02941131591797, 19.902956008911133, 20.776500701904297, 21.65004539489746, 22.523590087890625, 23.39713478088379, 24.270679473876953, 25.14422607421875, 26.01776885986328, 26.891315460205078, 27.764860153198242]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 8.0, 7.0, 13.0, 12.0, 10.0, 12.0, 13.0, 18.0, 15.0, 24.0, 20.0, 22.0, 18.0, 24.0, 43.0, 30.0, 34.0, 34.0, 29.0, 32.0, 34.0, 31.0, 27.0, 45.0, 38.0, 39.0, 25.0, 27.0, 29.0, 35.0, 22.0, 25.0, 30.0, 27.0, 15.0, 25.0, 16.0, 13.0, 11.0, 14.0, 9.0, 9.0, 7.0, 4.0, 3.0, 3.0, 6.0, 1.0, 2.0, 6.0, 1.0, 2.0], "bins": [-27.159069061279297, -26.358509063720703, -25.557947158813477, -24.75738525390625, -23.956825256347656, -23.156265258789062, -22.355703353881836, -21.55514144897461, -20.754581451416016, -19.954021453857422, -19.153459548950195, -18.35289764404297, -17.552337646484375, -16.75177764892578, -15.951215744018555, -15.150654792785645, -14.350093841552734, -13.549532890319824, -12.748971939086914, -11.948410987854004, -11.147850036621094, -10.347289085388184, -9.546728134155273, -8.746167182922363, -7.945606231689453, -7.145045280456543, -6.344484329223633, -5.543923377990723, -4.7433624267578125, -3.9428014755249023, -3.142240524291992, -2.341679573059082, -1.5411205291748047, -0.7405595779418945, 0.060001373291015625, 0.8605623245239258, 1.661123275756836, 2.461684226989746, 3.2622451782226562, 4.062806129455566, 4.863367080688477, 5.663928031921387, 6.464488983154297, 7.265049934387207, 8.065610885620117, 8.866171836853027, 9.666732788085938, 10.467293739318848, 11.267854690551758, 12.068415641784668, 12.868976593017578, 13.669537544250488, 14.470098495483398, 15.270659446716309, 16.07122039794922, 16.871780395507812, 17.67234230041504, 18.472904205322266, 19.27346420288086, 20.074024200439453, 20.87458610534668, 21.675148010253906, 22.4757080078125, 23.276268005371094, 24.07682991027832]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 12.0, 7.0, 30.0, 28.0, 62.0, 77.0, 138.0, 249.0, 348.0, 595.0, 950.0, 1542.0, 2341.0, 3793.0, 6017.0, 8948.0, 13370.0, 19573.0, 28378.0, 38789.0, 51911.0, 66210.0, 80646.0, 91755.0, 98769.0, 99144.0, 93527.0, 82463.0, 68998.0, 54692.0, 41303.0, 30405.0, 21327.0, 14701.0, 9834.0, 6373.0, 4199.0, 2634.0, 1650.0, 1053.0, 645.0, 408.0, 251.0, 152.0, 91.0, 61.0, 48.0, 26.0, 9.0, 12.0, 10.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.90234375, -6.680419921875, -6.45849609375, -6.236572265625, -6.0146484375, -5.792724609375, -5.57080078125, -5.348876953125, -5.126953125, -4.905029296875, -4.68310546875, -4.461181640625, -4.2392578125, -4.017333984375, -3.79541015625, -3.573486328125, -3.3515625, -3.129638671875, -2.90771484375, -2.685791015625, -2.4638671875, -2.241943359375, -2.02001953125, -1.798095703125, -1.576171875, -1.354248046875, -1.13232421875, -0.910400390625, -0.6884765625, -0.466552734375, -0.24462890625, -0.022705078125, 0.19921875, 0.421142578125, 0.64306640625, 0.864990234375, 1.0869140625, 1.308837890625, 1.53076171875, 1.752685546875, 1.974609375, 2.196533203125, 2.41845703125, 2.640380859375, 2.8623046875, 3.084228515625, 3.30615234375, 3.528076171875, 3.75, 3.971923828125, 4.19384765625, 4.415771484375, 4.6376953125, 4.859619140625, 5.08154296875, 5.303466796875, 5.525390625, 5.747314453125, 5.96923828125, 6.191162109375, 6.4130859375, 6.635009765625, 6.85693359375, 7.078857421875, 7.30078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 10.0, 8.0, 6.0, 12.0, 16.0, 10.0, 10.0, 13.0, 18.0, 16.0, 23.0, 22.0, 22.0, 17.0, 24.0, 42.0, 34.0, 31.0, 33.0, 34.0, 29.0, 35.0, 30.0, 29.0, 45.0, 38.0, 35.0, 28.0, 26.0, 29.0, 35.0, 22.0, 27.0, 27.0, 25.0, 22.0, 20.0, 16.0, 13.0, 13.0, 10.0, 10.0, 8.0, 7.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 6.0, 1.0, 2.0], "bins": [-27.15625, -26.353759765625, -25.55126953125, -24.748779296875, -23.9462890625, -23.143798828125, -22.34130859375, -21.538818359375, -20.736328125, -19.933837890625, -19.13134765625, -18.328857421875, -17.5263671875, -16.723876953125, -15.92138671875, -15.118896484375, -14.31640625, -13.513916015625, -12.71142578125, -11.908935546875, -11.1064453125, -10.303955078125, -9.50146484375, -8.698974609375, -7.896484375, -7.093994140625, -6.29150390625, -5.489013671875, -4.6865234375, -3.884033203125, -3.08154296875, -2.279052734375, -1.4765625, -0.674072265625, 0.12841796875, 0.930908203125, 1.7333984375, 2.535888671875, 3.33837890625, 4.140869140625, 4.943359375, 5.745849609375, 6.54833984375, 7.350830078125, 8.1533203125, 8.955810546875, 9.75830078125, 10.560791015625, 11.36328125, 12.165771484375, 12.96826171875, 13.770751953125, 14.5732421875, 15.375732421875, 16.17822265625, 16.980712890625, 17.783203125, 18.585693359375, 19.38818359375, 20.190673828125, 20.9931640625, 21.795654296875, 22.59814453125, 23.400634765625, 24.203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 11.0, 28.0, 32.0, 46.0, 69.0, 136.0, 169.0, 292.0, 427.0, 732.0, 1111.0, 1718.0, 2583.0, 4042.0, 6141.0, 9645.0, 15375.0, 26537.0, 118180.0, 770764.0, 36438.0, 20252.0, 12329.0, 7640.0, 4859.0, 3191.0, 2038.0, 1353.0, 845.0, 574.0, 355.0, 252.0, 143.0, 82.0, 51.0, 36.0, 27.0, 19.0, 22.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.3125, -24.551025390625, -23.78955078125, -23.028076171875, -22.2666015625, -21.505126953125, -20.74365234375, -19.982177734375, -19.220703125, -18.459228515625, -17.69775390625, -16.936279296875, -16.1748046875, -15.413330078125, -14.65185546875, -13.890380859375, -13.12890625, -12.367431640625, -11.60595703125, -10.844482421875, -10.0830078125, -9.321533203125, -8.56005859375, -7.798583984375, -7.037109375, -6.275634765625, -5.51416015625, -4.752685546875, -3.9912109375, -3.229736328125, -2.46826171875, -1.706787109375, -0.9453125, -0.183837890625, 0.57763671875, 1.339111328125, 2.1005859375, 2.862060546875, 3.62353515625, 4.385009765625, 5.146484375, 5.907958984375, 6.66943359375, 7.430908203125, 8.1923828125, 8.953857421875, 9.71533203125, 10.476806640625, 11.23828125, 11.999755859375, 12.76123046875, 13.522705078125, 14.2841796875, 15.045654296875, 15.80712890625, 16.568603515625, 17.330078125, 18.091552734375, 18.85302734375, 19.614501953125, 20.3759765625, 21.137451171875, 21.89892578125, 22.660400390625, 23.421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 10.0, 4.0, 4.0, 5.0, 8.0, 9.0, 13.0, 15.0, 20.0, 19.0, 16.0, 27.0, 36.0, 37.0, 33.0, 36.0, 28.0, 39.0, 31.0, 37.0, 37.0, 37.0, 43.0, 38.0, 40.0, 32.0, 43.0, 35.0, 50.0, 27.0, 31.0, 21.0, 24.0, 16.0, 25.0, 12.0, 10.0, 11.0, 8.0, 5.0, 11.0, 5.0, 2.0, 8.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.15625, -16.550048828125, -15.94384765625, -15.337646484375, -14.7314453125, -14.125244140625, -13.51904296875, -12.912841796875, -12.306640625, -11.700439453125, -11.09423828125, -10.488037109375, -9.8818359375, -9.275634765625, -8.66943359375, -8.063232421875, -7.45703125, -6.850830078125, -6.24462890625, -5.638427734375, -5.0322265625, -4.426025390625, -3.81982421875, -3.213623046875, -2.607421875, -2.001220703125, -1.39501953125, -0.788818359375, -0.1826171875, 0.423583984375, 1.02978515625, 1.635986328125, 2.2421875, 2.848388671875, 3.45458984375, 4.060791015625, 4.6669921875, 5.273193359375, 5.87939453125, 6.485595703125, 7.091796875, 7.697998046875, 8.30419921875, 8.910400390625, 9.5166015625, 10.122802734375, 10.72900390625, 11.335205078125, 11.94140625, 12.547607421875, 13.15380859375, 13.760009765625, 14.3662109375, 14.972412109375, 15.57861328125, 16.184814453125, 16.791015625, 17.397216796875, 18.00341796875, 18.609619140625, 19.2158203125, 19.822021484375, 20.42822265625, 21.034423828125, 21.640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 11.0, 12.0, 19.0, 16.0, 34.0, 40.0, 65.0, 97.0, 150.0, 231.0, 370.0, 631.0, 1036.0, 1631.0, 2620.0, 4606.0, 7728.0, 13949.0, 26168.0, 113989.0, 789849.0, 40477.0, 19088.0, 10433.0, 5995.0, 3615.0, 2204.0, 1283.0, 806.0, 530.0, 315.0, 175.0, 119.0, 84.0, 58.0, 38.0, 20.0, 19.0, 12.0, 9.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9345703125, -1.8726959228515625, -1.810821533203125, -1.7489471435546875, -1.68707275390625, -1.6251983642578125, -1.563323974609375, -1.5014495849609375, -1.4395751953125, -1.3777008056640625, -1.315826416015625, -1.2539520263671875, -1.19207763671875, -1.1302032470703125, -1.068328857421875, -1.0064544677734375, -0.944580078125, -0.8827056884765625, -0.820831298828125, -0.7589569091796875, -0.69708251953125, -0.6352081298828125, -0.573333740234375, -0.5114593505859375, -0.4495849609375, -0.3877105712890625, -0.325836181640625, -0.2639617919921875, -0.20208740234375, -0.1402130126953125, -0.078338623046875, -0.0164642333984375, 0.04541015625, 0.1072845458984375, 0.169158935546875, 0.2310333251953125, 0.29290771484375, 0.3547821044921875, 0.416656494140625, 0.4785308837890625, 0.5404052734375, 0.6022796630859375, 0.664154052734375, 0.7260284423828125, 0.78790283203125, 0.8497772216796875, 0.911651611328125, 0.9735260009765625, 1.035400390625, 1.0972747802734375, 1.159149169921875, 1.2210235595703125, 1.28289794921875, 1.3447723388671875, 1.406646728515625, 1.4685211181640625, 1.5303955078125, 1.5922698974609375, 1.654144287109375, 1.7160186767578125, 1.77789306640625, 1.8397674560546875, 1.901641845703125, 1.9635162353515625, 2.025390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 6.0, 1.0, 5.0, 2.0, 5.0, 10.0, 8.0, 14.0, 13.0, 26.0, 20.0, 33.0, 41.0, 38.0, 40.0, 34.0, 44.0, 51.0, 63.0, 53.0, 60.0, 56.0, 43.0, 53.0, 42.0, 47.0, 25.0, 32.0, 30.0, 23.0, 16.0, 11.0, 14.0, 8.0, 6.0, 2.0, 5.0, 6.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.00015807151794433594, -0.00015353411436080933, -0.00014899671077728271, -0.0001444593071937561, -0.0001399219036102295, -0.00013538450002670288, -0.00013084709644317627, -0.00012630969285964966, -0.00012177228927612305, -0.00011723488569259644, -0.00011269748210906982, -0.00010816007852554321, -0.0001036226749420166, -9.908527135848999e-05, -9.454786777496338e-05, -9.001046419143677e-05, -8.547306060791016e-05, -8.093565702438354e-05, -7.639825344085693e-05, -7.186084985733032e-05, -6.732344627380371e-05, -6.27860426902771e-05, -5.824863910675049e-05, -5.371123552322388e-05, -4.9173831939697266e-05, -4.4636428356170654e-05, -4.009902477264404e-05, -3.556162118911743e-05, -3.102421760559082e-05, -2.648681402206421e-05, -2.1949410438537598e-05, -1.7412006855010986e-05, -1.2874603271484375e-05, -8.337199687957764e-06, -3.7997961044311523e-06, 7.37607479095459e-07, 5.27501106262207e-06, 9.812414646148682e-06, 1.4349818229675293e-05, 1.8887221813201904e-05, 2.3424625396728516e-05, 2.7962028980255127e-05, 3.249943256378174e-05, 3.703683614730835e-05, 4.157423973083496e-05, 4.611164331436157e-05, 5.0649046897888184e-05, 5.5186450481414795e-05, 5.9723854064941406e-05, 6.426125764846802e-05, 6.879866123199463e-05, 7.333606481552124e-05, 7.787346839904785e-05, 8.241087198257446e-05, 8.694827556610107e-05, 9.148567914962769e-05, 9.60230827331543e-05, 0.00010056048631668091, 0.00010509788990020752, 0.00010963529348373413, 0.00011417269706726074, 0.00011871010065078735, 0.00012324750423431396, 0.00012778490781784058, 0.0001323223114013672]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 17.0, 37.0, 36.0, 73.0, 92.0, 170.0, 240.0, 424.0, 702.0, 1221.0, 1987.0, 3232.0, 5323.0, 8185.0, 13349.0, 20669.0, 30856.0, 44845.0, 62202.0, 81472.0, 99056.0, 110863.0, 114385.0, 108292.0, 93645.0, 75338.0, 56321.0, 40173.0, 27181.0, 17731.0, 11574.0, 7353.0, 4459.0, 2806.0, 1641.0, 1016.0, 620.0, 373.0, 222.0, 134.0, 75.0, 56.0, 36.0, 25.0, 12.0, 9.0, 11.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.95068359375, -0.92034912109375, -0.8900146484375, -0.85968017578125, -0.829345703125, -0.79901123046875, -0.7686767578125, -0.73834228515625, -0.7080078125, -0.67767333984375, -0.6473388671875, -0.61700439453125, -0.586669921875, -0.55633544921875, -0.5260009765625, -0.49566650390625, -0.46533203125, -0.43499755859375, -0.4046630859375, -0.37432861328125, -0.343994140625, -0.31365966796875, -0.2833251953125, -0.25299072265625, -0.22265625, -0.19232177734375, -0.1619873046875, -0.13165283203125, -0.101318359375, -0.07098388671875, -0.0406494140625, -0.01031494140625, 0.02001953125, 0.05035400390625, 0.0806884765625, 0.11102294921875, 0.141357421875, 0.17169189453125, 0.2020263671875, 0.23236083984375, 0.2626953125, 0.29302978515625, 0.3233642578125, 0.35369873046875, 0.384033203125, 0.41436767578125, 0.4447021484375, 0.47503662109375, 0.50537109375, 0.53570556640625, 0.5660400390625, 0.59637451171875, 0.626708984375, 0.65704345703125, 0.6873779296875, 0.71771240234375, 0.748046875, 0.77838134765625, 0.8087158203125, 0.83905029296875, 0.869384765625, 0.89971923828125, 0.9300537109375, 0.96038818359375, 0.99072265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 6.0, 3.0, 3.0, 5.0, 4.0, 8.0, 4.0, 4.0, 10.0, 16.0, 10.0, 11.0, 14.0, 18.0, 16.0, 22.0, 19.0, 20.0, 28.0, 28.0, 26.0, 29.0, 22.0, 42.0, 30.0, 29.0, 42.0, 32.0, 34.0, 24.0, 30.0, 31.0, 34.0, 34.0, 28.0, 24.0, 27.0, 27.0, 17.0, 25.0, 20.0, 18.0, 19.0, 18.0, 18.0, 18.0, 10.0, 16.0, 9.0, 12.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.385009765625, -0.3726806640625, -0.3603515625, -0.3480224609375, -0.335693359375, -0.3233642578125, -0.31103515625, -0.2987060546875, -0.286376953125, -0.2740478515625, -0.26171875, -0.2493896484375, -0.237060546875, -0.2247314453125, -0.21240234375, -0.2000732421875, -0.187744140625, -0.1754150390625, -0.1630859375, -0.1507568359375, -0.138427734375, -0.1260986328125, -0.11376953125, -0.1014404296875, -0.089111328125, -0.0767822265625, -0.064453125, -0.0521240234375, -0.039794921875, -0.0274658203125, -0.01513671875, -0.0028076171875, 0.009521484375, 0.0218505859375, 0.0341796875, 0.0465087890625, 0.058837890625, 0.0711669921875, 0.08349609375, 0.0958251953125, 0.108154296875, 0.1204833984375, 0.1328125, 0.1451416015625, 0.157470703125, 0.1697998046875, 0.18212890625, 0.1944580078125, 0.206787109375, 0.2191162109375, 0.2314453125, 0.2437744140625, 0.256103515625, 0.2684326171875, 0.28076171875, 0.2930908203125, 0.305419921875, 0.3177490234375, 0.330078125, 0.3424072265625, 0.354736328125, 0.3670654296875, 0.37939453125, 0.3917236328125, 0.404052734375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 8.0, 9.0, 3.0, 6.0, 20.0, 11.0, 20.0, 16.0, 17.0, 38.0, 27.0, 26.0, 37.0, 41.0, 32.0, 36.0, 43.0, 34.0, 44.0, 47.0, 38.0, 54.0, 33.0, 45.0, 39.0, 26.0, 34.0, 23.0, 32.0, 24.0, 24.0, 21.0, 21.0, 14.0, 15.0, 9.0, 8.0, 7.0, 7.0, 8.0, 6.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.845993041992188, -27.963638305664062, -27.081281661987305, -26.19892692565918, -25.316570281982422, -24.434215545654297, -23.551860809326172, -22.669506072998047, -21.78714942932129, -20.904794692993164, -20.022438049316406, -19.14008331298828, -18.257728576660156, -17.3753719329834, -16.493017196655273, -15.610661506652832, -14.72830581665039, -13.84595012664795, -12.963594436645508, -12.081239700317383, -11.198884010314941, -10.3165283203125, -9.434173583984375, -8.551817893981934, -7.669462203979492, -6.787106513977051, -5.904751300811768, -5.022396087646484, -4.140040397644043, -3.2576847076416016, -2.3753294944763184, -1.4929742813110352, -0.6106185913085938, 0.27173686027526855, 1.1540923118591309, 2.036447763442993, 2.9188032150268555, 3.801158905029297, 4.68351411819458, 5.565869331359863, 6.448225021362305, 7.330580711364746, 8.212936401367188, 9.095291137695312, 9.977646827697754, 10.860002517700195, 11.74235725402832, 12.624712944030762, 13.507068634033203, 14.389424324035645, 15.271780014038086, 16.15413475036621, 17.03649139404297, 17.918846130371094, 18.80120086669922, 19.683555603027344, 20.5659122467041, 21.448266983032227, 22.330623626708984, 23.21297836303711, 24.095333099365234, 24.977689743041992, 25.860044479370117, 26.742401123046875, 27.624755859375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 9.0, 7.0, 10.0, 8.0, 11.0, 15.0, 14.0, 8.0, 19.0, 18.0, 19.0, 25.0, 19.0, 17.0, 16.0, 42.0, 31.0, 43.0, 26.0, 34.0, 23.0, 37.0, 35.0, 30.0, 34.0, 38.0, 40.0, 30.0, 33.0, 24.0, 26.0, 28.0, 24.0, 32.0, 27.0, 20.0, 26.0, 17.0, 11.0, 11.0, 16.0, 10.0, 6.0, 11.0, 4.0, 5.0, 2.0, 2.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0], "bins": [-26.567829132080078, -25.769271850585938, -24.97071647644043, -24.172161102294922, -23.37360382080078, -22.57504653930664, -21.776491165161133, -20.977935791015625, -20.179378509521484, -19.380821228027344, -18.582265853881836, -17.783710479736328, -16.985153198242188, -16.186595916748047, -15.388040542602539, -14.589484214782715, -13.79092788696289, -12.992371559143066, -12.193815231323242, -11.395258903503418, -10.596702575683594, -9.79814624786377, -8.999589920043945, -8.201033592224121, -7.402477264404297, -6.603920936584473, -5.805364608764648, -5.006808280944824, -4.208251953125, -3.409695625305176, -2.6111392974853516, -1.8125829696655273, -1.014028549194336, -0.21547222137451172, 0.5830841064453125, 1.3816404342651367, 2.180196762084961, 2.978753089904785, 3.7773094177246094, 4.575865745544434, 5.374422073364258, 6.172978401184082, 6.971534729003906, 7.7700910568237305, 8.568647384643555, 9.367203712463379, 10.165760040283203, 10.964316368103027, 11.762872695922852, 12.561429023742676, 13.3599853515625, 14.158541679382324, 14.957098007202148, 15.755654335021973, 16.554210662841797, 17.352767944335938, 18.151323318481445, 18.949878692626953, 19.748435974121094, 20.546993255615234, 21.345548629760742, 22.14410400390625, 22.94266128540039, 23.74121856689453, 24.53977394104004]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 10.0, 14.0, 19.0, 40.0, 41.0, 67.0, 114.0, 176.0, 269.0, 437.0, 678.0, 1152.0, 1838.0, 2782.0, 4254.0, 6588.0, 10001.0, 15081.0, 22082.0, 31114.0, 42849.0, 56675.0, 71160.0, 84292.0, 94513.0, 99378.0, 98697.0, 90607.0, 78943.0, 64494.0, 50533.0, 37827.0, 26950.0, 18455.0, 12776.0, 8445.0, 5569.0, 3447.0, 2228.0, 1459.0, 960.0, 541.0, 368.0, 233.0, 145.0, 97.0, 55.0, 45.0, 16.0, 19.0, 3.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.53125, -19.88525390625, -19.2392578125, -18.59326171875, -17.947265625, -17.30126953125, -16.6552734375, -16.00927734375, -15.36328125, -14.71728515625, -14.0712890625, -13.42529296875, -12.779296875, -12.13330078125, -11.4873046875, -10.84130859375, -10.1953125, -9.54931640625, -8.9033203125, -8.25732421875, -7.611328125, -6.96533203125, -6.3193359375, -5.67333984375, -5.02734375, -4.38134765625, -3.7353515625, -3.08935546875, -2.443359375, -1.79736328125, -1.1513671875, -0.50537109375, 0.140625, 0.78662109375, 1.4326171875, 2.07861328125, 2.724609375, 3.37060546875, 4.0166015625, 4.66259765625, 5.30859375, 5.95458984375, 6.6005859375, 7.24658203125, 7.892578125, 8.53857421875, 9.1845703125, 9.83056640625, 10.4765625, 11.12255859375, 11.7685546875, 12.41455078125, 13.060546875, 13.70654296875, 14.3525390625, 14.99853515625, 15.64453125, 16.29052734375, 16.9365234375, 17.58251953125, 18.228515625, 18.87451171875, 19.5205078125, 20.16650390625, 20.8125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 10.0, 9.0, 8.0, 6.0, 15.0, 16.0, 8.0, 11.0, 18.0, 24.0, 19.0, 25.0, 17.0, 15.0, 29.0, 35.0, 41.0, 28.0, 28.0, 36.0, 26.0, 35.0, 33.0, 30.0, 38.0, 37.0, 34.0, 34.0, 31.0, 26.0, 27.0, 24.0, 27.0, 28.0, 25.0, 23.0, 25.0, 15.0, 11.0, 10.0, 13.0, 12.0, 7.0, 9.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0], "bins": [-25.21875, -24.453125, -23.6875, -22.921875, -22.15625, -21.390625, -20.625, -19.859375, -19.09375, -18.328125, -17.5625, -16.796875, -16.03125, -15.265625, -14.5, -13.734375, -12.96875, -12.203125, -11.4375, -10.671875, -9.90625, -9.140625, -8.375, -7.609375, -6.84375, -6.078125, -5.3125, -4.546875, -3.78125, -3.015625, -2.25, -1.484375, -0.71875, 0.046875, 0.8125, 1.578125, 2.34375, 3.109375, 3.875, 4.640625, 5.40625, 6.171875, 6.9375, 7.703125, 8.46875, 9.234375, 10.0, 10.765625, 11.53125, 12.296875, 13.0625, 13.828125, 14.59375, 15.359375, 16.125, 16.890625, 17.65625, 18.421875, 19.1875, 19.953125, 20.71875, 21.484375, 22.25, 23.015625, 23.78125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 10.0, 12.0, 25.0, 40.0, 69.0, 110.0, 167.0, 263.0, 437.0, 759.0, 1176.0, 1845.0, 2963.0, 4608.0, 7236.0, 11014.0, 16475.0, 23701.0, 33259.0, 45043.0, 58390.0, 71929.0, 84857.0, 93847.0, 97504.0, 95731.0, 88349.0, 76717.0, 63801.0, 49198.0, 36962.0, 26798.0, 18879.0, 12930.0, 8515.0, 5480.0, 3497.0, 2295.0, 1428.0, 881.0, 504.0, 309.0, 229.0, 117.0, 83.0, 50.0, 20.0, 18.0, 11.0, 9.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.078125, -18.456298828125, -17.83447265625, -17.212646484375, -16.5908203125, -15.968994140625, -15.34716796875, -14.725341796875, -14.103515625, -13.481689453125, -12.85986328125, -12.238037109375, -11.6162109375, -10.994384765625, -10.37255859375, -9.750732421875, -9.12890625, -8.507080078125, -7.88525390625, -7.263427734375, -6.6416015625, -6.019775390625, -5.39794921875, -4.776123046875, -4.154296875, -3.532470703125, -2.91064453125, -2.288818359375, -1.6669921875, -1.045166015625, -0.42333984375, 0.198486328125, 0.8203125, 1.442138671875, 2.06396484375, 2.685791015625, 3.3076171875, 3.929443359375, 4.55126953125, 5.173095703125, 5.794921875, 6.416748046875, 7.03857421875, 7.660400390625, 8.2822265625, 8.904052734375, 9.52587890625, 10.147705078125, 10.76953125, 11.391357421875, 12.01318359375, 12.635009765625, 13.2568359375, 13.878662109375, 14.50048828125, 15.122314453125, 15.744140625, 16.365966796875, 16.98779296875, 17.609619140625, 18.2314453125, 18.853271484375, 19.47509765625, 20.096923828125, 20.71875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 8.0, 4.0, 5.0, 12.0, 11.0, 10.0, 23.0, 23.0, 19.0, 26.0, 19.0, 21.0, 25.0, 27.0, 29.0, 45.0, 34.0, 30.0, 28.0, 39.0, 31.0, 36.0, 40.0, 38.0, 45.0, 23.0, 34.0, 29.0, 29.0, 32.0, 26.0, 30.0, 18.0, 22.0, 19.0, 16.0, 11.0, 15.0, 9.0, 11.0, 6.0, 14.0, 10.0, 6.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-17.78125, -17.25927734375, -16.7373046875, -16.21533203125, -15.693359375, -15.17138671875, -14.6494140625, -14.12744140625, -13.60546875, -13.08349609375, -12.5615234375, -12.03955078125, -11.517578125, -10.99560546875, -10.4736328125, -9.95166015625, -9.4296875, -8.90771484375, -8.3857421875, -7.86376953125, -7.341796875, -6.81982421875, -6.2978515625, -5.77587890625, -5.25390625, -4.73193359375, -4.2099609375, -3.68798828125, -3.166015625, -2.64404296875, -2.1220703125, -1.60009765625, -1.078125, -0.55615234375, -0.0341796875, 0.48779296875, 1.009765625, 1.53173828125, 2.0537109375, 2.57568359375, 3.09765625, 3.61962890625, 4.1416015625, 4.66357421875, 5.185546875, 5.70751953125, 6.2294921875, 6.75146484375, 7.2734375, 7.79541015625, 8.3173828125, 8.83935546875, 9.361328125, 9.88330078125, 10.4052734375, 10.92724609375, 11.44921875, 11.97119140625, 12.4931640625, 13.01513671875, 13.537109375, 14.05908203125, 14.5810546875, 15.10302734375, 15.625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 11.0, 21.0, 12.0, 37.0, 35.0, 66.0, 127.0, 162.0, 318.0, 514.0, 861.0, 1461.0, 2435.0, 4116.0, 7102.0, 12282.0, 20902.0, 35131.0, 57254.0, 86589.0, 119133.0, 142941.0, 149114.0, 131367.0, 100333.0, 69018.0, 43798.0, 26669.0, 15152.0, 9027.0, 5132.0, 3005.0, 1797.0, 1047.0, 602.0, 356.0, 236.0, 150.0, 103.0, 55.0, 35.0, 22.0, 8.0, 10.0, 8.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9375, -10.5631103515625, -10.188720703125, -9.8143310546875, -9.43994140625, -9.0655517578125, -8.691162109375, -8.3167724609375, -7.9423828125, -7.5679931640625, -7.193603515625, -6.8192138671875, -6.44482421875, -6.0704345703125, -5.696044921875, -5.3216552734375, -4.947265625, -4.5728759765625, -4.198486328125, -3.8240966796875, -3.44970703125, -3.0753173828125, -2.700927734375, -2.3265380859375, -1.9521484375, -1.5777587890625, -1.203369140625, -0.8289794921875, -0.45458984375, -0.0802001953125, 0.294189453125, 0.6685791015625, 1.04296875, 1.4173583984375, 1.791748046875, 2.1661376953125, 2.54052734375, 2.9149169921875, 3.289306640625, 3.6636962890625, 4.0380859375, 4.4124755859375, 4.786865234375, 5.1612548828125, 5.53564453125, 5.9100341796875, 6.284423828125, 6.6588134765625, 7.033203125, 7.4075927734375, 7.781982421875, 8.1563720703125, 8.53076171875, 8.9051513671875, 9.279541015625, 9.6539306640625, 10.0283203125, 10.4027099609375, 10.777099609375, 11.1514892578125, 11.52587890625, 11.9002685546875, 12.274658203125, 12.6490478515625, 13.0234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 6.0, 4.0, 5.0, 7.0, 5.0, 8.0, 12.0, 11.0, 14.0, 25.0, 27.0, 20.0, 41.0, 35.0, 50.0, 46.0, 67.0, 55.0, 62.0, 63.0, 62.0, 51.0, 49.0, 38.0, 39.0, 38.0, 27.0, 26.0, 20.0, 17.0, 17.0, 18.0, 8.0, 7.0, 5.0, 8.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0014162063598632812, -0.001373589038848877, -0.0013309717178344727, -0.0012883543968200684, -0.001245737075805664, -0.0012031197547912598, -0.0011605024337768555, -0.0011178851127624512, -0.0010752677917480469, -0.0010326504707336426, -0.0009900331497192383, -0.000947415828704834, -0.0009047985076904297, -0.0008621811866760254, -0.0008195638656616211, -0.0007769465446472168, -0.0007343292236328125, -0.0006917119026184082, -0.0006490945816040039, -0.0006064772605895996, -0.0005638599395751953, -0.000521242618560791, -0.0004786252975463867, -0.0004360079765319824, -0.0003933906555175781, -0.00035077333450317383, -0.00030815601348876953, -0.00026553869247436523, -0.00022292137145996094, -0.00018030405044555664, -0.00013768672943115234, -9.506940841674805e-05, -5.245208740234375e-05, -9.834766387939453e-06, 3.2782554626464844e-05, 7.539987564086914e-05, 0.00011801719665527344, 0.00016063451766967773, 0.00020325183868408203, 0.00024586915969848633, 0.0002884864807128906, 0.0003311038017272949, 0.0003737211227416992, 0.0004163384437561035, 0.0004589557647705078, 0.0005015730857849121, 0.0005441904067993164, 0.0005868077278137207, 0.000629425048828125, 0.0006720423698425293, 0.0007146596908569336, 0.0007572770118713379, 0.0007998943328857422, 0.0008425116539001465, 0.0008851289749145508, 0.0009277462959289551, 0.0009703636169433594, 0.0010129809379577637, 0.001055598258972168, 0.0010982155799865723, 0.0011408329010009766, 0.0011834502220153809, 0.0012260675430297852, 0.0012686848640441895, 0.0013113021850585938]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 22.0, 26.0, 44.0, 67.0, 118.0, 179.0, 346.0, 627.0, 1119.0, 1975.0, 3736.0, 6687.0, 12393.0, 22413.0, 39004.0, 64550.0, 97771.0, 131214.0, 153161.0, 151326.0, 126892.0, 92674.0, 60132.0, 36238.0, 20682.0, 11352.0, 6226.0, 3330.0, 1864.0, 1077.0, 542.0, 306.0, 195.0, 97.0, 65.0, 43.0, 20.0, 9.0, 10.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.1484375, -13.754638671875, -13.36083984375, -12.967041015625, -12.5732421875, -12.179443359375, -11.78564453125, -11.391845703125, -10.998046875, -10.604248046875, -10.21044921875, -9.816650390625, -9.4228515625, -9.029052734375, -8.63525390625, -8.241455078125, -7.84765625, -7.453857421875, -7.06005859375, -6.666259765625, -6.2724609375, -5.878662109375, -5.48486328125, -5.091064453125, -4.697265625, -4.303466796875, -3.90966796875, -3.515869140625, -3.1220703125, -2.728271484375, -2.33447265625, -1.940673828125, -1.546875, -1.153076171875, -0.75927734375, -0.365478515625, 0.0283203125, 0.422119140625, 0.81591796875, 1.209716796875, 1.603515625, 1.997314453125, 2.39111328125, 2.784912109375, 3.1787109375, 3.572509765625, 3.96630859375, 4.360107421875, 4.75390625, 5.147705078125, 5.54150390625, 5.935302734375, 6.3291015625, 6.722900390625, 7.11669921875, 7.510498046875, 7.904296875, 8.298095703125, 8.69189453125, 9.085693359375, 9.4794921875, 9.873291015625, 10.26708984375, 10.660888671875, 11.0546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 7.0, 3.0, 4.0, 15.0, 14.0, 8.0, 16.0, 12.0, 16.0, 27.0, 28.0, 24.0, 27.0, 36.0, 40.0, 37.0, 43.0, 31.0, 49.0, 42.0, 41.0, 47.0, 40.0, 31.0, 36.0, 32.0, 31.0, 38.0, 30.0, 25.0, 32.0, 23.0, 26.0, 14.0, 16.0, 11.0, 10.0, 6.0, 9.0, 6.0, 4.0, 2.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-4.1875, -4.065826416015625, -3.94415283203125, -3.822479248046875, -3.7008056640625, -3.579132080078125, -3.45745849609375, -3.335784912109375, -3.214111328125, -3.092437744140625, -2.97076416015625, -2.849090576171875, -2.7274169921875, -2.605743408203125, -2.48406982421875, -2.362396240234375, -2.24072265625, -2.119049072265625, -1.99737548828125, -1.875701904296875, -1.7540283203125, -1.632354736328125, -1.51068115234375, -1.389007568359375, -1.267333984375, -1.145660400390625, -1.02398681640625, -0.902313232421875, -0.7806396484375, -0.658966064453125, -0.53729248046875, -0.415618896484375, -0.2939453125, -0.172271728515625, -0.05059814453125, 0.071075439453125, 0.1927490234375, 0.314422607421875, 0.43609619140625, 0.557769775390625, 0.679443359375, 0.801116943359375, 0.92279052734375, 1.044464111328125, 1.1661376953125, 1.287811279296875, 1.40948486328125, 1.531158447265625, 1.65283203125, 1.774505615234375, 1.89617919921875, 2.017852783203125, 2.1395263671875, 2.261199951171875, 2.38287353515625, 2.504547119140625, 2.626220703125, 2.747894287109375, 2.86956787109375, 2.991241455078125, 3.1129150390625, 3.234588623046875, 3.35626220703125, 3.477935791015625, 3.599609375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 7.0, 6.0, 8.0, 8.0, 9.0, 16.0, 8.0, 16.0, 12.0, 28.0, 18.0, 37.0, 21.0, 20.0, 25.0, 37.0, 39.0, 34.0, 41.0, 27.0, 35.0, 32.0, 43.0, 49.0, 36.0, 39.0, 38.0, 22.0, 31.0, 36.0, 28.0, 28.0, 15.0, 27.0, 20.0, 15.0, 15.0, 12.0, 16.0, 14.0, 11.0, 5.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-25.63030433654785, -24.85382652282715, -24.077346801757812, -23.30086898803711, -22.524391174316406, -21.74791145324707, -20.971433639526367, -20.19495391845703, -19.418476104736328, -18.641998291015625, -17.86551856994629, -17.089040756225586, -16.31256103515625, -15.536083221435547, -14.759605407714844, -13.983126640319824, -13.206647872924805, -12.430169105529785, -11.653690338134766, -10.877212524414062, -10.100733757019043, -9.324254989624023, -8.54777717590332, -7.771298408508301, -6.994819641113281, -6.218340873718262, -5.4418625831604, -4.665384292602539, -3.8889055252075195, -3.112426996231079, -2.3359484672546387, -1.5594701766967773, -0.782989501953125, -0.00651097297668457, 0.7699675559997559, 1.5464460849761963, 2.3229246139526367, 3.099403142929077, 3.8758816719055176, 4.652359962463379, 5.428838729858398, 6.205317497253418, 6.981795787811279, 7.758274078369141, 8.53475284576416, 9.31123161315918, 10.087709426879883, 10.864188194274902, 11.640666961669922, 12.417145729064941, 13.193624496459961, 13.970102310180664, 14.746581077575684, 15.523059844970703, 16.299537658691406, 17.07601547241211, 17.852495193481445, 18.62897300720215, 19.405452728271484, 20.181930541992188, 20.95840835571289, 21.734888076782227, 22.51136589050293, 23.287845611572266, 24.06432342529297]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 6.0, 6.0, 8.0, 12.0, 8.0, 16.0, 17.0, 16.0, 21.0, 32.0, 24.0, 17.0, 30.0, 26.0, 28.0, 18.0, 41.0, 32.0, 53.0, 35.0, 37.0, 33.0, 31.0, 50.0, 35.0, 25.0, 30.0, 19.0, 32.0, 31.0, 24.0, 28.0, 24.0, 21.0, 24.0, 13.0, 10.0, 18.0, 13.0, 9.0, 8.0, 9.0, 4.0, 8.0, 3.0, 2.0, 5.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-28.252376556396484, -27.406330108642578, -26.56028175354004, -25.7142333984375, -24.868186950683594, -24.022140502929688, -23.17609214782715, -22.33004379272461, -21.483997344970703, -20.637950897216797, -19.791902542114258, -18.94585418701172, -18.099807739257812, -17.253761291503906, -16.407712936401367, -15.561665534973145, -14.715618133544922, -13.8695707321167, -13.023523330688477, -12.177475929260254, -11.331428527832031, -10.485381126403809, -9.639333724975586, -8.793286323547363, -7.947238922119141, -7.101191520690918, -6.255144119262695, -5.409096717834473, -4.56304931640625, -3.7170019149780273, -2.8709545135498047, -2.024907112121582, -1.1788578033447266, -0.3328104019165039, 0.5132369995117188, 1.3592844009399414, 2.205331802368164, 3.0513792037963867, 3.8974266052246094, 4.743474006652832, 5.589521408081055, 6.435568809509277, 7.2816162109375, 8.127663612365723, 8.973711013793945, 9.819758415222168, 10.66580581665039, 11.511853218078613, 12.357900619506836, 13.203948020935059, 14.049995422363281, 14.896042823791504, 15.742090225219727, 16.588138580322266, 17.434185028076172, 18.280231475830078, 19.126279830932617, 19.972328186035156, 20.818374633789062, 21.66442108154297, 22.510469436645508, 23.356517791748047, 24.202564239501953, 25.04861068725586, 25.8946590423584]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 5.0, 4.0, 2.0, 7.0, 7.0, 17.0, 35.0, 61.0, 90.0, 107.0, 209.0, 327.0, 570.0, 866.0, 1374.0, 2194.0, 3622.0, 5643.0, 8646.0, 13609.0, 21393.0, 32668.0, 49037.0, 73227.0, 105770.0, 149478.0, 203951.0, 267203.0, 327205.0, 382307.0, 414181.0, 416653.0, 388898.0, 338046.0, 275118.0, 213227.0, 157396.0, 111875.0, 77417.0, 52769.0, 35101.0, 22857.0, 14866.0, 9580.0, 6236.0, 3894.0, 2480.0, 1549.0, 969.0, 605.0, 403.0, 193.0, 141.0, 92.0, 48.0, 39.0, 14.0, 7.0, 7.0, 3.0, 0.0, 1.0, 3.0], "bins": [-18.59375, -18.01416015625, -17.4345703125, -16.85498046875, -16.275390625, -15.69580078125, -15.1162109375, -14.53662109375, -13.95703125, -13.37744140625, -12.7978515625, -12.21826171875, -11.638671875, -11.05908203125, -10.4794921875, -9.89990234375, -9.3203125, -8.74072265625, -8.1611328125, -7.58154296875, -7.001953125, -6.42236328125, -5.8427734375, -5.26318359375, -4.68359375, -4.10400390625, -3.5244140625, -2.94482421875, -2.365234375, -1.78564453125, -1.2060546875, -0.62646484375, -0.046875, 0.53271484375, 1.1123046875, 1.69189453125, 2.271484375, 2.85107421875, 3.4306640625, 4.01025390625, 4.58984375, 5.16943359375, 5.7490234375, 6.32861328125, 6.908203125, 7.48779296875, 8.0673828125, 8.64697265625, 9.2265625, 9.80615234375, 10.3857421875, 10.96533203125, 11.544921875, 12.12451171875, 12.7041015625, 13.28369140625, 13.86328125, 14.44287109375, 15.0224609375, 15.60205078125, 16.181640625, 16.76123046875, 17.3408203125, 17.92041015625, 18.5]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 6.0, 6.0, 14.0, 11.0, 5.0, 18.0, 17.0, 17.0, 13.0, 31.0, 29.0, 19.0, 24.0, 32.0, 23.0, 19.0, 34.0, 27.0, 50.0, 45.0, 32.0, 33.0, 33.0, 50.0, 40.0, 23.0, 28.0, 23.0, 34.0, 26.0, 22.0, 31.0, 24.0, 17.0, 22.0, 22.0, 8.0, 13.0, 20.0, 11.0, 7.0, 8.0, 8.0, 6.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-24.53125, -23.798828125, -23.06640625, -22.333984375, -21.6015625, -20.869140625, -20.13671875, -19.404296875, -18.671875, -17.939453125, -17.20703125, -16.474609375, -15.7421875, -15.009765625, -14.27734375, -13.544921875, -12.8125, -12.080078125, -11.34765625, -10.615234375, -9.8828125, -9.150390625, -8.41796875, -7.685546875, -6.953125, -6.220703125, -5.48828125, -4.755859375, -4.0234375, -3.291015625, -2.55859375, -1.826171875, -1.09375, -0.361328125, 0.37109375, 1.103515625, 1.8359375, 2.568359375, 3.30078125, 4.033203125, 4.765625, 5.498046875, 6.23046875, 6.962890625, 7.6953125, 8.427734375, 9.16015625, 9.892578125, 10.625, 11.357421875, 12.08984375, 12.822265625, 13.5546875, 14.287109375, 15.01953125, 15.751953125, 16.484375, 17.216796875, 17.94921875, 18.681640625, 19.4140625, 20.146484375, 20.87890625, 21.611328125, 22.34375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 19.0, 33.0, 48.0, 85.0, 152.0, 281.0, 420.0, 845.0, 1508.0, 2615.0, 4726.0, 8326.0, 14122.0, 24548.0, 40085.0, 66157.0, 103215.0, 157544.0, 225166.0, 305926.0, 384404.0, 447468.0, 475367.0, 460431.0, 405994.0, 330219.0, 249778.0, 176178.0, 118702.0, 75509.0, 46848.0, 28188.0, 16849.0, 9761.0, 5532.0, 3195.0, 1735.0, 1028.0, 536.0, 334.0, 167.0, 100.0, 67.0, 31.0, 23.0, 12.0, 5.0, 2.0, 4.0, 1.0, 2.0], "bins": [-26.46875, -25.726318359375, -24.98388671875, -24.241455078125, -23.4990234375, -22.756591796875, -22.01416015625, -21.271728515625, -20.529296875, -19.786865234375, -19.04443359375, -18.302001953125, -17.5595703125, -16.817138671875, -16.07470703125, -15.332275390625, -14.58984375, -13.847412109375, -13.10498046875, -12.362548828125, -11.6201171875, -10.877685546875, -10.13525390625, -9.392822265625, -8.650390625, -7.907958984375, -7.16552734375, -6.423095703125, -5.6806640625, -4.938232421875, -4.19580078125, -3.453369140625, -2.7109375, -1.968505859375, -1.22607421875, -0.483642578125, 0.2587890625, 1.001220703125, 1.74365234375, 2.486083984375, 3.228515625, 3.970947265625, 4.71337890625, 5.455810546875, 6.1982421875, 6.940673828125, 7.68310546875, 8.425537109375, 9.16796875, 9.910400390625, 10.65283203125, 11.395263671875, 12.1376953125, 12.880126953125, 13.62255859375, 14.364990234375, 15.107421875, 15.849853515625, 16.59228515625, 17.334716796875, 18.0771484375, 18.819580078125, 19.56201171875, 20.304443359375, 21.046875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 13.0, 14.0, 23.0, 24.0, 30.0, 42.0, 55.0, 74.0, 72.0, 87.0, 112.0, 124.0, 151.0, 170.0, 179.0, 198.0, 216.0, 207.0, 225.0, 203.0, 223.0, 199.0, 194.0, 191.0, 161.0, 167.0, 118.0, 123.0, 105.0, 83.0, 61.0, 58.0, 44.0, 41.0, 27.0, 19.0, 12.0, 5.0, 7.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5859375, -11.19873046875, -10.8115234375, -10.42431640625, -10.037109375, -9.64990234375, -9.2626953125, -8.87548828125, -8.48828125, -8.10107421875, -7.7138671875, -7.32666015625, -6.939453125, -6.55224609375, -6.1650390625, -5.77783203125, -5.390625, -5.00341796875, -4.6162109375, -4.22900390625, -3.841796875, -3.45458984375, -3.0673828125, -2.68017578125, -2.29296875, -1.90576171875, -1.5185546875, -1.13134765625, -0.744140625, -0.35693359375, 0.0302734375, 0.41748046875, 0.8046875, 1.19189453125, 1.5791015625, 1.96630859375, 2.353515625, 2.74072265625, 3.1279296875, 3.51513671875, 3.90234375, 4.28955078125, 4.6767578125, 5.06396484375, 5.451171875, 5.83837890625, 6.2255859375, 6.61279296875, 7.0, 7.38720703125, 7.7744140625, 8.16162109375, 8.548828125, 8.93603515625, 9.3232421875, 9.71044921875, 10.09765625, 10.48486328125, 10.8720703125, 11.25927734375, 11.646484375, 12.03369140625, 12.4208984375, 12.80810546875, 13.1953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 6.0, 10.0, 16.0, 20.0, 17.0, 21.0, 25.0, 22.0, 39.0, 31.0, 31.0, 28.0, 45.0, 37.0, 37.0, 42.0, 48.0, 34.0, 55.0, 36.0, 45.0, 33.0, 41.0, 36.0, 30.0, 28.0, 34.0, 26.0, 18.0, 14.0, 13.0, 13.0, 9.0, 9.0, 5.0, 7.0, 6.0, 2.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-30.24650001525879, -29.386260986328125, -28.526020050048828, -27.665781021118164, -26.8055419921875, -25.945301055908203, -25.08506202697754, -24.224822998046875, -23.364582061767578, -22.504343032836914, -21.644102096557617, -20.783863067626953, -19.923622131347656, -19.063383102416992, -18.203144073486328, -17.34290313720703, -16.482664108276367, -15.622424125671387, -14.762184143066406, -13.901945114135742, -13.041705131530762, -12.181465148925781, -11.321226119995117, -10.460986137390137, -9.600746154785156, -8.740506172180176, -7.8802666664123535, -7.020027160644531, -6.159787178039551, -5.29954719543457, -4.439307689666748, -3.579068183898926, -2.7188262939453125, -1.8585865497589111, -0.9983468055725098, -0.1381070613861084, 0.722132682800293, 1.5823726654052734, 2.4426121711730957, 3.302851676940918, 4.163091659545898, 5.023331642150879, 5.883571147918701, 6.743810653686523, 7.604050636291504, 8.464290618896484, 9.324529647827148, 10.184769630432129, 11.04500961303711, 11.90524959564209, 12.76548957824707, 13.625728607177734, 14.485968589782715, 15.346208572387695, 16.20644760131836, 17.066688537597656, 17.92692756652832, 18.787166595458984, 19.64740753173828, 20.507646560668945, 21.36788558959961, 22.228126525878906, 23.08836555480957, 23.948604583740234, 24.80884552001953]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 6.0, 4.0, 9.0, 9.0, 6.0, 10.0, 11.0, 14.0, 13.0, 10.0, 17.0, 16.0, 18.0, 33.0, 31.0, 28.0, 28.0, 31.0, 31.0, 28.0, 31.0, 25.0, 32.0, 34.0, 39.0, 34.0, 31.0, 36.0, 27.0, 32.0, 30.0, 26.0, 31.0, 30.0, 18.0, 20.0, 12.0, 28.0, 26.0, 21.0, 16.0, 15.0, 11.0, 8.0, 3.0, 5.0, 11.0, 6.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.26994514465332, -23.497737884521484, -22.72553062438965, -21.953323364257812, -21.18111801147461, -20.408910751342773, -19.636703491210938, -18.8644962310791, -18.092288970947266, -17.32008171081543, -16.547874450683594, -15.775668144226074, -15.003461837768555, -14.231254577636719, -13.459047317504883, -12.686840057373047, -11.914634704589844, -11.142427444458008, -10.370221138000488, -9.598013877868652, -8.825807571411133, -8.053600311279297, -7.281393051147461, -6.509186267852783, -5.7369794845581055, -4.964772701263428, -4.19256591796875, -3.420358657836914, -2.6481518745422363, -1.8759450912475586, -1.1037378311157227, -0.3315310478210449, 0.440673828125, 1.2128807306289673, 1.9850876331329346, 2.7572946548461914, 3.529501438140869, 4.301708221435547, 5.073915481567383, 5.8461222648620605, 6.618329048156738, 7.390535831451416, 8.162742614746094, 8.93494987487793, 9.707157135009766, 10.479363441467285, 11.251570701599121, 12.02377700805664, 12.795984268188477, 13.568191528320312, 14.340397834777832, 15.112605094909668, 15.884811401367188, 16.657018661499023, 17.42922592163086, 18.201433181762695, 18.97364044189453, 19.745847702026367, 20.518054962158203, 21.290260314941406, 22.062467575073242, 22.834674835205078, 23.606882095336914, 24.37908935546875, 25.151294708251953]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 16.0, 24.0, 50.0, 66.0, 103.0, 150.0, 232.0, 398.0, 594.0, 1012.0, 1464.0, 2241.0, 3687.0, 5697.0, 8344.0, 12604.0, 18435.0, 27045.0, 37558.0, 51217.0, 67443.0, 83648.0, 97554.0, 105544.0, 105869.0, 97464.0, 83526.0, 67205.0, 50842.0, 37261.0, 26433.0, 18156.0, 12785.0, 8298.0, 5432.0, 3572.0, 2378.0, 1492.0, 1003.0, 638.0, 418.0, 259.0, 172.0, 91.0, 57.0, 34.0, 19.0, 11.0, 3.0, 7.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-6.1875, -5.99407958984375, -5.8006591796875, -5.60723876953125, -5.413818359375, -5.22039794921875, -5.0269775390625, -4.83355712890625, -4.64013671875, -4.44671630859375, -4.2532958984375, -4.05987548828125, -3.866455078125, -3.67303466796875, -3.4796142578125, -3.28619384765625, -3.0927734375, -2.89935302734375, -2.7059326171875, -2.51251220703125, -2.319091796875, -2.12567138671875, -1.9322509765625, -1.73883056640625, -1.54541015625, -1.35198974609375, -1.1585693359375, -0.96514892578125, -0.771728515625, -0.57830810546875, -0.3848876953125, -0.19146728515625, 0.001953125, 0.19537353515625, 0.3887939453125, 0.58221435546875, 0.775634765625, 0.96905517578125, 1.1624755859375, 1.35589599609375, 1.54931640625, 1.74273681640625, 1.9361572265625, 2.12957763671875, 2.322998046875, 2.51641845703125, 2.7098388671875, 2.90325927734375, 3.0966796875, 3.29010009765625, 3.4835205078125, 3.67694091796875, 3.870361328125, 4.06378173828125, 4.2572021484375, 4.45062255859375, 4.64404296875, 4.83746337890625, 5.0308837890625, 5.22430419921875, 5.417724609375, 5.61114501953125, 5.8045654296875, 5.99798583984375, 6.19140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 5.0, 4.0, 10.0, 9.0, 7.0, 10.0, 11.0, 13.0, 13.0, 11.0, 16.0, 17.0, 19.0, 34.0, 30.0, 26.0, 29.0, 37.0, 25.0, 30.0, 29.0, 27.0, 33.0, 31.0, 39.0, 33.0, 32.0, 35.0, 26.0, 33.0, 29.0, 30.0, 30.0, 31.0, 15.0, 20.0, 15.0, 24.0, 28.0, 20.0, 16.0, 16.0, 8.0, 8.0, 4.0, 5.0, 13.0, 5.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.296875, -23.52587890625, -22.7548828125, -21.98388671875, -21.212890625, -20.44189453125, -19.6708984375, -18.89990234375, -18.12890625, -17.35791015625, -16.5869140625, -15.81591796875, -15.044921875, -14.27392578125, -13.5029296875, -12.73193359375, -11.9609375, -11.18994140625, -10.4189453125, -9.64794921875, -8.876953125, -8.10595703125, -7.3349609375, -6.56396484375, -5.79296875, -5.02197265625, -4.2509765625, -3.47998046875, -2.708984375, -1.93798828125, -1.1669921875, -0.39599609375, 0.375, 1.14599609375, 1.9169921875, 2.68798828125, 3.458984375, 4.22998046875, 5.0009765625, 5.77197265625, 6.54296875, 7.31396484375, 8.0849609375, 8.85595703125, 9.626953125, 10.39794921875, 11.1689453125, 11.93994140625, 12.7109375, 13.48193359375, 14.2529296875, 15.02392578125, 15.794921875, 16.56591796875, 17.3369140625, 18.10791015625, 18.87890625, 19.64990234375, 20.4208984375, 21.19189453125, 21.962890625, 22.73388671875, 23.5048828125, 24.27587890625, 25.046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 10.0, 18.0, 22.0, 16.0, 42.0, 46.0, 71.0, 89.0, 112.0, 174.0, 282.0, 420.0, 558.0, 878.0, 1330.0, 1962.0, 2908.0, 4381.0, 6319.0, 9854.0, 15762.0, 26979.0, 167602.0, 721185.0, 33995.0, 19055.0, 11743.0, 7508.0, 5051.0, 3297.0, 2258.0, 1465.0, 1002.0, 636.0, 440.0, 328.0, 225.0, 140.0, 92.0, 85.0, 57.0, 53.0, 19.0, 32.0, 17.0, 5.0, 8.0, 5.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-20.65625, -20.014404296875, -19.37255859375, -18.730712890625, -18.0888671875, -17.447021484375, -16.80517578125, -16.163330078125, -15.521484375, -14.879638671875, -14.23779296875, -13.595947265625, -12.9541015625, -12.312255859375, -11.67041015625, -11.028564453125, -10.38671875, -9.744873046875, -9.10302734375, -8.461181640625, -7.8193359375, -7.177490234375, -6.53564453125, -5.893798828125, -5.251953125, -4.610107421875, -3.96826171875, -3.326416015625, -2.6845703125, -2.042724609375, -1.40087890625, -0.759033203125, -0.1171875, 0.524658203125, 1.16650390625, 1.808349609375, 2.4501953125, 3.092041015625, 3.73388671875, 4.375732421875, 5.017578125, 5.659423828125, 6.30126953125, 6.943115234375, 7.5849609375, 8.226806640625, 8.86865234375, 9.510498046875, 10.15234375, 10.794189453125, 11.43603515625, 12.077880859375, 12.7197265625, 13.361572265625, 14.00341796875, 14.645263671875, 15.287109375, 15.928955078125, 16.57080078125, 17.212646484375, 17.8544921875, 18.496337890625, 19.13818359375, 19.780029296875, 20.421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 4.0, 5.0, 9.0, 8.0, 11.0, 8.0, 9.0, 18.0, 18.0, 24.0, 23.0, 26.0, 30.0, 30.0, 36.0, 35.0, 40.0, 45.0, 37.0, 41.0, 45.0, 41.0, 43.0, 35.0, 36.0, 32.0, 46.0, 31.0, 23.0, 25.0, 24.0, 32.0, 24.0, 28.0, 13.0, 22.0, 6.0, 10.0, 10.0, 9.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.96875, -20.3505859375, -19.732421875, -19.1142578125, -18.49609375, -17.8779296875, -17.259765625, -16.6416015625, -16.0234375, -15.4052734375, -14.787109375, -14.1689453125, -13.55078125, -12.9326171875, -12.314453125, -11.6962890625, -11.078125, -10.4599609375, -9.841796875, -9.2236328125, -8.60546875, -7.9873046875, -7.369140625, -6.7509765625, -6.1328125, -5.5146484375, -4.896484375, -4.2783203125, -3.66015625, -3.0419921875, -2.423828125, -1.8056640625, -1.1875, -0.5693359375, 0.048828125, 0.6669921875, 1.28515625, 1.9033203125, 2.521484375, 3.1396484375, 3.7578125, 4.3759765625, 4.994140625, 5.6123046875, 6.23046875, 6.8486328125, 7.466796875, 8.0849609375, 8.703125, 9.3212890625, 9.939453125, 10.5576171875, 11.17578125, 11.7939453125, 12.412109375, 13.0302734375, 13.6484375, 14.2666015625, 14.884765625, 15.5029296875, 16.12109375, 16.7392578125, 17.357421875, 17.9755859375, 18.59375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 4.0, 5.0, 9.0, 11.0, 17.0, 9.0, 34.0, 42.0, 54.0, 60.0, 97.0, 118.0, 200.0, 255.0, 370.0, 533.0, 758.0, 1281.0, 1867.0, 2964.0, 4609.0, 7808.0, 12922.0, 22803.0, 57387.0, 828973.0, 50563.0, 21950.0, 12529.0, 7415.0, 4596.0, 2909.0, 1817.0, 1072.0, 768.0, 513.0, 335.0, 238.0, 175.0, 125.0, 86.0, 81.0, 56.0, 44.0, 30.0, 19.0, 15.0, 10.0, 7.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.3740234375, -1.327392578125, -1.28076171875, -1.234130859375, -1.1875, -1.140869140625, -1.09423828125, -1.047607421875, -1.0009765625, -0.954345703125, -0.90771484375, -0.861083984375, -0.814453125, -0.767822265625, -0.72119140625, -0.674560546875, -0.6279296875, -0.581298828125, -0.53466796875, -0.488037109375, -0.44140625, -0.394775390625, -0.34814453125, -0.301513671875, -0.2548828125, -0.208251953125, -0.16162109375, -0.114990234375, -0.068359375, -0.021728515625, 0.02490234375, 0.071533203125, 0.1181640625, 0.164794921875, 0.21142578125, 0.258056640625, 0.3046875, 0.351318359375, 0.39794921875, 0.444580078125, 0.4912109375, 0.537841796875, 0.58447265625, 0.631103515625, 0.677734375, 0.724365234375, 0.77099609375, 0.817626953125, 0.8642578125, 0.910888671875, 0.95751953125, 1.004150390625, 1.05078125, 1.097412109375, 1.14404296875, 1.190673828125, 1.2373046875, 1.283935546875, 1.33056640625, 1.377197265625, 1.423828125, 1.470458984375, 1.51708984375, 1.563720703125, 1.6103515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 7.0, 6.0, 4.0, 10.0, 21.0, 8.0, 21.0, 38.0, 26.0, 35.0, 37.0, 56.0, 54.0, 91.0, 72.0, 76.0, 62.0, 68.0, 47.0, 51.0, 44.0, 29.0, 35.0, 19.0, 21.0, 13.0, 14.0, 16.0, 5.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.822845458984375e-05, -9.500514715909958e-05, -9.178183972835541e-05, -8.855853229761124e-05, -8.533522486686707e-05, -8.21119174361229e-05, -7.888861000537872e-05, -7.566530257463455e-05, -7.244199514389038e-05, -6.921868771314621e-05, -6.599538028240204e-05, -6.277207285165787e-05, -5.9548765420913696e-05, -5.6325457990169525e-05, -5.3102150559425354e-05, -4.987884312868118e-05, -4.665553569793701e-05, -4.343222826719284e-05, -4.020892083644867e-05, -3.69856134057045e-05, -3.376230597496033e-05, -3.0538998544216156e-05, -2.7315691113471985e-05, -2.4092383682727814e-05, -2.0869076251983643e-05, -1.764576882123947e-05, -1.44224613904953e-05, -1.1199153959751129e-05, -7.975846529006958e-06, -4.752539098262787e-06, -1.5292316675186157e-06, 1.6940757632255554e-06, 4.9173831939697266e-06, 8.140690624713898e-06, 1.1363998055458069e-05, 1.458730548620224e-05, 1.781061291694641e-05, 2.1033920347690582e-05, 2.4257227778434753e-05, 2.7480535209178925e-05, 3.0703842639923096e-05, 3.392715007066727e-05, 3.715045750141144e-05, 4.037376493215561e-05, 4.359707236289978e-05, 4.682037979364395e-05, 5.004368722438812e-05, 5.3266994655132294e-05, 5.6490302085876465e-05, 5.9713609516620636e-05, 6.293691694736481e-05, 6.616022437810898e-05, 6.938353180885315e-05, 7.260683923959732e-05, 7.583014667034149e-05, 7.905345410108566e-05, 8.227676153182983e-05, 8.5500068962574e-05, 8.872337639331818e-05, 9.194668382406235e-05, 9.516999125480652e-05, 9.839329868555069e-05, 0.00010161660611629486, 0.00010483991354703903, 0.0001080632209777832]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 9.0, 8.0, 18.0, 27.0, 46.0, 88.0, 111.0, 198.0, 314.0, 458.0, 764.0, 1076.0, 1878.0, 2880.0, 4525.0, 7211.0, 11202.0, 17471.0, 26389.0, 39716.0, 57121.0, 78431.0, 102181.0, 121126.0, 128143.0, 117852.0, 97705.0, 74093.0, 53271.0, 35926.0, 24409.0, 15785.0, 10193.0, 6663.0, 4044.0, 2686.0, 1653.0, 1079.0, 650.0, 433.0, 271.0, 167.0, 96.0, 72.0, 56.0, 25.0, 15.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-1.1708984375, -1.1368560791015625, -1.102813720703125, -1.0687713623046875, -1.03472900390625, -1.0006866455078125, -0.966644287109375, -0.9326019287109375, -0.8985595703125, -0.8645172119140625, -0.830474853515625, -0.7964324951171875, -0.76239013671875, -0.7283477783203125, -0.694305419921875, -0.6602630615234375, -0.626220703125, -0.5921783447265625, -0.558135986328125, -0.5240936279296875, -0.49005126953125, -0.4560089111328125, -0.421966552734375, -0.3879241943359375, -0.3538818359375, -0.3198394775390625, -0.285797119140625, -0.2517547607421875, -0.21771240234375, -0.1836700439453125, -0.149627685546875, -0.1155853271484375, -0.08154296875, -0.0475006103515625, -0.013458251953125, 0.0205841064453125, 0.05462646484375, 0.0886688232421875, 0.122711181640625, 0.1567535400390625, 0.1907958984375, 0.2248382568359375, 0.258880615234375, 0.2929229736328125, 0.32696533203125, 0.3610076904296875, 0.395050048828125, 0.4290924072265625, 0.463134765625, 0.4971771240234375, 0.531219482421875, 0.5652618408203125, 0.59930419921875, 0.6333465576171875, 0.667388916015625, 0.7014312744140625, 0.7354736328125, 0.7695159912109375, 0.803558349609375, 0.8376007080078125, 0.87164306640625, 0.9056854248046875, 0.939727783203125, 0.9737701416015625, 1.0078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 5.0, 7.0, 6.0, 7.0, 7.0, 4.0, 7.0, 19.0, 18.0, 14.0, 18.0, 20.0, 20.0, 28.0, 33.0, 29.0, 37.0, 47.0, 40.0, 40.0, 43.0, 53.0, 31.0, 33.0, 34.0, 41.0, 38.0, 27.0, 39.0, 35.0, 24.0, 24.0, 19.0, 22.0, 27.0, 16.0, 16.0, 13.0, 11.0, 11.0, 3.0, 10.0, 6.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.52978515625, -0.5149192810058594, -0.5000534057617188, -0.4851875305175781, -0.4703216552734375, -0.4554557800292969, -0.44058990478515625, -0.4257240295410156, -0.410858154296875, -0.3959922790527344, -0.38112640380859375, -0.3662605285644531, -0.3513946533203125, -0.3365287780761719, -0.32166290283203125, -0.3067970275878906, -0.29193115234375, -0.2770652770996094, -0.26219940185546875, -0.24733352661132812, -0.2324676513671875, -0.21760177612304688, -0.20273590087890625, -0.18787002563476562, -0.173004150390625, -0.15813827514648438, -0.14327239990234375, -0.12840652465820312, -0.1135406494140625, -0.09867477416992188, -0.08380889892578125, -0.06894302368164062, -0.0540771484375, -0.039211273193359375, -0.02434539794921875, -0.009479522705078125, 0.0053863525390625, 0.020252227783203125, 0.03511810302734375, 0.049983978271484375, 0.064849853515625, 0.07971572875976562, 0.09458160400390625, 0.10944747924804688, 0.1243133544921875, 0.13917922973632812, 0.15404510498046875, 0.16891098022460938, 0.18377685546875, 0.19864273071289062, 0.21350860595703125, 0.22837448120117188, 0.2432403564453125, 0.2581062316894531, 0.27297210693359375, 0.2878379821777344, 0.302703857421875, 0.3175697326660156, 0.33243560791015625, 0.3473014831542969, 0.3621673583984375, 0.3770332336425781, 0.39189910888671875, 0.4067649841308594, 0.421630859375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 13.0, 6.0, 16.0, 19.0, 18.0, 25.0, 16.0, 28.0, 42.0, 35.0, 28.0, 39.0, 40.0, 39.0, 43.0, 32.0, 52.0, 46.0, 44.0, 48.0, 35.0, 33.0, 40.0, 37.0, 27.0, 35.0, 32.0, 20.0, 17.0, 13.0, 21.0, 9.0, 4.0, 5.0, 8.0, 4.0, 7.0, 5.0, 2.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.643497467041016, -30.758874893188477, -29.874250411987305, -28.989627838134766, -28.105003356933594, -27.220380783081055, -26.335758209228516, -25.451133728027344, -24.566509246826172, -23.681886672973633, -22.79726219177246, -21.912639617919922, -21.02801513671875, -20.14339256286621, -19.258769989013672, -18.3741455078125, -17.48952293395996, -16.604900360107422, -15.72027587890625, -14.835653305053711, -13.951028823852539, -13.06640625, -12.181782722473145, -11.297159194946289, -10.412535667419434, -9.527912139892578, -8.643288612365723, -7.758665561676025, -6.87404203414917, -5.9894185066223145, -5.104795455932617, -4.220171928405762, -3.3355484008789062, -2.450924873352051, -1.5663015842437744, -0.681678295135498, 0.20294523239135742, 1.087568759918213, 1.9721918106079102, 2.8568153381347656, 3.741438865661621, 4.626062393188477, 5.510685920715332, 6.395308971405029, 7.279932498931885, 8.164556503295898, 9.049179077148438, 9.933802604675293, 10.818426132202148, 11.703049659729004, 12.58767318725586, 13.472295761108398, 14.35692024230957, 15.24154281616211, 16.12616729736328, 17.01078987121582, 17.89541244506836, 18.7800350189209, 19.66465950012207, 20.54928207397461, 21.43390655517578, 22.31852912902832, 23.20315170288086, 24.08777618408203, 24.972400665283203]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 3.0, 5.0, 7.0, 11.0, 5.0, 11.0, 10.0, 13.0, 12.0, 13.0, 18.0, 13.0, 16.0, 30.0, 32.0, 29.0, 24.0, 40.0, 22.0, 35.0, 28.0, 31.0, 29.0, 29.0, 43.0, 28.0, 35.0, 33.0, 36.0, 28.0, 36.0, 24.0, 29.0, 31.0, 23.0, 15.0, 16.0, 24.0, 22.0, 25.0, 14.0, 20.0, 11.0, 5.0, 4.0, 7.0, 13.0, 3.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.720094680786133, -23.941967010498047, -23.16383934020996, -22.385711669921875, -21.607582092285156, -20.82945442199707, -20.051326751708984, -19.2731990814209, -18.495071411132812, -17.716943740844727, -16.93881607055664, -16.160686492919922, -15.382559776306152, -14.60443115234375, -13.826303482055664, -13.048175811767578, -12.270047187805176, -11.49191951751709, -10.713790893554688, -9.935663223266602, -9.157535552978516, -8.37940788269043, -7.601279258728027, -6.823151588439941, -6.045023441314697, -5.266895294189453, -4.488767623901367, -3.710639476776123, -2.932511568069458, -2.154383659362793, -1.3762555122375488, -0.5981278419494629, 0.18000030517578125, 0.9581282734870911, 1.7362562417984009, 2.5143842697143555, 3.2925121784210205, 4.0706400871276855, 4.84876823425293, 5.626895904541016, 6.40502405166626, 7.183152198791504, 7.96127986907959, 8.739408493041992, 9.517536163330078, 10.295663833618164, 11.07379150390625, 11.851919174194336, 12.630047798156738, 13.408175468444824, 14.186304092407227, 14.964431762695312, 15.742559432983398, 16.520687103271484, 17.298816680908203, 18.076942443847656, 18.855072021484375, 19.63319969177246, 20.411327362060547, 21.189456939697266, 21.96758460998535, 22.745712280273438, 23.523839950561523, 24.30196762084961, 25.080095291137695]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 5.0, 12.0, 26.0, 39.0, 53.0, 91.0, 168.0, 239.0, 382.0, 572.0, 862.0, 1418.0, 2101.0, 3125.0, 4697.0, 7187.0, 10206.0, 14584.0, 20008.0, 27101.0, 36231.0, 46361.0, 57024.0, 67317.0, 76638.0, 83795.0, 85711.0, 84820.0, 80603.0, 72113.0, 62484.0, 51322.0, 41158.0, 31350.0, 23571.0, 17177.0, 12538.0, 8578.0, 5726.0, 3885.0, 2552.0, 1734.0, 1104.0, 692.0, 443.0, 289.0, 175.0, 95.0, 75.0, 51.0, 35.0, 14.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-15.578125, -15.071533203125, -14.56494140625, -14.058349609375, -13.5517578125, -13.045166015625, -12.53857421875, -12.031982421875, -11.525390625, -11.018798828125, -10.51220703125, -10.005615234375, -9.4990234375, -8.992431640625, -8.48583984375, -7.979248046875, -7.47265625, -6.966064453125, -6.45947265625, -5.952880859375, -5.4462890625, -4.939697265625, -4.43310546875, -3.926513671875, -3.419921875, -2.913330078125, -2.40673828125, -1.900146484375, -1.3935546875, -0.886962890625, -0.38037109375, 0.126220703125, 0.6328125, 1.139404296875, 1.64599609375, 2.152587890625, 2.6591796875, 3.165771484375, 3.67236328125, 4.178955078125, 4.685546875, 5.192138671875, 5.69873046875, 6.205322265625, 6.7119140625, 7.218505859375, 7.72509765625, 8.231689453125, 8.73828125, 9.244873046875, 9.75146484375, 10.258056640625, 10.7646484375, 11.271240234375, 11.77783203125, 12.284423828125, 12.791015625, 13.297607421875, 13.80419921875, 14.310791015625, 14.8173828125, 15.323974609375, 15.83056640625, 16.337158203125, 16.84375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 1.0, 3.0, 5.0, 7.0, 10.0, 7.0, 9.0, 13.0, 11.0, 13.0, 15.0, 17.0, 13.0, 22.0, 28.0, 29.0, 32.0, 20.0, 40.0, 23.0, 35.0, 26.0, 36.0, 26.0, 34.0, 42.0, 25.0, 38.0, 33.0, 31.0, 29.0, 36.0, 23.0, 30.0, 30.0, 22.0, 18.0, 16.0, 21.0, 25.0, 20.0, 16.0, 19.0, 11.0, 5.0, 5.0, 9.0, 10.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.90625, -23.151611328125, -22.39697265625, -21.642333984375, -20.8876953125, -20.133056640625, -19.37841796875, -18.623779296875, -17.869140625, -17.114501953125, -16.35986328125, -15.605224609375, -14.8505859375, -14.095947265625, -13.34130859375, -12.586669921875, -11.83203125, -11.077392578125, -10.32275390625, -9.568115234375, -8.8134765625, -8.058837890625, -7.30419921875, -6.549560546875, -5.794921875, -5.040283203125, -4.28564453125, -3.531005859375, -2.7763671875, -2.021728515625, -1.26708984375, -0.512451171875, 0.2421875, 0.996826171875, 1.75146484375, 2.506103515625, 3.2607421875, 4.015380859375, 4.77001953125, 5.524658203125, 6.279296875, 7.033935546875, 7.78857421875, 8.543212890625, 9.2978515625, 10.052490234375, 10.80712890625, 11.561767578125, 12.31640625, 13.071044921875, 13.82568359375, 14.580322265625, 15.3349609375, 16.089599609375, 16.84423828125, 17.598876953125, 18.353515625, 19.108154296875, 19.86279296875, 20.617431640625, 21.3720703125, 22.126708984375, 22.88134765625, 23.635986328125, 24.390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 11.0, 8.0, 22.0, 46.0, 65.0, 107.0, 171.0, 275.0, 468.0, 794.0, 1160.0, 1801.0, 2720.0, 4272.0, 6435.0, 9451.0, 13614.0, 19451.0, 26840.0, 35967.0, 46534.0, 58979.0, 70041.0, 80267.0, 87229.0, 89786.0, 88658.0, 82629.0, 73086.0, 61715.0, 50199.0, 39046.0, 29614.0, 21299.0, 15044.0, 10459.0, 7114.0, 4693.0, 2994.0, 1989.0, 1310.0, 823.0, 513.0, 315.0, 209.0, 120.0, 87.0, 49.0, 31.0, 15.0, 12.0, 10.0, 5.0, 2.0, 3.0, 3.0], "bins": [-17.078125, -16.5704345703125, -16.062744140625, -15.5550537109375, -15.04736328125, -14.5396728515625, -14.031982421875, -13.5242919921875, -13.0166015625, -12.5089111328125, -12.001220703125, -11.4935302734375, -10.98583984375, -10.4781494140625, -9.970458984375, -9.4627685546875, -8.955078125, -8.4473876953125, -7.939697265625, -7.4320068359375, -6.92431640625, -6.4166259765625, -5.908935546875, -5.4012451171875, -4.8935546875, -4.3858642578125, -3.878173828125, -3.3704833984375, -2.86279296875, -2.3551025390625, -1.847412109375, -1.3397216796875, -0.83203125, -0.3243408203125, 0.183349609375, 0.6910400390625, 1.19873046875, 1.7064208984375, 2.214111328125, 2.7218017578125, 3.2294921875, 3.7371826171875, 4.244873046875, 4.7525634765625, 5.26025390625, 5.7679443359375, 6.275634765625, 6.7833251953125, 7.291015625, 7.7987060546875, 8.306396484375, 8.8140869140625, 9.32177734375, 9.8294677734375, 10.337158203125, 10.8448486328125, 11.3525390625, 11.8602294921875, 12.367919921875, 12.8756103515625, 13.38330078125, 13.8909912109375, 14.398681640625, 14.9063720703125, 15.4140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 3.0, 8.0, 11.0, 9.0, 16.0, 17.0, 15.0, 17.0, 28.0, 32.0, 41.0, 34.0, 29.0, 28.0, 36.0, 59.0, 38.0, 45.0, 39.0, 45.0, 39.0, 51.0, 42.0, 36.0, 28.0, 41.0, 29.0, 37.0, 24.0, 27.0, 19.0, 11.0, 10.0, 13.0, 8.0, 5.0, 10.0, 6.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.109375, -17.49658203125, -16.8837890625, -16.27099609375, -15.658203125, -15.04541015625, -14.4326171875, -13.81982421875, -13.20703125, -12.59423828125, -11.9814453125, -11.36865234375, -10.755859375, -10.14306640625, -9.5302734375, -8.91748046875, -8.3046875, -7.69189453125, -7.0791015625, -6.46630859375, -5.853515625, -5.24072265625, -4.6279296875, -4.01513671875, -3.40234375, -2.78955078125, -2.1767578125, -1.56396484375, -0.951171875, -0.33837890625, 0.2744140625, 0.88720703125, 1.5, 2.11279296875, 2.7255859375, 3.33837890625, 3.951171875, 4.56396484375, 5.1767578125, 5.78955078125, 6.40234375, 7.01513671875, 7.6279296875, 8.24072265625, 8.853515625, 9.46630859375, 10.0791015625, 10.69189453125, 11.3046875, 11.91748046875, 12.5302734375, 13.14306640625, 13.755859375, 14.36865234375, 14.9814453125, 15.59423828125, 16.20703125, 16.81982421875, 17.4326171875, 18.04541015625, 18.658203125, 19.27099609375, 19.8837890625, 20.49658203125, 21.109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 8.0, 10.0, 19.0, 9.0, 43.0, 58.0, 84.0, 122.0, 221.0, 316.0, 536.0, 853.0, 1383.0, 2371.0, 3968.0, 6597.0, 10802.0, 17719.0, 28864.0, 45558.0, 68140.0, 93097.0, 117779.0, 131816.0, 131266.0, 115462.0, 91177.0, 65316.0, 44234.0, 27668.0, 17175.0, 10257.0, 6094.0, 3674.0, 2259.0, 1342.0, 860.0, 492.0, 312.0, 227.0, 121.0, 76.0, 53.0, 36.0, 19.0, 24.0, 14.0, 11.0, 5.0, 2.0, 5.0, 1.0, 0.0, 2.0], "bins": [-10.7265625, -10.41064453125, -10.0947265625, -9.77880859375, -9.462890625, -9.14697265625, -8.8310546875, -8.51513671875, -8.19921875, -7.88330078125, -7.5673828125, -7.25146484375, -6.935546875, -6.61962890625, -6.3037109375, -5.98779296875, -5.671875, -5.35595703125, -5.0400390625, -4.72412109375, -4.408203125, -4.09228515625, -3.7763671875, -3.46044921875, -3.14453125, -2.82861328125, -2.5126953125, -2.19677734375, -1.880859375, -1.56494140625, -1.2490234375, -0.93310546875, -0.6171875, -0.30126953125, 0.0146484375, 0.33056640625, 0.646484375, 0.96240234375, 1.2783203125, 1.59423828125, 1.91015625, 2.22607421875, 2.5419921875, 2.85791015625, 3.173828125, 3.48974609375, 3.8056640625, 4.12158203125, 4.4375, 4.75341796875, 5.0693359375, 5.38525390625, 5.701171875, 6.01708984375, 6.3330078125, 6.64892578125, 6.96484375, 7.28076171875, 7.5966796875, 7.91259765625, 8.228515625, 8.54443359375, 8.8603515625, 9.17626953125, 9.4921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 4.0, 4.0, 11.0, 16.0, 15.0, 20.0, 33.0, 24.0, 39.0, 46.0, 55.0, 46.0, 53.0, 70.0, 68.0, 62.0, 62.0, 64.0, 38.0, 43.0, 43.0, 35.0, 36.0, 20.0, 26.0, 12.0, 13.0, 11.0, 10.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010528564453125, -0.0010097026824951172, -0.0009665489196777344, -0.0009233951568603516, -0.0008802413940429688, -0.0008370876312255859, -0.0007939338684082031, -0.0007507801055908203, -0.0007076263427734375, -0.0006644725799560547, -0.0006213188171386719, -0.0005781650543212891, -0.0005350112915039062, -0.0004918575286865234, -0.0004487037658691406, -0.0004055500030517578, -0.000362396240234375, -0.0003192424774169922, -0.0002760887145996094, -0.00023293495178222656, -0.00018978118896484375, -0.00014662742614746094, -0.00010347366333007812, -6.031990051269531e-05, -1.71661376953125e-05, 2.5987625122070312e-05, 6.914138793945312e-05, 0.00011229515075683594, 0.00015544891357421875, 0.00019860267639160156, 0.00024175643920898438, 0.0002849102020263672, 0.00032806396484375, 0.0003712177276611328, 0.0004143714904785156, 0.00045752525329589844, 0.0005006790161132812, 0.0005438327789306641, 0.0005869865417480469, 0.0006301403045654297, 0.0006732940673828125, 0.0007164478302001953, 0.0007596015930175781, 0.0008027553558349609, 0.0008459091186523438, 0.0008890628814697266, 0.0009322166442871094, 0.0009753704071044922, 0.001018524169921875, 0.0010616779327392578, 0.0011048316955566406, 0.0011479854583740234, 0.0011911392211914062, 0.001234292984008789, 0.0012774467468261719, 0.0013206005096435547, 0.0013637542724609375, 0.0014069080352783203, 0.0014500617980957031, 0.001493215560913086, 0.0015363693237304688, 0.0015795230865478516, 0.0016226768493652344, 0.0016658306121826172, 0.001708984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 14.0, 19.0, 24.0, 29.0, 49.0, 64.0, 106.0, 135.0, 251.0, 384.0, 635.0, 1024.0, 1689.0, 2907.0, 4940.0, 8529.0, 14682.0, 25346.0, 41699.0, 65526.0, 95189.0, 124760.0, 143681.0, 142316.0, 122331.0, 92349.0, 62897.0, 39536.0, 24008.0, 14025.0, 7928.0, 4599.0, 2700.0, 1614.0, 963.0, 547.0, 364.0, 228.0, 151.0, 105.0, 73.0, 45.0, 38.0, 20.0, 17.0, 5.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0546875, -11.6773681640625, -11.300048828125, -10.9227294921875, -10.54541015625, -10.1680908203125, -9.790771484375, -9.4134521484375, -9.0361328125, -8.6588134765625, -8.281494140625, -7.9041748046875, -7.52685546875, -7.1495361328125, -6.772216796875, -6.3948974609375, -6.017578125, -5.6402587890625, -5.262939453125, -4.8856201171875, -4.50830078125, -4.1309814453125, -3.753662109375, -3.3763427734375, -2.9990234375, -2.6217041015625, -2.244384765625, -1.8670654296875, -1.48974609375, -1.1124267578125, -0.735107421875, -0.3577880859375, 0.01953125, 0.3968505859375, 0.774169921875, 1.1514892578125, 1.52880859375, 1.9061279296875, 2.283447265625, 2.6607666015625, 3.0380859375, 3.4154052734375, 3.792724609375, 4.1700439453125, 4.54736328125, 4.9246826171875, 5.302001953125, 5.6793212890625, 6.056640625, 6.4339599609375, 6.811279296875, 7.1885986328125, 7.56591796875, 7.9432373046875, 8.320556640625, 8.6978759765625, 9.0751953125, 9.4525146484375, 9.829833984375, 10.2071533203125, 10.58447265625, 10.9617919921875, 11.339111328125, 11.7164306640625, 12.09375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 6.0, 14.0, 12.0, 12.0, 15.0, 16.0, 24.0, 28.0, 34.0, 33.0, 44.0, 47.0, 50.0, 57.0, 72.0, 58.0, 54.0, 60.0, 49.0, 45.0, 40.0, 37.0, 34.0, 35.0, 29.0, 20.0, 15.0, 14.0, 9.0, 6.0, 6.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0625, -4.88653564453125, -4.7105712890625, -4.53460693359375, -4.358642578125, -4.18267822265625, -4.0067138671875, -3.83074951171875, -3.65478515625, -3.47882080078125, -3.3028564453125, -3.12689208984375, -2.950927734375, -2.77496337890625, -2.5989990234375, -2.42303466796875, -2.2470703125, -2.07110595703125, -1.8951416015625, -1.71917724609375, -1.543212890625, -1.36724853515625, -1.1912841796875, -1.01531982421875, -0.83935546875, -0.66339111328125, -0.4874267578125, -0.31146240234375, -0.135498046875, 0.04046630859375, 0.2164306640625, 0.39239501953125, 0.568359375, 0.74432373046875, 0.9202880859375, 1.09625244140625, 1.272216796875, 1.44818115234375, 1.6241455078125, 1.80010986328125, 1.97607421875, 2.15203857421875, 2.3280029296875, 2.50396728515625, 2.679931640625, 2.85589599609375, 3.0318603515625, 3.20782470703125, 3.3837890625, 3.55975341796875, 3.7357177734375, 3.91168212890625, 4.087646484375, 4.26361083984375, 4.4395751953125, 4.61553955078125, 4.79150390625, 4.96746826171875, 5.1434326171875, 5.31939697265625, 5.495361328125, 5.67132568359375, 5.8472900390625, 6.02325439453125, 6.19921875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 11.0, 9.0, 12.0, 25.0, 26.0, 22.0, 15.0, 23.0, 26.0, 32.0, 46.0, 35.0, 41.0, 44.0, 52.0, 50.0, 38.0, 43.0, 46.0, 41.0, 37.0, 41.0, 39.0, 38.0, 37.0, 27.0, 19.0, 22.0, 15.0, 18.0, 11.0, 8.0, 2.0, 9.0, 10.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-30.67168426513672, -29.784299850463867, -28.896913528442383, -28.00952911376953, -27.12214469909668, -26.234758377075195, -25.347373962402344, -24.45998764038086, -23.572603225708008, -22.685218811035156, -21.797832489013672, -20.91044807434082, -20.02306365966797, -19.135677337646484, -18.248292922973633, -17.36090850830078, -16.473522186279297, -15.586136817932129, -14.698752403259277, -13.81136703491211, -12.923981666564941, -12.036596298217773, -11.149211883544922, -10.261826515197754, -9.374443054199219, -8.48705768585205, -7.599672794342041, -6.712287902832031, -5.824902534484863, -4.9375176429748535, -4.050132751464844, -3.162747383117676, -2.275362014770508, -1.387976884841919, -0.5005918741226196, 0.3867931365966797, 1.2741782665252686, 2.1615633964538574, 3.048948287963867, 3.936333656311035, 4.823718547821045, 5.711103439331055, 6.598488807678223, 7.485873699188232, 8.373258590698242, 9.26064395904541, 10.148029327392578, 11.03541374206543, 11.922799110412598, 12.810184478759766, 13.697568893432617, 14.584954261779785, 15.472339630126953, 16.359724044799805, 17.247108459472656, 18.13449478149414, 19.021879196166992, 19.909263610839844, 20.796649932861328, 21.68403434753418, 22.57141876220703, 23.458805084228516, 24.346189498901367, 25.23357391357422, 26.120960235595703]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 10.0, 6.0, 5.0, 3.0, 10.0, 13.0, 11.0, 16.0, 12.0, 16.0, 20.0, 16.0, 14.0, 38.0, 31.0, 27.0, 35.0, 32.0, 34.0, 29.0, 25.0, 30.0, 33.0, 38.0, 44.0, 40.0, 35.0, 40.0, 33.0, 28.0, 35.0, 33.0, 27.0, 27.0, 21.0, 21.0, 19.0, 15.0, 12.0, 14.0, 12.0, 14.0, 10.0, 9.0, 3.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.14889907836914, -25.28321647644043, -24.41753387451172, -23.551849365234375, -22.686166763305664, -21.820484161376953, -20.954801559448242, -20.08911895751953, -19.223434448242188, -18.357751846313477, -17.492069244384766, -16.626384735107422, -15.760702133178711, -14.89501953125, -14.029336929321289, -13.163654327392578, -12.297971725463867, -11.432289123535156, -10.566605567932129, -9.700922966003418, -8.83523941040039, -7.96955680847168, -7.103874206542969, -6.2381911277771, -5.3725080490112305, -4.506824970245361, -3.6411421298980713, -2.7754592895507812, -1.909776210784912, -1.044093132019043, -0.17841053009033203, 0.6872725486755371, 1.5529556274414062, 2.4186387062072754, 3.2843215465545654, 4.1500043869018555, 5.015687465667725, 5.881370544433594, 6.747053146362305, 7.612736225128174, 8.478419303894043, 9.344101905822754, 10.209785461425781, 11.075468063354492, 11.941150665283203, 12.80683422088623, 13.672516822814941, 14.538200378417969, 15.40388298034668, 16.26956558227539, 17.1352481842041, 18.000930786132812, 18.866615295410156, 19.732297897338867, 20.597980499267578, 21.46366310119629, 22.329345703125, 23.19502830505371, 24.060710906982422, 24.926395416259766, 25.792078018188477, 26.657760620117188, 27.5234432220459, 28.38912582397461, 29.254810333251953]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 4.0, 9.0, 4.0, 9.0, 20.0, 45.0, 78.0, 132.0, 228.0, 386.0, 610.0, 990.0, 1664.0, 2737.0, 4537.0, 7396.0, 12185.0, 19708.0, 31434.0, 49506.0, 76303.0, 114807.0, 166750.0, 230963.0, 303806.0, 374717.0, 424980.0, 448868.0, 434378.0, 387794.0, 319232.0, 246137.0, 179279.0, 124580.0, 84231.0, 54454.0, 34896.0, 21599.0, 13606.0, 8378.0, 5067.0, 3136.0, 1783.0, 1135.0, 681.0, 407.0, 259.0, 133.0, 103.0, 53.0, 35.0, 23.0, 21.0, 9.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.765625, -19.119873046875, -18.47412109375, -17.828369140625, -17.1826171875, -16.536865234375, -15.89111328125, -15.245361328125, -14.599609375, -13.953857421875, -13.30810546875, -12.662353515625, -12.0166015625, -11.370849609375, -10.72509765625, -10.079345703125, -9.43359375, -8.787841796875, -8.14208984375, -7.496337890625, -6.8505859375, -6.204833984375, -5.55908203125, -4.913330078125, -4.267578125, -3.621826171875, -2.97607421875, -2.330322265625, -1.6845703125, -1.038818359375, -0.39306640625, 0.252685546875, 0.8984375, 1.544189453125, 2.18994140625, 2.835693359375, 3.4814453125, 4.127197265625, 4.77294921875, 5.418701171875, 6.064453125, 6.710205078125, 7.35595703125, 8.001708984375, 8.6474609375, 9.293212890625, 9.93896484375, 10.584716796875, 11.23046875, 11.876220703125, 12.52197265625, 13.167724609375, 13.8134765625, 14.459228515625, 15.10498046875, 15.750732421875, 16.396484375, 17.042236328125, 17.68798828125, 18.333740234375, 18.9794921875, 19.625244140625, 20.27099609375, 20.916748046875, 21.5625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 10.0, 7.0, 3.0, 7.0, 7.0, 14.0, 11.0, 14.0, 14.0, 16.0, 18.0, 18.0, 15.0, 33.0, 30.0, 35.0, 39.0, 25.0, 38.0, 28.0, 28.0, 20.0, 42.0, 37.0, 41.0, 37.0, 40.0, 39.0, 30.0, 26.0, 34.0, 40.0, 29.0, 20.0, 23.0, 25.0, 23.0, 17.0, 6.0, 10.0, 12.0, 17.0, 11.0, 8.0, 1.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.296875, -22.5283203125, -21.759765625, -20.9912109375, -20.22265625, -19.4541015625, -18.685546875, -17.9169921875, -17.1484375, -16.3798828125, -15.611328125, -14.8427734375, -14.07421875, -13.3056640625, -12.537109375, -11.7685546875, -11.0, -10.2314453125, -9.462890625, -8.6943359375, -7.92578125, -7.1572265625, -6.388671875, -5.6201171875, -4.8515625, -4.0830078125, -3.314453125, -2.5458984375, -1.77734375, -1.0087890625, -0.240234375, 0.5283203125, 1.296875, 2.0654296875, 2.833984375, 3.6025390625, 4.37109375, 5.1396484375, 5.908203125, 6.6767578125, 7.4453125, 8.2138671875, 8.982421875, 9.7509765625, 10.51953125, 11.2880859375, 12.056640625, 12.8251953125, 13.59375, 14.3623046875, 15.130859375, 15.8994140625, 16.66796875, 17.4365234375, 18.205078125, 18.9736328125, 19.7421875, 20.5107421875, 21.279296875, 22.0478515625, 22.81640625, 23.5849609375, 24.353515625, 25.1220703125, 25.890625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 12.0, 6.0, 25.0, 27.0, 47.0, 62.0, 131.0, 206.0, 373.0, 559.0, 897.0, 1505.0, 2432.0, 3811.0, 6219.0, 9800.0, 15367.0, 23716.0, 36637.0, 54675.0, 80153.0, 114323.0, 156314.0, 207545.0, 263693.0, 316918.0, 361214.0, 386821.0, 390399.0, 369271.0, 329439.0, 279303.0, 222557.0, 169974.0, 125484.0, 88487.0, 60963.0, 41200.0, 26743.0, 17261.0, 11140.0, 6912.0, 4451.0, 2769.0, 1757.0, 1035.0, 623.0, 413.0, 243.0, 152.0, 79.0, 51.0, 46.0, 23.0, 20.0, 2.0, 5.0, 5.0, 0.0, 1.0], "bins": [-20.0, -19.377685546875, -18.75537109375, -18.133056640625, -17.5107421875, -16.888427734375, -16.26611328125, -15.643798828125, -15.021484375, -14.399169921875, -13.77685546875, -13.154541015625, -12.5322265625, -11.909912109375, -11.28759765625, -10.665283203125, -10.04296875, -9.420654296875, -8.79833984375, -8.176025390625, -7.5537109375, -6.931396484375, -6.30908203125, -5.686767578125, -5.064453125, -4.442138671875, -3.81982421875, -3.197509765625, -2.5751953125, -1.952880859375, -1.33056640625, -0.708251953125, -0.0859375, 0.536376953125, 1.15869140625, 1.781005859375, 2.4033203125, 3.025634765625, 3.64794921875, 4.270263671875, 4.892578125, 5.514892578125, 6.13720703125, 6.759521484375, 7.3818359375, 8.004150390625, 8.62646484375, 9.248779296875, 9.87109375, 10.493408203125, 11.11572265625, 11.738037109375, 12.3603515625, 12.982666015625, 13.60498046875, 14.227294921875, 14.849609375, 15.471923828125, 16.09423828125, 16.716552734375, 17.3388671875, 17.961181640625, 18.58349609375, 19.205810546875, 19.828125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 8.0, 7.0, 11.0, 9.0, 19.0, 32.0, 29.0, 33.0, 47.0, 59.0, 64.0, 106.0, 122.0, 119.0, 138.0, 152.0, 146.0, 214.0, 206.0, 205.0, 198.0, 253.0, 226.0, 208.0, 186.0, 191.0, 176.0, 145.0, 142.0, 118.0, 91.0, 74.0, 79.0, 68.0, 54.0, 34.0, 22.0, 25.0, 17.0, 18.0, 13.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.3046875, -12.9056396484375, -12.506591796875, -12.1075439453125, -11.70849609375, -11.3094482421875, -10.910400390625, -10.5113525390625, -10.1123046875, -9.7132568359375, -9.314208984375, -8.9151611328125, -8.51611328125, -8.1170654296875, -7.718017578125, -7.3189697265625, -6.919921875, -6.5208740234375, -6.121826171875, -5.7227783203125, -5.32373046875, -4.9246826171875, -4.525634765625, -4.1265869140625, -3.7275390625, -3.3284912109375, -2.929443359375, -2.5303955078125, -2.13134765625, -1.7322998046875, -1.333251953125, -0.9342041015625, -0.53515625, -0.1361083984375, 0.262939453125, 0.6619873046875, 1.06103515625, 1.4600830078125, 1.859130859375, 2.2581787109375, 2.6572265625, 3.0562744140625, 3.455322265625, 3.8543701171875, 4.25341796875, 4.6524658203125, 5.051513671875, 5.4505615234375, 5.849609375, 6.2486572265625, 6.647705078125, 7.0467529296875, 7.44580078125, 7.8448486328125, 8.243896484375, 8.6429443359375, 9.0419921875, 9.4410400390625, 9.840087890625, 10.2391357421875, 10.63818359375, 11.0372314453125, 11.436279296875, 11.8353271484375, 12.234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 3.0, 4.0, 13.0, 12.0, 7.0, 15.0, 11.0, 20.0, 18.0, 18.0, 31.0, 23.0, 30.0, 19.0, 27.0, 37.0, 33.0, 33.0, 27.0, 48.0, 40.0, 51.0, 53.0, 26.0, 43.0, 26.0, 25.0, 35.0, 42.0, 24.0, 18.0, 21.0, 27.0, 20.0, 10.0, 16.0, 15.0, 10.0, 12.0, 7.0, 10.0, 7.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 5.0, 1.0], "bins": [-26.77130889892578, -26.007795333862305, -25.244281768798828, -24.48076629638672, -23.717252731323242, -22.953739166259766, -22.19022560119629, -21.426712036132812, -20.663196563720703, -19.899682998657227, -19.13616943359375, -18.37265396118164, -17.609140396118164, -16.845626831054688, -16.08211326599121, -15.318599700927734, -14.555086135864258, -13.791572570800781, -13.028058052062988, -12.264544486999512, -11.501029968261719, -10.737516403198242, -9.974002838134766, -9.210489273071289, -8.446974754333496, -7.683460712432861, -6.919946670532227, -6.15643310546875, -5.392919063568115, -4.6294050216674805, -3.865891456604004, -3.102377414703369, -2.3388614654541016, -1.5753475427627563, -0.8118336200714111, -0.04831981658935547, 0.7151942253112793, 1.478708267211914, 2.2422218322753906, 3.0057358741760254, 3.76924991607666, 4.532763957977295, 5.29627799987793, 6.059791564941406, 6.823305606842041, 7.586819648742676, 8.350333213806152, 9.113847732543945, 9.877361297607422, 10.640874862670898, 11.404389381408691, 12.167902946472168, 12.931417465209961, 13.694931030273438, 14.458444595336914, 15.22195816040039, 15.985472679138184, 16.748987197875977, 17.512500762939453, 18.27601432800293, 19.039527893066406, 19.803043365478516, 20.56655502319336, 21.33007049560547, 22.093584060668945]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 4.0, 7.0, 7.0, 8.0, 7.0, 8.0, 12.0, 19.0, 19.0, 17.0, 27.0, 18.0, 26.0, 23.0, 32.0, 33.0, 24.0, 34.0, 36.0, 41.0, 41.0, 34.0, 50.0, 55.0, 38.0, 43.0, 33.0, 30.0, 35.0, 26.0, 36.0, 20.0, 28.0, 28.0, 25.0, 17.0, 5.0, 11.0, 7.0, 13.0, 11.0, 9.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.928504943847656, -26.996150970458984, -26.063796997070312, -25.131441116333008, -24.199087142944336, -23.266733169555664, -22.33437728881836, -21.402023315429688, -20.469669342041016, -19.537315368652344, -18.604961395263672, -17.672605514526367, -16.740251541137695, -15.807897567749023, -14.875542640686035, -13.943187713623047, -13.010833740234375, -12.078479766845703, -11.146124839782715, -10.213769912719727, -9.281415939331055, -8.349061965942383, -7.4167070388793945, -6.4843525886535645, -5.551998138427734, -4.619643688201904, -3.687289237976074, -2.754934787750244, -1.822580337524414, -0.890225887298584, 0.042128562927246094, 0.9744830131530762, 1.906839370727539, 2.839193820953369, 3.771548271179199, 4.703902721405029, 5.636257171630859, 6.5686116218566895, 7.5009660720825195, 8.433320999145508, 9.36567497253418, 10.298028945922852, 11.23038387298584, 12.162738800048828, 13.0950927734375, 14.027446746826172, 14.95980167388916, 15.892156600952148, 16.82451057434082, 17.756864547729492, 18.689220428466797, 19.62157440185547, 20.55392837524414, 21.486282348632812, 22.418636322021484, 23.35099220275879, 24.28334617614746, 25.215700149536133, 26.148056030273438, 27.08041000366211, 28.01276397705078, 28.945117950439453, 29.877471923828125, 30.80982780456543, 31.7421817779541]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 6.0, 11.0, 22.0, 31.0, 50.0, 85.0, 138.0, 183.0, 317.0, 466.0, 685.0, 1076.0, 1726.0, 2535.0, 4087.0, 6243.0, 9229.0, 13838.0, 20438.0, 29338.0, 41030.0, 55222.0, 71862.0, 87981.0, 101186.0, 107353.0, 104368.0, 94102.0, 78984.0, 62254.0, 46460.0, 34243.0, 23979.0, 16470.0, 11115.0, 7428.0, 4854.0, 3251.0, 2045.0, 1321.0, 885.0, 610.0, 390.0, 237.0, 159.0, 105.0, 66.0, 33.0, 30.0, 11.0, 7.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.984375, -4.83203125, -4.6796875, -4.52734375, -4.375, -4.22265625, -4.0703125, -3.91796875, -3.765625, -3.61328125, -3.4609375, -3.30859375, -3.15625, -3.00390625, -2.8515625, -2.69921875, -2.546875, -2.39453125, -2.2421875, -2.08984375, -1.9375, -1.78515625, -1.6328125, -1.48046875, -1.328125, -1.17578125, -1.0234375, -0.87109375, -0.71875, -0.56640625, -0.4140625, -0.26171875, -0.109375, 0.04296875, 0.1953125, 0.34765625, 0.5, 0.65234375, 0.8046875, 0.95703125, 1.109375, 1.26171875, 1.4140625, 1.56640625, 1.71875, 1.87109375, 2.0234375, 2.17578125, 2.328125, 2.48046875, 2.6328125, 2.78515625, 2.9375, 3.08984375, 3.2421875, 3.39453125, 3.546875, 3.69921875, 3.8515625, 4.00390625, 4.15625, 4.30859375, 4.4609375, 4.61328125, 4.765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 7.0, 7.0, 8.0, 6.0, 8.0, 11.0, 19.0, 21.0, 17.0, 27.0, 18.0, 26.0, 23.0, 31.0, 32.0, 26.0, 34.0, 36.0, 44.0, 37.0, 35.0, 52.0, 56.0, 36.0, 42.0, 33.0, 32.0, 34.0, 25.0, 35.0, 20.0, 30.0, 27.0, 25.0, 16.0, 6.0, 9.0, 9.0, 13.0, 13.0, 7.0, 5.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.203125, -27.26806640625, -26.3330078125, -25.39794921875, -24.462890625, -23.52783203125, -22.5927734375, -21.65771484375, -20.72265625, -19.78759765625, -18.8525390625, -17.91748046875, -16.982421875, -16.04736328125, -15.1123046875, -14.17724609375, -13.2421875, -12.30712890625, -11.3720703125, -10.43701171875, -9.501953125, -8.56689453125, -7.6318359375, -6.69677734375, -5.76171875, -4.82666015625, -3.8916015625, -2.95654296875, -2.021484375, -1.08642578125, -0.1513671875, 0.78369140625, 1.71875, 2.65380859375, 3.5888671875, 4.52392578125, 5.458984375, 6.39404296875, 7.3291015625, 8.26416015625, 9.19921875, 10.13427734375, 11.0693359375, 12.00439453125, 12.939453125, 13.87451171875, 14.8095703125, 15.74462890625, 16.6796875, 17.61474609375, 18.5498046875, 19.48486328125, 20.419921875, 21.35498046875, 22.2900390625, 23.22509765625, 24.16015625, 25.09521484375, 26.0302734375, 26.96533203125, 27.900390625, 28.83544921875, 29.7705078125, 30.70556640625, 31.640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 7.0, 18.0, 16.0, 18.0, 42.0, 65.0, 82.0, 130.0, 172.0, 302.0, 433.0, 680.0, 1051.0, 1642.0, 2588.0, 4007.0, 6557.0, 10663.0, 18179.0, 33939.0, 661836.0, 236326.0, 28594.0, 15656.0, 9435.0, 5836.0, 3742.0, 2378.0, 1481.0, 944.0, 613.0, 379.0, 247.0, 187.0, 105.0, 65.0, 38.0, 29.0, 28.0, 16.0, 9.0, 9.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.21875, -16.695068359375, -16.17138671875, -15.647705078125, -15.1240234375, -14.600341796875, -14.07666015625, -13.552978515625, -13.029296875, -12.505615234375, -11.98193359375, -11.458251953125, -10.9345703125, -10.410888671875, -9.88720703125, -9.363525390625, -8.83984375, -8.316162109375, -7.79248046875, -7.268798828125, -6.7451171875, -6.221435546875, -5.69775390625, -5.174072265625, -4.650390625, -4.126708984375, -3.60302734375, -3.079345703125, -2.5556640625, -2.031982421875, -1.50830078125, -0.984619140625, -0.4609375, 0.062744140625, 0.58642578125, 1.110107421875, 1.6337890625, 2.157470703125, 2.68115234375, 3.204833984375, 3.728515625, 4.252197265625, 4.77587890625, 5.299560546875, 5.8232421875, 6.346923828125, 6.87060546875, 7.394287109375, 7.91796875, 8.441650390625, 8.96533203125, 9.489013671875, 10.0126953125, 10.536376953125, 11.06005859375, 11.583740234375, 12.107421875, 12.631103515625, 13.15478515625, 13.678466796875, 14.2021484375, 14.725830078125, 15.24951171875, 15.773193359375, 16.296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 4.0, 3.0, 9.0, 11.0, 12.0, 17.0, 10.0, 27.0, 21.0, 23.0, 35.0, 23.0, 39.0, 34.0, 48.0, 48.0, 41.0, 43.0, 45.0, 48.0, 43.0, 44.0, 43.0, 45.0, 31.0, 33.0, 33.0, 29.0, 29.0, 20.0, 25.0, 19.0, 13.0, 9.0, 7.0, 7.0, 7.0, 5.0, 3.0, 5.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.859375, -23.171875, -22.484375, -21.796875, -21.109375, -20.421875, -19.734375, -19.046875, -18.359375, -17.671875, -16.984375, -16.296875, -15.609375, -14.921875, -14.234375, -13.546875, -12.859375, -12.171875, -11.484375, -10.796875, -10.109375, -9.421875, -8.734375, -8.046875, -7.359375, -6.671875, -5.984375, -5.296875, -4.609375, -3.921875, -3.234375, -2.546875, -1.859375, -1.171875, -0.484375, 0.203125, 0.890625, 1.578125, 2.265625, 2.953125, 3.640625, 4.328125, 5.015625, 5.703125, 6.390625, 7.078125, 7.765625, 8.453125, 9.140625, 9.828125, 10.515625, 11.203125, 11.890625, 12.578125, 13.265625, 13.953125, 14.640625, 15.328125, 16.015625, 16.703125, 17.390625, 18.078125, 18.765625, 19.453125, 20.140625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 1.0, 7.0, 10.0, 10.0, 12.0, 18.0, 42.0, 53.0, 67.0, 107.0, 133.0, 218.0, 328.0, 519.0, 797.0, 1179.0, 1821.0, 2943.0, 4759.0, 7615.0, 12694.0, 21945.0, 46710.0, 829595.0, 58432.0, 23450.0, 13467.0, 8062.0, 4846.0, 3115.0, 1946.0, 1224.0, 784.0, 543.0, 365.0, 230.0, 155.0, 100.0, 68.0, 57.0, 37.0, 29.0, 17.0, 15.0, 9.0, 8.0, 6.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.123046875, -1.085052490234375, -1.04705810546875, -1.009063720703125, -0.9710693359375, -0.933074951171875, -0.89508056640625, -0.857086181640625, -0.819091796875, -0.781097412109375, -0.74310302734375, -0.705108642578125, -0.6671142578125, -0.629119873046875, -0.59112548828125, -0.553131103515625, -0.51513671875, -0.477142333984375, -0.43914794921875, -0.401153564453125, -0.3631591796875, -0.325164794921875, -0.28717041015625, -0.249176025390625, -0.211181640625, -0.173187255859375, -0.13519287109375, -0.097198486328125, -0.0592041015625, -0.021209716796875, 0.01678466796875, 0.054779052734375, 0.0927734375, 0.130767822265625, 0.16876220703125, 0.206756591796875, 0.2447509765625, 0.282745361328125, 0.32073974609375, 0.358734130859375, 0.396728515625, 0.434722900390625, 0.47271728515625, 0.510711669921875, 0.5487060546875, 0.586700439453125, 0.62469482421875, 0.662689208984375, 0.70068359375, 0.738677978515625, 0.77667236328125, 0.814666748046875, 0.8526611328125, 0.890655517578125, 0.92864990234375, 0.966644287109375, 1.004638671875, 1.042633056640625, 1.08062744140625, 1.118621826171875, 1.1566162109375, 1.194610595703125, 1.23260498046875, 1.270599365234375, 1.30859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 8.0, 1.0, 1.0, 4.0, 5.0, 12.0, 13.0, 10.0, 11.0, 10.0, 22.0, 40.0, 28.0, 34.0, 45.0, 46.0, 55.0, 70.0, 56.0, 70.0, 67.0, 43.0, 65.0, 46.0, 49.0, 35.0, 28.0, 30.0, 26.0, 17.0, 14.0, 13.0, 9.0, 5.0, 7.0, 4.0, 8.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.698204040527344e-05, -5.5312179028987885e-05, -5.364231765270233e-05, -5.197245627641678e-05, -5.0302594900131226e-05, -4.863273352384567e-05, -4.696287214756012e-05, -4.529301077127457e-05, -4.3623149394989014e-05, -4.195328801870346e-05, -4.028342664241791e-05, -3.8613565266132355e-05, -3.69437038898468e-05, -3.527384251356125e-05, -3.3603981137275696e-05, -3.193411976099014e-05, -3.026425838470459e-05, -2.8594397008419037e-05, -2.6924535632133484e-05, -2.525467425584793e-05, -2.3584812879562378e-05, -2.1914951503276825e-05, -2.0245090126991272e-05, -1.857522875070572e-05, -1.6905367374420166e-05, -1.5235505998134613e-05, -1.356564462184906e-05, -1.1895783245563507e-05, -1.0225921869277954e-05, -8.556060492992401e-06, -6.886199116706848e-06, -5.216337740421295e-06, -3.546476364135742e-06, -1.8766149878501892e-06, -2.0675361156463623e-07, 1.4631077647209167e-06, 3.1329691410064697e-06, 4.802830517292023e-06, 6.472691893577576e-06, 8.142553269863129e-06, 9.812414646148682e-06, 1.1482276022434235e-05, 1.3152137398719788e-05, 1.482199877500534e-05, 1.6491860151290894e-05, 1.8161721527576447e-05, 1.9831582903862e-05, 2.1501444280147552e-05, 2.3171305656433105e-05, 2.484116703271866e-05, 2.651102840900421e-05, 2.8180889785289764e-05, 2.9850751161575317e-05, 3.152061253786087e-05, 3.319047391414642e-05, 3.4860335290431976e-05, 3.653019666671753e-05, 3.820005804300308e-05, 3.9869919419288635e-05, 4.153978079557419e-05, 4.320964217185974e-05, 4.4879503548145294e-05, 4.654936492443085e-05, 4.82192263007164e-05, 4.988908767700195e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 10.0, 11.0, 23.0, 25.0, 20.0, 46.0, 81.0, 142.0, 237.0, 353.0, 547.0, 909.0, 1408.0, 2378.0, 3603.0, 5627.0, 8901.0, 13512.0, 20398.0, 30041.0, 42633.0, 59928.0, 79906.0, 101401.0, 118076.0, 122311.0, 111662.0, 91838.0, 70666.0, 52078.0, 36897.0, 24928.0, 17062.0, 11143.0, 7026.0, 4762.0, 2941.0, 1899.0, 1145.0, 781.0, 422.0, 268.0, 180.0, 117.0, 81.0, 53.0, 35.0, 23.0, 17.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.896484375, -0.8678207397460938, -0.8391571044921875, -0.8104934692382812, -0.781829833984375, -0.7531661987304688, -0.7245025634765625, -0.6958389282226562, -0.66717529296875, -0.6385116577148438, -0.6098480224609375, -0.5811843872070312, -0.552520751953125, -0.5238571166992188, -0.4951934814453125, -0.46652984619140625, -0.4378662109375, -0.40920257568359375, -0.3805389404296875, -0.35187530517578125, -0.323211669921875, -0.29454803466796875, -0.2658843994140625, -0.23722076416015625, -0.20855712890625, -0.17989349365234375, -0.1512298583984375, -0.12256622314453125, -0.093902587890625, -0.06523895263671875, -0.0365753173828125, -0.00791168212890625, 0.020751953125, 0.04941558837890625, 0.0780792236328125, 0.10674285888671875, 0.135406494140625, 0.16407012939453125, 0.1927337646484375, 0.22139739990234375, 0.25006103515625, 0.27872467041015625, 0.3073883056640625, 0.33605194091796875, 0.364715576171875, 0.39337921142578125, 0.4220428466796875, 0.45070648193359375, 0.4793701171875, 0.5080337524414062, 0.5366973876953125, 0.5653610229492188, 0.594024658203125, 0.6226882934570312, 0.6513519287109375, 0.6800155639648438, 0.70867919921875, 0.7373428344726562, 0.7660064697265625, 0.7946701049804688, 0.823333740234375, 0.8519973754882812, 0.8806610107421875, 0.9093246459960938, 0.93798828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 5.0, 7.0, 12.0, 17.0, 15.0, 16.0, 28.0, 30.0, 40.0, 33.0, 41.0, 36.0, 52.0, 64.0, 59.0, 65.0, 54.0, 64.0, 44.0, 43.0, 57.0, 42.0, 30.0, 33.0, 37.0, 10.0, 12.0, 10.0, 5.0, 5.0, 7.0, 10.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58935546875, -0.5706710815429688, -0.5519866943359375, -0.5333023071289062, -0.514617919921875, -0.49593353271484375, -0.4772491455078125, -0.45856475830078125, -0.43988037109375, -0.42119598388671875, -0.4025115966796875, -0.38382720947265625, -0.365142822265625, -0.34645843505859375, -0.3277740478515625, -0.30908966064453125, -0.2904052734375, -0.27172088623046875, -0.2530364990234375, -0.23435211181640625, -0.215667724609375, -0.19698333740234375, -0.1782989501953125, -0.15961456298828125, -0.14093017578125, -0.12224578857421875, -0.1035614013671875, -0.08487701416015625, -0.066192626953125, -0.04750823974609375, -0.0288238525390625, -0.01013946533203125, 0.008544921875, 0.02722930908203125, 0.0459136962890625, 0.06459808349609375, 0.083282470703125, 0.10196685791015625, 0.1206512451171875, 0.13933563232421875, 0.15802001953125, 0.17670440673828125, 0.1953887939453125, 0.21407318115234375, 0.232757568359375, 0.25144195556640625, 0.2701263427734375, 0.28881072998046875, 0.3074951171875, 0.32617950439453125, 0.3448638916015625, 0.36354827880859375, 0.382232666015625, 0.40091705322265625, 0.4196014404296875, 0.43828582763671875, 0.45697021484375, 0.47565460205078125, 0.4943389892578125, 0.5130233764648438, 0.531707763671875, 0.5503921508789062, 0.5690765380859375, 0.5877609252929688, 0.6064453125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 2.0, 7.0, 13.0, 7.0, 11.0, 13.0, 12.0, 16.0, 16.0, 20.0, 20.0, 22.0, 31.0, 21.0, 21.0, 41.0, 30.0, 27.0, 38.0, 34.0, 42.0, 49.0, 47.0, 46.0, 27.0, 35.0, 33.0, 23.0, 30.0, 36.0, 26.0, 27.0, 21.0, 16.0, 21.0, 12.0, 15.0, 12.0, 12.0, 10.0, 11.0, 11.0, 8.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 5.0], "bins": [-26.746143341064453, -25.995161056518555, -25.24418067932129, -24.49319839477539, -23.742218017578125, -22.991235733032227, -22.240253448486328, -21.489273071289062, -20.738290786743164, -19.987308502197266, -19.236328125, -18.4853458404541, -17.734365463256836, -16.983383178710938, -16.232402801513672, -15.481420516967773, -14.730439186096191, -13.97945785522461, -13.228476524353027, -12.477495193481445, -11.726512908935547, -10.975531578063965, -10.224550247192383, -9.473567962646484, -8.722587585449219, -7.971606254577637, -7.2206244468688965, -6.4696431159973145, -5.718661308288574, -4.967679977416992, -4.21669864654541, -3.46571683883667, -2.7147350311279297, -1.9637534618377686, -1.212772011756897, -0.4617905616760254, 0.28919100761413574, 1.0401725769042969, 1.791153907775879, 2.542135715484619, 3.293117046356201, 4.044098377227783, 4.795080184936523, 5.5460615158081055, 6.2970428466796875, 7.048024654388428, 7.79900598526001, 8.54998779296875, 9.300969123840332, 10.051950454711914, 10.802931785583496, 11.553913116455078, 12.304895401000977, 13.055876731872559, 13.80685806274414, 14.557840347290039, 15.308820724487305, 16.059803009033203, 16.81078338623047, 17.561765670776367, 18.312746047973633, 19.06372833251953, 19.814708709716797, 20.565690994262695, 21.316673278808594]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 7.0, 5.0, 8.0, 8.0, 5.0, 10.0, 17.0, 19.0, 20.0, 25.0, 17.0, 24.0, 30.0, 26.0, 30.0, 27.0, 34.0, 37.0, 38.0, 38.0, 39.0, 48.0, 49.0, 50.0, 34.0, 44.0, 26.0, 34.0, 29.0, 32.0, 22.0, 30.0, 34.0, 18.0, 20.0, 9.0, 4.0, 14.0, 12.0, 10.0, 10.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.60406494140625, -27.664897918701172, -26.72572898864746, -25.786561965942383, -24.847393035888672, -23.908226013183594, -22.969058990478516, -22.029890060424805, -21.090721130371094, -20.151554107666016, -19.212385177612305, -18.273218154907227, -17.334049224853516, -16.394882202148438, -15.455714225769043, -14.516546249389648, -13.57737922668457, -12.638211250305176, -11.699043273925781, -10.759876251220703, -9.820707321166992, -8.881540298461914, -7.9423723220825195, -7.003204345703125, -6.0640363693237305, -5.124868392944336, -4.185700416564941, -3.246532917022705, -2.3073649406433105, -1.368196964263916, -0.4290294647216797, 0.5101385116577148, 1.4493083953857422, 2.3884763717651367, 3.327644109725952, 4.266811847686768, 5.205979824066162, 6.145147800445557, 7.084315299987793, 8.023483276367188, 8.962651252746582, 9.901819229125977, 10.840987205505371, 11.780155181884766, 12.719322204589844, 13.658491134643555, 14.597658157348633, 15.536826133728027, 16.475994110107422, 17.4151611328125, 18.35433006286621, 19.29349708557129, 20.232666015625, 21.171833038330078, 22.111000061035156, 23.050168991088867, 23.989337921142578, 24.928504943847656, 25.867673873901367, 26.806840896606445, 27.746009826660156, 28.685176849365234, 29.624343872070312, 30.563512802124023, 31.5026798248291]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 8.0, 9.0, 14.0, 32.0, 35.0, 61.0, 98.0, 172.0, 262.0, 397.0, 672.0, 1033.0, 1526.0, 2416.0, 3672.0, 5204.0, 7708.0, 10959.0, 14953.0, 20152.0, 26877.0, 34895.0, 43534.0, 53045.0, 61903.0, 70332.0, 76421.0, 80295.0, 80272.0, 77105.0, 72336.0, 63568.0, 54694.0, 45383.0, 36570.0, 28235.0, 21513.0, 15822.0, 11502.0, 8152.0, 5639.0, 3811.0, 2498.0, 1712.0, 1145.0, 723.0, 461.0, 278.0, 167.0, 127.0, 72.0, 43.0, 20.0, 12.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-13.5234375, -13.0885009765625, -12.653564453125, -12.2186279296875, -11.78369140625, -11.3487548828125, -10.913818359375, -10.4788818359375, -10.0439453125, -9.6090087890625, -9.174072265625, -8.7391357421875, -8.30419921875, -7.8692626953125, -7.434326171875, -6.9993896484375, -6.564453125, -6.1295166015625, -5.694580078125, -5.2596435546875, -4.82470703125, -4.3897705078125, -3.954833984375, -3.5198974609375, -3.0849609375, -2.6500244140625, -2.215087890625, -1.7801513671875, -1.34521484375, -0.9102783203125, -0.475341796875, -0.0404052734375, 0.39453125, 0.8294677734375, 1.264404296875, 1.6993408203125, 2.13427734375, 2.5692138671875, 3.004150390625, 3.4390869140625, 3.8740234375, 4.3089599609375, 4.743896484375, 5.1788330078125, 5.61376953125, 6.0487060546875, 6.483642578125, 6.9185791015625, 7.353515625, 7.7884521484375, 8.223388671875, 8.6583251953125, 9.09326171875, 9.5281982421875, 9.963134765625, 10.3980712890625, 10.8330078125, 11.2679443359375, 11.702880859375, 12.1378173828125, 12.57275390625, 13.0076904296875, 13.442626953125, 13.8775634765625, 14.3125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 7.0, 6.0, 8.0, 7.0, 7.0, 10.0, 22.0, 17.0, 17.0, 23.0, 24.0, 21.0, 28.0, 29.0, 31.0, 27.0, 33.0, 35.0, 43.0, 34.0, 41.0, 50.0, 48.0, 49.0, 35.0, 38.0, 30.0, 34.0, 27.0, 31.0, 25.0, 29.0, 32.0, 18.0, 18.0, 9.0, 6.0, 12.0, 13.0, 7.0, 13.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.71875, -26.804931640625, -25.89111328125, -24.977294921875, -24.0634765625, -23.149658203125, -22.23583984375, -21.322021484375, -20.408203125, -19.494384765625, -18.58056640625, -17.666748046875, -16.7529296875, -15.839111328125, -14.92529296875, -14.011474609375, -13.09765625, -12.183837890625, -11.27001953125, -10.356201171875, -9.4423828125, -8.528564453125, -7.61474609375, -6.700927734375, -5.787109375, -4.873291015625, -3.95947265625, -3.045654296875, -2.1318359375, -1.218017578125, -0.30419921875, 0.609619140625, 1.5234375, 2.437255859375, 3.35107421875, 4.264892578125, 5.1787109375, 6.092529296875, 7.00634765625, 7.920166015625, 8.833984375, 9.747802734375, 10.66162109375, 11.575439453125, 12.4892578125, 13.403076171875, 14.31689453125, 15.230712890625, 16.14453125, 17.058349609375, 17.97216796875, 18.885986328125, 19.7998046875, 20.713623046875, 21.62744140625, 22.541259765625, 23.455078125, 24.368896484375, 25.28271484375, 26.196533203125, 27.1103515625, 28.024169921875, 28.93798828125, 29.851806640625, 30.765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 16.0, 16.0, 30.0, 54.0, 117.0, 151.0, 296.0, 415.0, 708.0, 1206.0, 1855.0, 2838.0, 4422.0, 6948.0, 10094.0, 14873.0, 20856.0, 28414.0, 37978.0, 48550.0, 60632.0, 71775.0, 81223.0, 87487.0, 89480.0, 87255.0, 81430.0, 71425.0, 60091.0, 48061.0, 37783.0, 28459.0, 20608.0, 14538.0, 9867.0, 6574.0, 4312.0, 2836.0, 1845.0, 1189.0, 739.0, 433.0, 249.0, 159.0, 103.0, 71.0, 37.0, 22.0, 12.0, 10.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-15.5234375, -15.0455322265625, -14.567626953125, -14.0897216796875, -13.61181640625, -13.1339111328125, -12.656005859375, -12.1781005859375, -11.7001953125, -11.2222900390625, -10.744384765625, -10.2664794921875, -9.78857421875, -9.3106689453125, -8.832763671875, -8.3548583984375, -7.876953125, -7.3990478515625, -6.921142578125, -6.4432373046875, -5.96533203125, -5.4874267578125, -5.009521484375, -4.5316162109375, -4.0537109375, -3.5758056640625, -3.097900390625, -2.6199951171875, -2.14208984375, -1.6641845703125, -1.186279296875, -0.7083740234375, -0.23046875, 0.2474365234375, 0.725341796875, 1.2032470703125, 1.68115234375, 2.1590576171875, 2.636962890625, 3.1148681640625, 3.5927734375, 4.0706787109375, 4.548583984375, 5.0264892578125, 5.50439453125, 5.9822998046875, 6.460205078125, 6.9381103515625, 7.416015625, 7.8939208984375, 8.371826171875, 8.8497314453125, 9.32763671875, 9.8055419921875, 10.283447265625, 10.7613525390625, 11.2392578125, 11.7171630859375, 12.195068359375, 12.6729736328125, 13.15087890625, 13.6287841796875, 14.106689453125, 14.5845947265625, 15.0625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 8.0, 5.0, 8.0, 10.0, 8.0, 13.0, 9.0, 10.0, 22.0, 20.0, 28.0, 22.0, 29.0, 30.0, 33.0, 33.0, 35.0, 30.0, 47.0, 33.0, 29.0, 43.0, 40.0, 38.0, 34.0, 34.0, 25.0, 31.0, 38.0, 39.0, 34.0, 18.0, 33.0, 20.0, 17.0, 19.0, 18.0, 10.0, 9.0, 9.0, 9.0, 6.0, 6.0, 3.0, 1.0, 5.0, 0.0, 0.0, 4.0, 2.0, 1.0], "bins": [-19.75, -19.173583984375, -18.59716796875, -18.020751953125, -17.4443359375, -16.867919921875, -16.29150390625, -15.715087890625, -15.138671875, -14.562255859375, -13.98583984375, -13.409423828125, -12.8330078125, -12.256591796875, -11.68017578125, -11.103759765625, -10.52734375, -9.950927734375, -9.37451171875, -8.798095703125, -8.2216796875, -7.645263671875, -7.06884765625, -6.492431640625, -5.916015625, -5.339599609375, -4.76318359375, -4.186767578125, -3.6103515625, -3.033935546875, -2.45751953125, -1.881103515625, -1.3046875, -0.728271484375, -0.15185546875, 0.424560546875, 1.0009765625, 1.577392578125, 2.15380859375, 2.730224609375, 3.306640625, 3.883056640625, 4.45947265625, 5.035888671875, 5.6123046875, 6.188720703125, 6.76513671875, 7.341552734375, 7.91796875, 8.494384765625, 9.07080078125, 9.647216796875, 10.2236328125, 10.800048828125, 11.37646484375, 11.952880859375, 12.529296875, 13.105712890625, 13.68212890625, 14.258544921875, 14.8349609375, 15.411376953125, 15.98779296875, 16.564208984375, 17.140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 11.0, 23.0, 20.0, 47.0, 61.0, 85.0, 189.0, 284.0, 469.0, 802.0, 1394.0, 2311.0, 3877.0, 6388.0, 10580.0, 16854.0, 26730.0, 40275.0, 57635.0, 77668.0, 97853.0, 113391.0, 118680.0, 114934.0, 99766.0, 80926.0, 60427.0, 42653.0, 28113.0, 18141.0, 11159.0, 6824.0, 3916.0, 2392.0, 1461.0, 860.0, 509.0, 297.0, 211.0, 117.0, 84.0, 51.0, 31.0, 17.0, 16.0, 7.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.828125, -7.572021484375, -7.31591796875, -7.059814453125, -6.8037109375, -6.547607421875, -6.29150390625, -6.035400390625, -5.779296875, -5.523193359375, -5.26708984375, -5.010986328125, -4.7548828125, -4.498779296875, -4.24267578125, -3.986572265625, -3.73046875, -3.474365234375, -3.21826171875, -2.962158203125, -2.7060546875, -2.449951171875, -2.19384765625, -1.937744140625, -1.681640625, -1.425537109375, -1.16943359375, -0.913330078125, -0.6572265625, -0.401123046875, -0.14501953125, 0.111083984375, 0.3671875, 0.623291015625, 0.87939453125, 1.135498046875, 1.3916015625, 1.647705078125, 1.90380859375, 2.159912109375, 2.416015625, 2.672119140625, 2.92822265625, 3.184326171875, 3.4404296875, 3.696533203125, 3.95263671875, 4.208740234375, 4.46484375, 4.720947265625, 4.97705078125, 5.233154296875, 5.4892578125, 5.745361328125, 6.00146484375, 6.257568359375, 6.513671875, 6.769775390625, 7.02587890625, 7.281982421875, 7.5380859375, 7.794189453125, 8.05029296875, 8.306396484375, 8.5625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 12.0, 3.0, 8.0, 9.0, 15.0, 10.0, 21.0, 16.0, 20.0, 21.0, 28.0, 34.0, 30.0, 41.0, 46.0, 52.0, 46.0, 51.0, 41.0, 40.0, 40.0, 42.0, 58.0, 34.0, 40.0, 39.0, 32.0, 24.0, 16.0, 28.0, 19.0, 12.0, 8.0, 9.0, 9.0, 14.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00087738037109375, -0.0008480101823806763, -0.0008186399936676025, -0.0007892698049545288, -0.0007598996162414551, -0.0007305294275283813, -0.0007011592388153076, -0.0006717890501022339, -0.0006424188613891602, -0.0006130486726760864, -0.0005836784839630127, -0.000554308295249939, -0.0005249381065368652, -0.0004955679178237915, -0.0004661977291107178, -0.00043682754039764404, -0.0004074573516845703, -0.0003780871629714966, -0.00034871697425842285, -0.0003193467855453491, -0.0002899765968322754, -0.00026060640811920166, -0.00023123621940612793, -0.0002018660306930542, -0.00017249584197998047, -0.00014312565326690674, -0.00011375546455383301, -8.438527584075928e-05, -5.501508712768555e-05, -2.5644898414611816e-05, 3.725290298461914e-06, 3.3095479011535645e-05, 6.246566772460938e-05, 9.18358564376831e-05, 0.00012120604515075684, 0.00015057623386383057, 0.0001799464225769043, 0.00020931661128997803, 0.00023868680000305176, 0.0002680569887161255, 0.0002974271774291992, 0.00032679736614227295, 0.0003561675548553467, 0.0003855377435684204, 0.00041490793228149414, 0.00044427812099456787, 0.0004736483097076416, 0.0005030184984207153, 0.0005323886871337891, 0.0005617588758468628, 0.0005911290645599365, 0.0006204992532730103, 0.000649869441986084, 0.0006792396306991577, 0.0007086098194122314, 0.0007379800081253052, 0.0007673501968383789, 0.0007967203855514526, 0.0008260905742645264, 0.0008554607629776001, 0.0008848309516906738, 0.0009142011404037476, 0.0009435713291168213, 0.000972941517829895, 0.0010023117065429688]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 5.0, 13.0, 20.0, 27.0, 44.0, 78.0, 116.0, 219.0, 335.0, 503.0, 901.0, 1447.0, 2582.0, 4234.0, 6934.0, 11665.0, 18033.0, 28071.0, 41756.0, 58047.0, 77093.0, 94629.0, 108629.0, 114192.0, 110253.0, 98149.0, 81153.0, 61829.0, 44766.0, 30509.0, 20023.0, 12854.0, 7655.0, 4740.0, 2771.0, 1708.0, 1025.0, 616.0, 358.0, 247.0, 129.0, 82.0, 51.0, 28.0, 10.0, 14.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-9.1640625, -8.891357421875, -8.61865234375, -8.345947265625, -8.0732421875, -7.800537109375, -7.52783203125, -7.255126953125, -6.982421875, -6.709716796875, -6.43701171875, -6.164306640625, -5.8916015625, -5.618896484375, -5.34619140625, -5.073486328125, -4.80078125, -4.528076171875, -4.25537109375, -3.982666015625, -3.7099609375, -3.437255859375, -3.16455078125, -2.891845703125, -2.619140625, -2.346435546875, -2.07373046875, -1.801025390625, -1.5283203125, -1.255615234375, -0.98291015625, -0.710205078125, -0.4375, -0.164794921875, 0.10791015625, 0.380615234375, 0.6533203125, 0.926025390625, 1.19873046875, 1.471435546875, 1.744140625, 2.016845703125, 2.28955078125, 2.562255859375, 2.8349609375, 3.107666015625, 3.38037109375, 3.653076171875, 3.92578125, 4.198486328125, 4.47119140625, 4.743896484375, 5.0166015625, 5.289306640625, 5.56201171875, 5.834716796875, 6.107421875, 6.380126953125, 6.65283203125, 6.925537109375, 7.1982421875, 7.470947265625, 7.74365234375, 8.016357421875, 8.2890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 1.0, 4.0, 3.0, 5.0, 9.0, 21.0, 15.0, 22.0, 16.0, 29.0, 19.0, 30.0, 31.0, 31.0, 39.0, 30.0, 46.0, 42.0, 37.0, 51.0, 35.0, 34.0, 39.0, 49.0, 55.0, 44.0, 46.0, 35.0, 38.0, 20.0, 24.0, 15.0, 15.0, 15.0, 17.0, 10.0, 6.0, 2.0, 6.0, 5.0, 4.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.968109130859375, -3.84637451171875, -3.724639892578125, -3.6029052734375, -3.481170654296875, -3.35943603515625, -3.237701416015625, -3.115966796875, -2.994232177734375, -2.87249755859375, -2.750762939453125, -2.6290283203125, -2.507293701171875, -2.38555908203125, -2.263824462890625, -2.14208984375, -2.020355224609375, -1.89862060546875, -1.776885986328125, -1.6551513671875, -1.533416748046875, -1.41168212890625, -1.289947509765625, -1.168212890625, -1.046478271484375, -0.92474365234375, -0.803009033203125, -0.6812744140625, -0.559539794921875, -0.43780517578125, -0.316070556640625, -0.1943359375, -0.072601318359375, 0.04913330078125, 0.170867919921875, 0.2926025390625, 0.414337158203125, 0.53607177734375, 0.657806396484375, 0.779541015625, 0.901275634765625, 1.02301025390625, 1.144744873046875, 1.2664794921875, 1.388214111328125, 1.50994873046875, 1.631683349609375, 1.75341796875, 1.875152587890625, 1.99688720703125, 2.118621826171875, 2.2403564453125, 2.362091064453125, 2.48382568359375, 2.605560302734375, 2.727294921875, 2.849029541015625, 2.97076416015625, 3.092498779296875, 3.2142333984375, 3.335968017578125, 3.45770263671875, 3.579437255859375, 3.701171875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 2.0, 6.0, 6.0, 8.0, 5.0, 11.0, 15.0, 9.0, 18.0, 15.0, 23.0, 17.0, 15.0, 23.0, 26.0, 35.0, 38.0, 42.0, 32.0, 26.0, 38.0, 45.0, 44.0, 43.0, 49.0, 33.0, 37.0, 39.0, 32.0, 32.0, 31.0, 31.0, 17.0, 20.0, 23.0, 16.0, 16.0, 11.0, 19.0, 10.0, 7.0, 9.0, 4.0, 5.0, 8.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.271846771240234, -25.466659545898438, -24.661470413208008, -23.85628318786621, -23.051095962524414, -22.245906829833984, -21.440719604492188, -20.63553237915039, -19.830345153808594, -19.025157928466797, -18.219968795776367, -17.41478157043457, -16.609594345092773, -15.80440616607666, -14.999217987060547, -14.19403076171875, -13.38884162902832, -12.583653450012207, -11.77846622467041, -10.973278045654297, -10.1680908203125, -9.362902641296387, -8.557714462280273, -7.752526760101318, -6.947339057922363, -6.142151355743408, -5.336963653564453, -4.53177547454834, -3.7265877723693848, -2.9214000701904297, -2.1162118911743164, -1.3110241889953613, -0.5058345794677734, 0.2993532419204712, 1.1045410633087158, 1.90972900390625, 2.714916706085205, 3.52010440826416, 4.325292587280273, 5.1304802894592285, 5.935667991638184, 6.740855693817139, 7.546043395996094, 8.351231575012207, 9.15641975402832, 9.961606979370117, 10.76679515838623, 11.571983337402344, 12.37717056274414, 13.182358741760254, 13.98754596710205, 14.792734146118164, 15.597921371459961, 16.40311050415039, 17.208297729492188, 18.013484954833984, 18.81867218017578, 19.623859405517578, 20.429048538208008, 21.234235763549805, 22.0394229888916, 22.84461212158203, 23.649799346923828, 24.454986572265625, 25.260175704956055]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 6.0, 8.0, 13.0, 10.0, 13.0, 16.0, 27.0, 22.0, 22.0, 21.0, 30.0, 28.0, 26.0, 37.0, 37.0, 44.0, 25.0, 47.0, 48.0, 38.0, 44.0, 42.0, 35.0, 35.0, 33.0, 38.0, 39.0, 22.0, 26.0, 27.0, 18.0, 20.0, 20.0, 13.0, 15.0, 12.0, 6.0, 8.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.278982162475586, -30.311729431152344, -29.344478607177734, -28.377225875854492, -27.40997314453125, -26.44272232055664, -25.4754695892334, -24.508216857910156, -23.540964126586914, -22.573711395263672, -21.606460571289062, -20.63920783996582, -19.671955108642578, -18.70470428466797, -17.737451553344727, -16.770198822021484, -15.802947044372559, -14.835695266723633, -13.86844253540039, -12.901190757751465, -11.933938026428223, -10.966686248779297, -9.999433517456055, -9.032181739807129, -8.064929962158203, -7.097677707672119, -6.130425453186035, -5.163173675537109, -4.195920944213867, -3.2286691665649414, -2.2614169120788574, -1.2941646575927734, -0.32691192626953125, 0.640340268611908, 1.6075924634933472, 2.5748445987701416, 3.5420968532562256, 4.5093488693237305, 5.4766011238098145, 6.443853378295898, 7.411105632781982, 8.378357887268066, 9.345609664916992, 10.312862396240234, 11.28011417388916, 12.247365951538086, 13.214618682861328, 14.18187141418457, 15.149123191833496, 16.116374969482422, 17.083627700805664, 18.050880432128906, 19.018131256103516, 19.985383987426758, 20.95263671875, 21.91988754272461, 22.88714027404785, 23.854393005371094, 24.821643829345703, 25.788896560668945, 26.756149291992188, 27.723400115966797, 28.69065284729004, 29.65790557861328, 30.625158309936523]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 11.0, 15.0, 32.0, 51.0, 86.0, 124.0, 205.0, 338.0, 586.0, 974.0, 1656.0, 2650.0, 4404.0, 7057.0, 11255.0, 18067.0, 28108.0, 43381.0, 66569.0, 98038.0, 140713.0, 193727.0, 256838.0, 321573.0, 377770.0, 413952.0, 421657.0, 399168.0, 351278.0, 290094.0, 226009.0, 166355.0, 118129.0, 81540.0, 54500.0, 35539.0, 23047.0, 14471.0, 9275.0, 5729.0, 3617.0, 2215.0, 1338.0, 821.0, 537.0, 278.0, 206.0, 114.0, 72.0, 51.0, 26.0, 16.0, 13.0, 7.0, 8.0, 2.0, 2.0, 1.0, 1.0], "bins": [-19.515625, -18.891357421875, -18.26708984375, -17.642822265625, -17.0185546875, -16.394287109375, -15.77001953125, -15.145751953125, -14.521484375, -13.897216796875, -13.27294921875, -12.648681640625, -12.0244140625, -11.400146484375, -10.77587890625, -10.151611328125, -9.52734375, -8.903076171875, -8.27880859375, -7.654541015625, -7.0302734375, -6.406005859375, -5.78173828125, -5.157470703125, -4.533203125, -3.908935546875, -3.28466796875, -2.660400390625, -2.0361328125, -1.411865234375, -0.78759765625, -0.163330078125, 0.4609375, 1.085205078125, 1.70947265625, 2.333740234375, 2.9580078125, 3.582275390625, 4.20654296875, 4.830810546875, 5.455078125, 6.079345703125, 6.70361328125, 7.327880859375, 7.9521484375, 8.576416015625, 9.20068359375, 9.824951171875, 10.44921875, 11.073486328125, 11.69775390625, 12.322021484375, 12.9462890625, 13.570556640625, 14.19482421875, 14.819091796875, 15.443359375, 16.067626953125, 16.69189453125, 17.316162109375, 17.9404296875, 18.564697265625, 19.18896484375, 19.813232421875, 20.4375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 6.0, 6.0, 6.0, 12.0, 11.0, 10.0, 14.0, 21.0, 25.0, 27.0, 21.0, 24.0, 27.0, 28.0, 33.0, 41.0, 36.0, 33.0, 37.0, 49.0, 47.0, 36.0, 41.0, 42.0, 37.0, 27.0, 40.0, 40.0, 25.0, 25.0, 24.0, 27.0, 17.0, 19.0, 18.0, 14.0, 12.0, 8.0, 8.0, 7.0, 5.0, 5.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.390625, -26.528564453125, -25.66650390625, -24.804443359375, -23.9423828125, -23.080322265625, -22.21826171875, -21.356201171875, -20.494140625, -19.632080078125, -18.77001953125, -17.907958984375, -17.0458984375, -16.183837890625, -15.32177734375, -14.459716796875, -13.59765625, -12.735595703125, -11.87353515625, -11.011474609375, -10.1494140625, -9.287353515625, -8.42529296875, -7.563232421875, -6.701171875, -5.839111328125, -4.97705078125, -4.114990234375, -3.2529296875, -2.390869140625, -1.52880859375, -0.666748046875, 0.1953125, 1.057373046875, 1.91943359375, 2.781494140625, 3.6435546875, 4.505615234375, 5.36767578125, 6.229736328125, 7.091796875, 7.953857421875, 8.81591796875, 9.677978515625, 10.5400390625, 11.402099609375, 12.26416015625, 13.126220703125, 13.98828125, 14.850341796875, 15.71240234375, 16.574462890625, 17.4365234375, 18.298583984375, 19.16064453125, 20.022705078125, 20.884765625, 21.746826171875, 22.60888671875, 23.470947265625, 24.3330078125, 25.195068359375, 26.05712890625, 26.919189453125, 27.78125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 4.0, 7.0, 14.0, 19.0, 31.0, 67.0, 124.0, 179.0, 326.0, 564.0, 1008.0, 1725.0, 3022.0, 5020.0, 8653.0, 14556.0, 23973.0, 39100.0, 61375.0, 94067.0, 138067.0, 194767.0, 259916.0, 326951.0, 386933.0, 426045.0, 434008.0, 408876.0, 359430.0, 294975.0, 226964.0, 165389.0, 114485.0, 77278.0, 49247.0, 30853.0, 18814.0, 11395.0, 6702.0, 4004.0, 2238.0, 1389.0, 763.0, 439.0, 233.0, 136.0, 76.0, 47.0, 19.0, 11.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.265625, -20.562744140625, -19.85986328125, -19.156982421875, -18.4541015625, -17.751220703125, -17.04833984375, -16.345458984375, -15.642578125, -14.939697265625, -14.23681640625, -13.533935546875, -12.8310546875, -12.128173828125, -11.42529296875, -10.722412109375, -10.01953125, -9.316650390625, -8.61376953125, -7.910888671875, -7.2080078125, -6.505126953125, -5.80224609375, -5.099365234375, -4.396484375, -3.693603515625, -2.99072265625, -2.287841796875, -1.5849609375, -0.882080078125, -0.17919921875, 0.523681640625, 1.2265625, 1.929443359375, 2.63232421875, 3.335205078125, 4.0380859375, 4.740966796875, 5.44384765625, 6.146728515625, 6.849609375, 7.552490234375, 8.25537109375, 8.958251953125, 9.6611328125, 10.364013671875, 11.06689453125, 11.769775390625, 12.47265625, 13.175537109375, 13.87841796875, 14.581298828125, 15.2841796875, 15.987060546875, 16.68994140625, 17.392822265625, 18.095703125, 18.798583984375, 19.50146484375, 20.204345703125, 20.9072265625, 21.610107421875, 22.31298828125, 23.015869140625, 23.71875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 14.0, 10.0, 19.0, 31.0, 29.0, 41.0, 53.0, 75.0, 71.0, 84.0, 103.0, 123.0, 152.0, 138.0, 185.0, 191.0, 185.0, 194.0, 212.0, 203.0, 189.0, 194.0, 194.0, 171.0, 168.0, 156.0, 149.0, 117.0, 114.0, 110.0, 69.0, 65.0, 62.0, 54.0, 25.0, 24.0, 19.0, 18.0, 17.0, 9.0, 5.0, 11.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.4140625, -10.0238037109375, -9.633544921875, -9.2432861328125, -8.85302734375, -8.4627685546875, -8.072509765625, -7.6822509765625, -7.2919921875, -6.9017333984375, -6.511474609375, -6.1212158203125, -5.73095703125, -5.3406982421875, -4.950439453125, -4.5601806640625, -4.169921875, -3.7796630859375, -3.389404296875, -2.9991455078125, -2.60888671875, -2.2186279296875, -1.828369140625, -1.4381103515625, -1.0478515625, -0.6575927734375, -0.267333984375, 0.1229248046875, 0.51318359375, 0.9034423828125, 1.293701171875, 1.6839599609375, 2.07421875, 2.4644775390625, 2.854736328125, 3.2449951171875, 3.63525390625, 4.0255126953125, 4.415771484375, 4.8060302734375, 5.1962890625, 5.5865478515625, 5.976806640625, 6.3670654296875, 6.75732421875, 7.1475830078125, 7.537841796875, 7.9281005859375, 8.318359375, 8.7086181640625, 9.098876953125, 9.4891357421875, 9.87939453125, 10.2696533203125, 10.659912109375, 11.0501708984375, 11.4404296875, 11.8306884765625, 12.220947265625, 12.6112060546875, 13.00146484375, 13.3917236328125, 13.781982421875, 14.1722412109375, 14.5625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 8.0, 17.0, 9.0, 10.0, 13.0, 23.0, 15.0, 30.0, 25.0, 23.0, 35.0, 37.0, 29.0, 32.0, 27.0, 28.0, 27.0, 49.0, 44.0, 39.0, 28.0, 26.0, 48.0, 38.0, 49.0, 41.0, 42.0, 33.0, 25.0, 18.0, 13.0, 29.0, 19.0, 14.0, 8.0, 15.0, 4.0, 7.0, 6.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.76230812072754, -25.899370193481445, -25.03643226623535, -24.173492431640625, -23.31055450439453, -22.447616577148438, -21.584678649902344, -20.72174072265625, -19.858802795410156, -18.995864868164062, -18.13292694091797, -17.269989013671875, -16.40704917907715, -15.544111251831055, -14.681173324584961, -13.818235397338867, -12.95529556274414, -12.092357635498047, -11.229418754577637, -10.366480827331543, -9.503541946411133, -8.640604019165039, -7.777666091918945, -6.914727687835693, -6.051789283752441, -5.1888508796691895, -4.3259124755859375, -3.4629745483398438, -2.600036144256592, -1.7370977401733398, -0.8741598129272461, -0.01122140884399414, 0.851715087890625, 1.7146533727645874, 2.57759165763855, 3.4405298233032227, 4.303468227386475, 5.166406631469727, 6.02934455871582, 6.892282962799072, 7.755221366882324, 8.618159294128418, 9.481098175048828, 10.344036102294922, 11.206974029541016, 12.069912910461426, 12.93285083770752, 13.79578971862793, 14.658727645874023, 15.521665573120117, 16.38460350036621, 17.247543334960938, 18.11048126220703, 18.973419189453125, 19.83635711669922, 20.699295043945312, 21.562232971191406, 22.4251708984375, 23.288108825683594, 24.151046752929688, 25.013986587524414, 25.876924514770508, 26.7398624420166, 27.602800369262695, 28.465740203857422]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 7.0, 8.0, 4.0, 7.0, 14.0, 13.0, 8.0, 9.0, 14.0, 16.0, 16.0, 18.0, 15.0, 31.0, 28.0, 29.0, 38.0, 29.0, 26.0, 35.0, 34.0, 29.0, 35.0, 36.0, 31.0, 31.0, 35.0, 35.0, 39.0, 34.0, 27.0, 27.0, 24.0, 21.0, 20.0, 27.0, 14.0, 17.0, 20.0, 19.0, 16.0, 13.0, 10.0, 4.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-25.637876510620117, -24.81793785095215, -23.998001098632812, -23.178062438964844, -22.358123779296875, -21.53818702697754, -20.71824836730957, -19.898311614990234, -19.078372955322266, -18.258434295654297, -17.43849754333496, -16.618558883666992, -15.79862117767334, -14.978683471679688, -14.158744812011719, -13.338807106018066, -12.518869400024414, -11.698931694030762, -10.87899398803711, -10.05905532836914, -9.239117622375488, -8.419179916381836, -7.599241733551025, -6.779303550720215, -5.9593658447265625, -5.13942813873291, -4.3194899559021, -3.499552011489868, -2.6796140670776367, -1.8596763610839844, -1.0397381782531738, -0.21979999542236328, 0.6001396179199219, 1.4200775623321533, 2.2400155067443848, 3.059953451156616, 3.8798913955688477, 4.6998291015625, 5.5197672843933105, 6.339705467224121, 7.159643173217773, 7.979580879211426, 8.799518585205078, 9.619457244873047, 10.4393949508667, 11.259332656860352, 12.07927131652832, 12.899209022521973, 13.719146728515625, 14.539084434509277, 15.35902214050293, 16.1789608001709, 16.998897552490234, 17.818836212158203, 18.638774871826172, 19.45871353149414, 20.278650283813477, 21.098588943481445, 21.91852569580078, 22.73846435546875, 23.55840301513672, 24.378339767456055, 25.198278427124023, 26.01821517944336, 26.838153839111328]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 7.0, 4.0, 15.0, 16.0, 34.0, 45.0, 88.0, 123.0, 221.0, 317.0, 482.0, 731.0, 1097.0, 1789.0, 2768.0, 4307.0, 6603.0, 9877.0, 14647.0, 21173.0, 30888.0, 42686.0, 57454.0, 73343.0, 88219.0, 100575.0, 105272.0, 102516.0, 92112.0, 77484.0, 61462.0, 46599.0, 33548.0, 23965.0, 16306.0, 11042.0, 7199.0, 4783.0, 3154.0, 2010.0, 1278.0, 810.0, 515.0, 346.0, 248.0, 143.0, 96.0, 58.0, 47.0, 18.0, 14.0, 14.0, 4.0, 4.0, 4.0, 2.0, 0.0, 3.0], "bins": [-4.21484375, -4.085693359375, -3.95654296875, -3.827392578125, -3.6982421875, -3.569091796875, -3.43994140625, -3.310791015625, -3.181640625, -3.052490234375, -2.92333984375, -2.794189453125, -2.6650390625, -2.535888671875, -2.40673828125, -2.277587890625, -2.1484375, -2.019287109375, -1.89013671875, -1.760986328125, -1.6318359375, -1.502685546875, -1.37353515625, -1.244384765625, -1.115234375, -0.986083984375, -0.85693359375, -0.727783203125, -0.5986328125, -0.469482421875, -0.34033203125, -0.211181640625, -0.08203125, 0.047119140625, 0.17626953125, 0.305419921875, 0.4345703125, 0.563720703125, 0.69287109375, 0.822021484375, 0.951171875, 1.080322265625, 1.20947265625, 1.338623046875, 1.4677734375, 1.596923828125, 1.72607421875, 1.855224609375, 1.984375, 2.113525390625, 2.24267578125, 2.371826171875, 2.5009765625, 2.630126953125, 2.75927734375, 2.888427734375, 3.017578125, 3.146728515625, 3.27587890625, 3.405029296875, 3.5341796875, 3.663330078125, 3.79248046875, 3.921630859375, 4.05078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 6.0, 9.0, 4.0, 6.0, 14.0, 12.0, 10.0, 9.0, 13.0, 15.0, 16.0, 19.0, 15.0, 32.0, 23.0, 31.0, 36.0, 31.0, 26.0, 31.0, 39.0, 29.0, 34.0, 34.0, 34.0, 31.0, 33.0, 39.0, 35.0, 34.0, 29.0, 25.0, 27.0, 21.0, 16.0, 30.0, 14.0, 19.0, 20.0, 17.0, 18.0, 13.0, 10.0, 5.0, 3.0, 4.0, 4.0, 4.0, 3.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-25.640625, -24.81689453125, -23.9931640625, -23.16943359375, -22.345703125, -21.52197265625, -20.6982421875, -19.87451171875, -19.05078125, -18.22705078125, -17.4033203125, -16.57958984375, -15.755859375, -14.93212890625, -14.1083984375, -13.28466796875, -12.4609375, -11.63720703125, -10.8134765625, -9.98974609375, -9.166015625, -8.34228515625, -7.5185546875, -6.69482421875, -5.87109375, -5.04736328125, -4.2236328125, -3.39990234375, -2.576171875, -1.75244140625, -0.9287109375, -0.10498046875, 0.71875, 1.54248046875, 2.3662109375, 3.18994140625, 4.013671875, 4.83740234375, 5.6611328125, 6.48486328125, 7.30859375, 8.13232421875, 8.9560546875, 9.77978515625, 10.603515625, 11.42724609375, 12.2509765625, 13.07470703125, 13.8984375, 14.72216796875, 15.5458984375, 16.36962890625, 17.193359375, 18.01708984375, 18.8408203125, 19.66455078125, 20.48828125, 21.31201171875, 22.1357421875, 22.95947265625, 23.783203125, 24.60693359375, 25.4306640625, 26.25439453125, 27.078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 10.0, 16.0, 17.0, 32.0, 34.0, 46.0, 81.0, 123.0, 163.0, 287.0, 421.0, 631.0, 928.0, 1429.0, 2180.0, 3225.0, 4888.0, 7515.0, 11999.0, 19782.0, 39064.0, 718082.0, 166016.0, 27747.0, 15841.0, 9640.0, 6323.0, 4144.0, 2623.0, 1816.0, 1132.0, 790.0, 503.0, 362.0, 222.0, 170.0, 100.0, 44.0, 42.0, 34.0, 24.0, 9.0, 7.0, 8.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6484375, -10.2784423828125, -9.908447265625, -9.5384521484375, -9.16845703125, -8.7984619140625, -8.428466796875, -8.0584716796875, -7.6884765625, -7.3184814453125, -6.948486328125, -6.5784912109375, -6.20849609375, -5.8385009765625, -5.468505859375, -5.0985107421875, -4.728515625, -4.3585205078125, -3.988525390625, -3.6185302734375, -3.24853515625, -2.8785400390625, -2.508544921875, -2.1385498046875, -1.7685546875, -1.3985595703125, -1.028564453125, -0.6585693359375, -0.28857421875, 0.0814208984375, 0.451416015625, 0.8214111328125, 1.19140625, 1.5614013671875, 1.931396484375, 2.3013916015625, 2.67138671875, 3.0413818359375, 3.411376953125, 3.7813720703125, 4.1513671875, 4.5213623046875, 4.891357421875, 5.2613525390625, 5.63134765625, 6.0013427734375, 6.371337890625, 6.7413330078125, 7.111328125, 7.4813232421875, 7.851318359375, 8.2213134765625, 8.59130859375, 8.9613037109375, 9.331298828125, 9.7012939453125, 10.0712890625, 10.4412841796875, 10.811279296875, 11.1812744140625, 11.55126953125, 11.9212646484375, 12.291259765625, 12.6612548828125, 13.03125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 2.0, 4.0, 6.0, 8.0, 12.0, 14.0, 8.0, 13.0, 20.0, 15.0, 19.0, 15.0, 29.0, 29.0, 33.0, 31.0, 40.0, 42.0, 33.0, 42.0, 28.0, 36.0, 44.0, 30.0, 48.0, 35.0, 31.0, 37.0, 26.0, 31.0, 39.0, 31.0, 30.0, 24.0, 19.0, 14.0, 14.0, 8.0, 8.0, 7.0, 18.0, 11.0, 10.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.203125, -18.55859375, -17.9140625, -17.26953125, -16.625, -15.98046875, -15.3359375, -14.69140625, -14.046875, -13.40234375, -12.7578125, -12.11328125, -11.46875, -10.82421875, -10.1796875, -9.53515625, -8.890625, -8.24609375, -7.6015625, -6.95703125, -6.3125, -5.66796875, -5.0234375, -4.37890625, -3.734375, -3.08984375, -2.4453125, -1.80078125, -1.15625, -0.51171875, 0.1328125, 0.77734375, 1.421875, 2.06640625, 2.7109375, 3.35546875, 4.0, 4.64453125, 5.2890625, 5.93359375, 6.578125, 7.22265625, 7.8671875, 8.51171875, 9.15625, 9.80078125, 10.4453125, 11.08984375, 11.734375, 12.37890625, 13.0234375, 13.66796875, 14.3125, 14.95703125, 15.6015625, 16.24609375, 16.890625, 17.53515625, 18.1796875, 18.82421875, 19.46875, 20.11328125, 20.7578125, 21.40234375, 22.046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 9.0, 6.0, 23.0, 27.0, 46.0, 46.0, 81.0, 108.0, 152.0, 223.0, 354.0, 626.0, 879.0, 1479.0, 2462.0, 4324.0, 7273.0, 13116.0, 24083.0, 65679.0, 839444.0, 41144.0, 20114.0, 10991.0, 6502.0, 3616.0, 2081.0, 1328.0, 818.0, 547.0, 312.0, 210.0, 141.0, 103.0, 59.0, 44.0, 19.0, 29.0, 22.0, 12.0, 10.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2685546875, -1.2267608642578125, -1.184967041015625, -1.1431732177734375, -1.10137939453125, -1.0595855712890625, -1.017791748046875, -0.9759979248046875, -0.9342041015625, -0.8924102783203125, -0.850616455078125, -0.8088226318359375, -0.76702880859375, -0.7252349853515625, -0.683441162109375, -0.6416473388671875, -0.599853515625, -0.5580596923828125, -0.516265869140625, -0.4744720458984375, -0.43267822265625, -0.3908843994140625, -0.349090576171875, -0.3072967529296875, -0.2655029296875, -0.2237091064453125, -0.181915283203125, -0.1401214599609375, -0.09832763671875, -0.0565338134765625, -0.014739990234375, 0.0270538330078125, 0.06884765625, 0.1106414794921875, 0.152435302734375, 0.1942291259765625, 0.23602294921875, 0.2778167724609375, 0.319610595703125, 0.3614044189453125, 0.4031982421875, 0.4449920654296875, 0.486785888671875, 0.5285797119140625, 0.57037353515625, 0.6121673583984375, 0.653961181640625, 0.6957550048828125, 0.737548828125, 0.7793426513671875, 0.821136474609375, 0.8629302978515625, 0.90472412109375, 0.9465179443359375, 0.988311767578125, 1.0301055908203125, 1.0718994140625, 1.1136932373046875, 1.155487060546875, 1.1972808837890625, 1.23907470703125, 1.2808685302734375, 1.322662353515625, 1.3644561767578125, 1.40625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 16.0, 12.0, 14.0, 7.0, 9.0, 26.0, 34.0, 40.0, 49.0, 62.0, 55.0, 65.0, 61.0, 75.0, 62.0, 62.0, 69.0, 60.0, 43.0, 43.0, 37.0, 29.0, 18.0, 11.0, 12.0, 10.0, 2.0, 7.0, 2.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-6.109476089477539e-05, -5.9548765420913696e-05, -5.8002769947052e-05, -5.645677447319031e-05, -5.491077899932861e-05, -5.336478352546692e-05, -5.1818788051605225e-05, -5.027279257774353e-05, -4.8726797103881836e-05, -4.718080163002014e-05, -4.563480615615845e-05, -4.408881068229675e-05, -4.254281520843506e-05, -4.0996819734573364e-05, -3.945082426071167e-05, -3.7904828786849976e-05, -3.635883331298828e-05, -3.481283783912659e-05, -3.326684236526489e-05, -3.17208468914032e-05, -3.0174851417541504e-05, -2.862885594367981e-05, -2.7082860469818115e-05, -2.553686499595642e-05, -2.3990869522094727e-05, -2.2444874048233032e-05, -2.0898878574371338e-05, -1.9352883100509644e-05, -1.780688762664795e-05, -1.6260892152786255e-05, -1.471489667892456e-05, -1.3168901205062866e-05, -1.1622905731201172e-05, -1.0076910257339478e-05, -8.530914783477783e-06, -6.984919309616089e-06, -5.4389238357543945e-06, -3.8929283618927e-06, -2.346932888031006e-06, -8.009374141693115e-07, 7.450580596923828e-07, 2.291053533554077e-06, 3.8370490074157715e-06, 5.383044481277466e-06, 6.92903995513916e-06, 8.475035429000854e-06, 1.0021030902862549e-05, 1.1567026376724243e-05, 1.3113021850585938e-05, 1.4659017324447632e-05, 1.6205012798309326e-05, 1.775100827217102e-05, 1.9297003746032715e-05, 2.084299921989441e-05, 2.2388994693756104e-05, 2.3934990167617798e-05, 2.5480985641479492e-05, 2.7026981115341187e-05, 2.857297658920288e-05, 3.0118972063064575e-05, 3.166496753692627e-05, 3.3210963010787964e-05, 3.475695848464966e-05, 3.630295395851135e-05, 3.784894943237305e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 6.0, 6.0, 12.0, 10.0, 13.0, 26.0, 51.0, 71.0, 86.0, 152.0, 229.0, 338.0, 537.0, 823.0, 1322.0, 2031.0, 3076.0, 4658.0, 7192.0, 11359.0, 16839.0, 25211.0, 37084.0, 53596.0, 75131.0, 100936.0, 124855.0, 135214.0, 121992.0, 97143.0, 71711.0, 51455.0, 35241.0, 23777.0, 15908.0, 10491.0, 6974.0, 4673.0, 2896.0, 1961.0, 1155.0, 829.0, 515.0, 330.0, 211.0, 165.0, 106.0, 53.0, 36.0, 25.0, 14.0, 18.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.90966796875, -0.8807296752929688, -0.8517913818359375, -0.8228530883789062, -0.793914794921875, -0.7649765014648438, -0.7360382080078125, -0.7070999145507812, -0.67816162109375, -0.6492233276367188, -0.6202850341796875, -0.5913467407226562, -0.562408447265625, -0.5334701538085938, -0.5045318603515625, -0.47559356689453125, -0.4466552734375, -0.41771697998046875, -0.3887786865234375, -0.35984039306640625, -0.330902099609375, -0.30196380615234375, -0.2730255126953125, -0.24408721923828125, -0.21514892578125, -0.18621063232421875, -0.1572723388671875, -0.12833404541015625, -0.099395751953125, -0.07045745849609375, -0.0415191650390625, -0.01258087158203125, 0.016357421875, 0.04529571533203125, 0.0742340087890625, 0.10317230224609375, 0.132110595703125, 0.16104888916015625, 0.1899871826171875, 0.21892547607421875, 0.24786376953125, 0.27680206298828125, 0.3057403564453125, 0.33467864990234375, 0.363616943359375, 0.39255523681640625, 0.4214935302734375, 0.45043182373046875, 0.4793701171875, 0.5083084106445312, 0.5372467041015625, 0.5661849975585938, 0.595123291015625, 0.6240615844726562, 0.6529998779296875, 0.6819381713867188, 0.71087646484375, 0.7398147583007812, 0.7687530517578125, 0.7976913452148438, 0.826629638671875, 0.8555679321289062, 0.8845062255859375, 0.9134445190429688, 0.9423828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 1.0, 5.0, 0.0, 2.0, 5.0, 4.0, 4.0, 6.0, 7.0, 7.0, 8.0, 9.0, 19.0, 17.0, 13.0, 23.0, 20.0, 19.0, 23.0, 23.0, 34.0, 35.0, 38.0, 45.0, 44.0, 53.0, 48.0, 50.0, 46.0, 47.0, 43.0, 38.0, 24.0, 32.0, 24.0, 20.0, 21.0, 9.0, 20.0, 24.0, 10.0, 11.0, 9.0, 14.0, 12.0, 5.0, 6.0, 8.0, 8.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3662109375, -0.35453033447265625, -0.3428497314453125, -0.33116912841796875, -0.319488525390625, -0.30780792236328125, -0.2961273193359375, -0.28444671630859375, -0.27276611328125, -0.26108551025390625, -0.2494049072265625, -0.23772430419921875, -0.226043701171875, -0.21436309814453125, -0.2026824951171875, -0.19100189208984375, -0.1793212890625, -0.16764068603515625, -0.1559600830078125, -0.14427947998046875, -0.132598876953125, -0.12091827392578125, -0.1092376708984375, -0.09755706787109375, -0.08587646484375, -0.07419586181640625, -0.0625152587890625, -0.05083465576171875, -0.039154052734375, -0.02747344970703125, -0.0157928466796875, -0.00411224365234375, 0.007568359375, 0.01924896240234375, 0.0309295654296875, 0.04261016845703125, 0.054290771484375, 0.06597137451171875, 0.0776519775390625, 0.08933258056640625, 0.10101318359375, 0.11269378662109375, 0.1243743896484375, 0.13605499267578125, 0.147735595703125, 0.15941619873046875, 0.1710968017578125, 0.18277740478515625, 0.1944580078125, 0.20613861083984375, 0.2178192138671875, 0.22949981689453125, 0.241180419921875, 0.25286102294921875, 0.2645416259765625, 0.27622222900390625, 0.28790283203125, 0.29958343505859375, 0.3112640380859375, 0.32294464111328125, 0.334625244140625, 0.34630584716796875, 0.3579864501953125, 0.36966705322265625, 0.38134765625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 7.0, 7.0, 8.0, 15.0, 10.0, 8.0, 22.0, 17.0, 23.0, 28.0, 23.0, 22.0, 32.0, 42.0, 33.0, 30.0, 24.0, 36.0, 27.0, 49.0, 46.0, 32.0, 28.0, 33.0, 40.0, 44.0, 45.0, 47.0, 37.0, 28.0, 18.0, 20.0, 15.0, 34.0, 12.0, 16.0, 14.0, 3.0, 9.0, 9.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.501680374145508, -25.635757446289062, -24.769834518432617, -23.903911590576172, -23.037986755371094, -22.17206573486328, -21.306140899658203, -20.440217971801758, -19.574295043945312, -18.708372116088867, -17.842449188232422, -16.976526260375977, -16.11060333251953, -15.24467945098877, -14.378755569458008, -13.512832641601562, -12.646909713745117, -11.780986785888672, -10.915063858032227, -10.049139976501465, -9.18321704864502, -8.317294120788574, -7.451370716094971, -6.585447311401367, -5.719524383544922, -4.853601455688477, -3.987678050994873, -3.1217548847198486, -2.255831718444824, -1.389908790588379, -0.5239853858947754, 0.3419380187988281, 1.2078609466552734, 2.073784112930298, 2.9397072792053223, 3.8056304454803467, 4.671553611755371, 5.537476539611816, 6.40339994430542, 7.269323348999023, 8.135246276855469, 9.001169204711914, 9.86709213256836, 10.733016014099121, 11.598938941955566, 12.464861869812012, 13.330785751342773, 14.196708679199219, 15.062631607055664, 15.92855453491211, 16.794477462768555, 17.660400390625, 18.526325225830078, 19.39224624633789, 20.25817108154297, 21.124094009399414, 21.99001693725586, 22.855939865112305, 23.72186279296875, 24.587785720825195, 25.45370864868164, 26.31963348388672, 27.185556411743164, 28.05147933959961, 28.917402267456055]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 5.0, 9.0, 4.0, 6.0, 14.0, 12.0, 11.0, 8.0, 14.0, 13.0, 17.0, 20.0, 13.0, 29.0, 26.0, 27.0, 37.0, 32.0, 29.0, 29.0, 35.0, 34.0, 36.0, 31.0, 35.0, 28.0, 31.0, 42.0, 38.0, 36.0, 25.0, 25.0, 30.0, 20.0, 17.0, 24.0, 19.0, 18.0, 17.0, 18.0, 19.0, 14.0, 11.0, 4.0, 4.0, 4.0, 3.0, 4.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-25.635940551757812, -24.813968658447266, -23.99199676513672, -23.170024871826172, -22.348052978515625, -21.526081085205078, -20.70410919189453, -19.882137298583984, -19.060165405273438, -18.23819351196289, -17.416221618652344, -16.594249725341797, -15.77227783203125, -14.950305938720703, -14.12833309173584, -13.306361198425293, -12.48438835144043, -11.662416458129883, -10.840444564819336, -10.018472671508789, -9.196500778198242, -8.374528884887695, -7.552556037902832, -6.730584144592285, -5.908612251281738, -5.086640357971191, -4.2646684646606445, -3.4426960945129395, -2.6207242012023926, -1.7987523078918457, -0.9767799377441406, -0.15480804443359375, 0.6671638488769531, 1.4891358613967896, 2.311107873916626, 3.133080005645752, 3.955051898956299, 4.777023792266846, 5.598996162414551, 6.420968055725098, 7.2429399490356445, 8.064911842346191, 8.886883735656738, 9.708856582641602, 10.530828475952148, 11.352800369262695, 12.174772262573242, 12.996744155883789, 13.818716049194336, 14.640687942504883, 15.46265983581543, 16.284631729125977, 17.106603622436523, 17.92857551574707, 18.75054931640625, 19.572521209716797, 20.394493103027344, 21.21646499633789, 22.038436889648438, 22.860408782958984, 23.68238067626953, 24.504352569580078, 25.326324462890625, 26.148296356201172, 26.97026824951172]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 17.0, 29.0, 43.0, 87.0, 130.0, 193.0, 344.0, 572.0, 906.0, 1442.0, 2210.0, 3319.0, 5134.0, 7567.0, 11031.0, 15485.0, 21500.0, 28888.0, 38038.0, 48850.0, 59517.0, 69055.0, 78258.0, 83752.0, 86155.0, 84673.0, 78913.0, 69911.0, 60473.0, 49631.0, 39438.0, 30166.0, 22501.0, 16242.0, 11342.0, 7754.0, 5313.0, 3530.0, 2215.0, 1485.0, 942.0, 576.0, 358.0, 235.0, 147.0, 70.0, 50.0, 24.0, 23.0, 11.0, 2.0, 3.0, 4.0, 2.0], "bins": [-15.90625, -15.4459228515625, -14.985595703125, -14.5252685546875, -14.06494140625, -13.6046142578125, -13.144287109375, -12.6839599609375, -12.2236328125, -11.7633056640625, -11.302978515625, -10.8426513671875, -10.38232421875, -9.9219970703125, -9.461669921875, -9.0013427734375, -8.541015625, -8.0806884765625, -7.620361328125, -7.1600341796875, -6.69970703125, -6.2393798828125, -5.779052734375, -5.3187255859375, -4.8583984375, -4.3980712890625, -3.937744140625, -3.4774169921875, -3.01708984375, -2.5567626953125, -2.096435546875, -1.6361083984375, -1.17578125, -0.7154541015625, -0.255126953125, 0.2052001953125, 0.66552734375, 1.1258544921875, 1.586181640625, 2.0465087890625, 2.5068359375, 2.9671630859375, 3.427490234375, 3.8878173828125, 4.34814453125, 4.8084716796875, 5.268798828125, 5.7291259765625, 6.189453125, 6.6497802734375, 7.110107421875, 7.5704345703125, 8.03076171875, 8.4910888671875, 8.951416015625, 9.4117431640625, 9.8720703125, 10.3323974609375, 10.792724609375, 11.2530517578125, 11.71337890625, 12.1737060546875, 12.634033203125, 13.0943603515625, 13.5546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 11.0, 2.0, 6.0, 13.0, 16.0, 9.0, 6.0, 14.0, 14.0, 18.0, 18.0, 15.0, 28.0, 24.0, 30.0, 38.0, 31.0, 29.0, 30.0, 29.0, 38.0, 32.0, 35.0, 32.0, 29.0, 34.0, 38.0, 36.0, 39.0, 25.0, 29.0, 22.0, 22.0, 20.0, 21.0, 24.0, 14.0, 20.0, 13.0, 24.0, 11.0, 14.0, 3.0, 6.0, 3.0, 1.0, 6.0, 5.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-24.9375, -24.14013671875, -23.3427734375, -22.54541015625, -21.748046875, -20.95068359375, -20.1533203125, -19.35595703125, -18.55859375, -17.76123046875, -16.9638671875, -16.16650390625, -15.369140625, -14.57177734375, -13.7744140625, -12.97705078125, -12.1796875, -11.38232421875, -10.5849609375, -9.78759765625, -8.990234375, -8.19287109375, -7.3955078125, -6.59814453125, -5.80078125, -5.00341796875, -4.2060546875, -3.40869140625, -2.611328125, -1.81396484375, -1.0166015625, -0.21923828125, 0.578125, 1.37548828125, 2.1728515625, 2.97021484375, 3.767578125, 4.56494140625, 5.3623046875, 6.15966796875, 6.95703125, 7.75439453125, 8.5517578125, 9.34912109375, 10.146484375, 10.94384765625, 11.7412109375, 12.53857421875, 13.3359375, 14.13330078125, 14.9306640625, 15.72802734375, 16.525390625, 17.32275390625, 18.1201171875, 18.91748046875, 19.71484375, 20.51220703125, 21.3095703125, 22.10693359375, 22.904296875, 23.70166015625, 24.4990234375, 25.29638671875, 26.09375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 11.0, 14.0, 27.0, 34.0, 55.0, 98.0, 145.0, 245.0, 342.0, 662.0, 1036.0, 1689.0, 2598.0, 3894.0, 5772.0, 8796.0, 12778.0, 17930.0, 25001.0, 33749.0, 43704.0, 55106.0, 65558.0, 76326.0, 83754.0, 87760.0, 88021.0, 82991.0, 75755.0, 65311.0, 53818.0, 43464.0, 32894.0, 24586.0, 17423.0, 12440.0, 8575.0, 5707.0, 3729.0, 2444.0, 1529.0, 1048.0, 688.0, 403.0, 253.0, 159.0, 95.0, 58.0, 39.0, 20.0, 11.0, 9.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-14.484375, -14.03125, -13.578125, -13.125, -12.671875, -12.21875, -11.765625, -11.3125, -10.859375, -10.40625, -9.953125, -9.5, -9.046875, -8.59375, -8.140625, -7.6875, -7.234375, -6.78125, -6.328125, -5.875, -5.421875, -4.96875, -4.515625, -4.0625, -3.609375, -3.15625, -2.703125, -2.25, -1.796875, -1.34375, -0.890625, -0.4375, 0.015625, 0.46875, 0.921875, 1.375, 1.828125, 2.28125, 2.734375, 3.1875, 3.640625, 4.09375, 4.546875, 5.0, 5.453125, 5.90625, 6.359375, 6.8125, 7.265625, 7.71875, 8.171875, 8.625, 9.078125, 9.53125, 9.984375, 10.4375, 10.890625, 11.34375, 11.796875, 12.25, 12.703125, 13.15625, 13.609375, 14.0625, 14.515625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 4.0, 8.0, 8.0, 7.0, 7.0, 8.0, 17.0, 15.0, 11.0, 24.0, 23.0, 27.0, 22.0, 31.0, 37.0, 33.0, 38.0, 24.0, 41.0, 44.0, 46.0, 47.0, 31.0, 46.0, 35.0, 33.0, 44.0, 27.0, 29.0, 31.0, 22.0, 31.0, 14.0, 19.0, 25.0, 20.0, 7.0, 10.0, 6.0, 14.0, 4.0, 5.0, 4.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.1875, -18.5791015625, -17.970703125, -17.3623046875, -16.75390625, -16.1455078125, -15.537109375, -14.9287109375, -14.3203125, -13.7119140625, -13.103515625, -12.4951171875, -11.88671875, -11.2783203125, -10.669921875, -10.0615234375, -9.453125, -8.8447265625, -8.236328125, -7.6279296875, -7.01953125, -6.4111328125, -5.802734375, -5.1943359375, -4.5859375, -3.9775390625, -3.369140625, -2.7607421875, -2.15234375, -1.5439453125, -0.935546875, -0.3271484375, 0.28125, 0.8896484375, 1.498046875, 2.1064453125, 2.71484375, 3.3232421875, 3.931640625, 4.5400390625, 5.1484375, 5.7568359375, 6.365234375, 6.9736328125, 7.58203125, 8.1904296875, 8.798828125, 9.4072265625, 10.015625, 10.6240234375, 11.232421875, 11.8408203125, 12.44921875, 13.0576171875, 13.666015625, 14.2744140625, 14.8828125, 15.4912109375, 16.099609375, 16.7080078125, 17.31640625, 17.9248046875, 18.533203125, 19.1416015625, 19.75]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 7.0, 0.0, 6.0, 8.0, 6.0, 13.0, 14.0, 27.0, 47.0, 56.0, 79.0, 164.0, 244.0, 409.0, 709.0, 1226.0, 1960.0, 3440.0, 6121.0, 10144.0, 17177.0, 27282.0, 41218.0, 60208.0, 80591.0, 101127.0, 114787.0, 120698.0, 114869.0, 100015.0, 78834.0, 58996.0, 40670.0, 26423.0, 16771.0, 9979.0, 5915.0, 3465.0, 1978.0, 1152.0, 689.0, 412.0, 235.0, 140.0, 85.0, 54.0, 41.0, 21.0, 18.0, 14.0, 9.0, 6.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.3046875, -8.0489501953125, -7.793212890625, -7.5374755859375, -7.28173828125, -7.0260009765625, -6.770263671875, -6.5145263671875, -6.2587890625, -6.0030517578125, -5.747314453125, -5.4915771484375, -5.23583984375, -4.9801025390625, -4.724365234375, -4.4686279296875, -4.212890625, -3.9571533203125, -3.701416015625, -3.4456787109375, -3.18994140625, -2.9342041015625, -2.678466796875, -2.4227294921875, -2.1669921875, -1.9112548828125, -1.655517578125, -1.3997802734375, -1.14404296875, -0.8883056640625, -0.632568359375, -0.3768310546875, -0.12109375, 0.1346435546875, 0.390380859375, 0.6461181640625, 0.90185546875, 1.1575927734375, 1.413330078125, 1.6690673828125, 1.9248046875, 2.1805419921875, 2.436279296875, 2.6920166015625, 2.94775390625, 3.2034912109375, 3.459228515625, 3.7149658203125, 3.970703125, 4.2264404296875, 4.482177734375, 4.7379150390625, 4.99365234375, 5.2493896484375, 5.505126953125, 5.7608642578125, 6.0166015625, 6.2723388671875, 6.528076171875, 6.7838134765625, 7.03955078125, 7.2952880859375, 7.551025390625, 7.8067626953125, 8.0625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 8.0, 3.0, 3.0, 7.0, 6.0, 8.0, 14.0, 17.0, 18.0, 17.0, 27.0, 21.0, 42.0, 47.0, 32.0, 47.0, 60.0, 52.0, 50.0, 55.0, 53.0, 60.0, 45.0, 49.0, 47.0, 35.0, 39.0, 24.0, 18.0, 15.0, 22.0, 10.0, 14.0, 10.0, 7.0, 3.0, 6.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0012569427490234375, -0.0012216418981552124, -0.0011863410472869873, -0.0011510401964187622, -0.0011157393455505371, -0.001080438494682312, -0.001045137643814087, -0.0010098367929458618, -0.0009745359420776367, -0.0009392350912094116, -0.0009039342403411865, -0.0008686333894729614, -0.0008333325386047363, -0.0007980316877365112, -0.0007627308368682861, -0.000727429986000061, -0.0006921291351318359, -0.0006568282842636108, -0.0006215274333953857, -0.0005862265825271606, -0.0005509257316589355, -0.0005156248807907104, -0.00048032402992248535, -0.00044502317905426025, -0.00040972232818603516, -0.00037442147731781006, -0.00033912062644958496, -0.00030381977558135986, -0.00026851892471313477, -0.00023321807384490967, -0.00019791722297668457, -0.00016261637210845947, -0.00012731552124023438, -9.201467037200928e-05, -5.671381950378418e-05, -2.1412968635559082e-05, 1.3887882232666016e-05, 4.918873310089111e-05, 8.448958396911621e-05, 0.00011979043483734131, 0.0001550912857055664, 0.0001903921365737915, 0.0002256929874420166, 0.0002609938383102417, 0.0002962946891784668, 0.0003315955400466919, 0.000366896390914917, 0.0004021972417831421, 0.0004374980926513672, 0.0004727989435195923, 0.0005080997943878174, 0.0005434006452560425, 0.0005787014961242676, 0.0006140023469924927, 0.0006493031978607178, 0.0006846040487289429, 0.000719904899597168, 0.0007552057504653931, 0.0007905066013336182, 0.0008258074522018433, 0.0008611083030700684, 0.0008964091539382935, 0.0009317100048065186, 0.0009670108556747437, 0.0010023117065429688]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 12.0, 18.0, 32.0, 46.0, 69.0, 117.0, 145.0, 262.0, 446.0, 762.0, 1369.0, 2410.0, 4343.0, 7936.0, 13776.0, 24698.0, 40185.0, 62458.0, 89809.0, 116271.0, 134072.0, 137145.0, 124200.0, 100007.0, 71648.0, 47663.0, 29335.0, 17126.0, 9835.0, 5299.0, 3002.0, 1714.0, 928.0, 534.0, 327.0, 205.0, 118.0, 69.0, 44.0, 29.0, 17.0, 19.0, 10.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.25, -9.9212646484375, -9.592529296875, -9.2637939453125, -8.93505859375, -8.6063232421875, -8.277587890625, -7.9488525390625, -7.6201171875, -7.2913818359375, -6.962646484375, -6.6339111328125, -6.30517578125, -5.9764404296875, -5.647705078125, -5.3189697265625, -4.990234375, -4.6614990234375, -4.332763671875, -4.0040283203125, -3.67529296875, -3.3465576171875, -3.017822265625, -2.6890869140625, -2.3603515625, -2.0316162109375, -1.702880859375, -1.3741455078125, -1.04541015625, -0.7166748046875, -0.387939453125, -0.0592041015625, 0.26953125, 0.5982666015625, 0.927001953125, 1.2557373046875, 1.58447265625, 1.9132080078125, 2.241943359375, 2.5706787109375, 2.8994140625, 3.2281494140625, 3.556884765625, 3.8856201171875, 4.21435546875, 4.5430908203125, 4.871826171875, 5.2005615234375, 5.529296875, 5.8580322265625, 6.186767578125, 6.5155029296875, 6.84423828125, 7.1729736328125, 7.501708984375, 7.8304443359375, 8.1591796875, 8.4879150390625, 8.816650390625, 9.1453857421875, 9.47412109375, 9.8028564453125, 10.131591796875, 10.4603271484375, 10.7890625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 9.0, 3.0, 12.0, 6.0, 12.0, 15.0, 15.0, 18.0, 20.0, 19.0, 22.0, 36.0, 35.0, 32.0, 43.0, 46.0, 57.0, 56.0, 52.0, 62.0, 51.0, 49.0, 55.0, 46.0, 30.0, 41.0, 26.0, 23.0, 17.0, 14.0, 14.0, 12.0, 12.0, 9.0, 5.0, 9.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.95703125, -3.81304931640625, -3.6690673828125, -3.52508544921875, -3.381103515625, -3.23712158203125, -3.0931396484375, -2.94915771484375, -2.80517578125, -2.66119384765625, -2.5172119140625, -2.37322998046875, -2.229248046875, -2.08526611328125, -1.9412841796875, -1.79730224609375, -1.6533203125, -1.50933837890625, -1.3653564453125, -1.22137451171875, -1.077392578125, -0.93341064453125, -0.7894287109375, -0.64544677734375, -0.50146484375, -0.35748291015625, -0.2135009765625, -0.06951904296875, 0.074462890625, 0.21844482421875, 0.3624267578125, 0.50640869140625, 0.650390625, 0.79437255859375, 0.9383544921875, 1.08233642578125, 1.226318359375, 1.37030029296875, 1.5142822265625, 1.65826416015625, 1.80224609375, 1.94622802734375, 2.0902099609375, 2.23419189453125, 2.378173828125, 2.52215576171875, 2.6661376953125, 2.81011962890625, 2.9541015625, 3.09808349609375, 3.2420654296875, 3.38604736328125, 3.530029296875, 3.67401123046875, 3.8179931640625, 3.96197509765625, 4.10595703125, 4.24993896484375, 4.3939208984375, 4.53790283203125, 4.681884765625, 4.82586669921875, 4.9698486328125, 5.11383056640625, 5.2578125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 4.0, 4.0, 8.0, 3.0, 8.0, 8.0, 11.0, 6.0, 16.0, 13.0, 12.0, 24.0, 26.0, 17.0, 25.0, 27.0, 31.0, 44.0, 39.0, 29.0, 41.0, 33.0, 31.0, 33.0, 40.0, 34.0, 40.0, 36.0, 34.0, 41.0, 33.0, 35.0, 39.0, 29.0, 20.0, 26.0, 17.0, 19.0, 9.0, 18.0, 8.0, 12.0, 8.0, 2.0, 5.0, 5.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-25.911949157714844, -25.077377319335938, -24.2428035736084, -23.408231735229492, -22.573657989501953, -21.739086151123047, -20.904512405395508, -20.0699405670166, -19.235366821289062, -18.400794982910156, -17.566221237182617, -16.73164939880371, -15.897075653076172, -15.062503814697266, -14.227930068969727, -13.39335823059082, -12.558785438537598, -11.724212646484375, -10.889639854431152, -10.05506706237793, -9.220494270324707, -8.385921478271484, -7.55134916305542, -6.716776371002197, -5.882203578948975, -5.047630786895752, -4.213057994842529, -3.3784854412078857, -2.543912649154663, -1.7093400955200195, -0.8747673034667969, -0.04019451141357422, 0.7943782806396484, 1.628951072692871, 2.4635238647460938, 3.2980964183807373, 4.132669448852539, 4.9672417640686035, 5.801814556121826, 6.636387348175049, 7.4709601402282715, 8.305532455444336, 9.140105247497559, 9.974678039550781, 10.809250831604004, 11.643823623657227, 12.47839641571045, 13.312969207763672, 14.147541999816895, 14.982114791870117, 15.81668758392334, 16.651260375976562, 17.48583221435547, 18.320405960083008, 19.154977798461914, 19.989551544189453, 20.82412338256836, 21.658695220947266, 22.493268966674805, 23.32784080505371, 24.16241455078125, 24.996986389160156, 25.831560134887695, 26.6661319732666, 27.50070571899414]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 8.0, 6.0, 4.0, 6.0, 8.0, 13.0, 17.0, 6.0, 17.0, 18.0, 16.0, 22.0, 21.0, 27.0, 29.0, 35.0, 27.0, 32.0, 51.0, 41.0, 37.0, 37.0, 34.0, 38.0, 25.0, 38.0, 28.0, 29.0, 35.0, 36.0, 28.0, 28.0, 34.0, 25.0, 21.0, 21.0, 21.0, 14.0, 8.0, 12.0, 6.0, 13.0, 4.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.85369110107422, -26.894153594970703, -25.934616088867188, -24.975078582763672, -24.015541076660156, -23.05600357055664, -22.096466064453125, -21.13692855834961, -20.177391052246094, -19.217853546142578, -18.258316040039062, -17.298778533935547, -16.33924102783203, -15.379703521728516, -14.420166969299316, -13.4606294631958, -12.501092910766602, -11.541555404663086, -10.58201789855957, -9.622480392456055, -8.662942886352539, -7.703405857086182, -6.743868827819824, -5.784331321716309, -4.824793815612793, -3.8652563095092773, -2.905719041824341, -1.9461817741394043, -0.9866442680358887, -0.027106761932373047, 0.9324302673339844, 1.8919677734375, 2.8515052795410156, 3.8110427856445312, 4.770580291748047, 5.730117321014404, 6.68965482711792, 7.6491923332214355, 8.608729362487793, 9.568266868591309, 10.527804374694824, 11.48734188079834, 12.446879386901855, 13.406415939331055, 14.36595344543457, 15.325490951538086, 16.2850284576416, 17.244565963745117, 18.204103469848633, 19.16364097595215, 20.123178482055664, 21.08271598815918, 22.042253494262695, 23.00179100036621, 23.961326599121094, 24.92086410522461, 25.880401611328125, 26.83993911743164, 27.799476623535156, 28.759014129638672, 29.718551635742188, 30.678089141845703, 31.63762664794922, 32.597164154052734, 33.55670166015625]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 6.0, 17.0, 26.0, 48.0, 65.0, 152.0, 192.0, 389.0, 638.0, 1035.0, 1739.0, 2819.0, 4554.0, 7661.0, 12053.0, 19075.0, 29705.0, 44840.0, 66813.0, 97806.0, 137939.0, 187777.0, 242877.0, 301460.0, 353704.0, 388907.0, 401987.0, 389910.0, 352409.0, 299327.0, 241442.0, 184776.0, 135796.0, 95457.0, 66050.0, 44629.0, 29171.0, 18794.0, 11884.0, 7657.0, 4759.0, 2988.0, 1882.0, 1211.0, 730.0, 427.0, 261.0, 188.0, 107.0, 66.0, 30.0, 18.0, 20.0, 7.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0], "bins": [-19.03125, -18.406982421875, -17.78271484375, -17.158447265625, -16.5341796875, -15.909912109375, -15.28564453125, -14.661376953125, -14.037109375, -13.412841796875, -12.78857421875, -12.164306640625, -11.5400390625, -10.915771484375, -10.29150390625, -9.667236328125, -9.04296875, -8.418701171875, -7.79443359375, -7.170166015625, -6.5458984375, -5.921630859375, -5.29736328125, -4.673095703125, -4.048828125, -3.424560546875, -2.80029296875, -2.176025390625, -1.5517578125, -0.927490234375, -0.30322265625, 0.321044921875, 0.9453125, 1.569580078125, 2.19384765625, 2.818115234375, 3.4423828125, 4.066650390625, 4.69091796875, 5.315185546875, 5.939453125, 6.563720703125, 7.18798828125, 7.812255859375, 8.4365234375, 9.060791015625, 9.68505859375, 10.309326171875, 10.93359375, 11.557861328125, 12.18212890625, 12.806396484375, 13.4306640625, 14.054931640625, 14.67919921875, 15.303466796875, 15.927734375, 16.552001953125, 17.17626953125, 17.800537109375, 18.4248046875, 19.049072265625, 19.67333984375, 20.297607421875, 20.921875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 7.0, 4.0, 6.0, 10.0, 15.0, 12.0, 8.0, 19.0, 15.0, 15.0, 25.0, 18.0, 26.0, 36.0, 32.0, 26.0, 34.0, 50.0, 43.0, 33.0, 40.0, 35.0, 32.0, 26.0, 37.0, 32.0, 27.0, 30.0, 39.0, 26.0, 32.0, 27.0, 28.0, 24.0, 21.0, 19.0, 15.0, 9.0, 11.0, 9.0, 9.0, 4.0, 7.0, 9.0, 7.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.0625, -24.199951171875, -23.33740234375, -22.474853515625, -21.6123046875, -20.749755859375, -19.88720703125, -19.024658203125, -18.162109375, -17.299560546875, -16.43701171875, -15.574462890625, -14.7119140625, -13.849365234375, -12.98681640625, -12.124267578125, -11.26171875, -10.399169921875, -9.53662109375, -8.674072265625, -7.8115234375, -6.948974609375, -6.08642578125, -5.223876953125, -4.361328125, -3.498779296875, -2.63623046875, -1.773681640625, -0.9111328125, -0.048583984375, 0.81396484375, 1.676513671875, 2.5390625, 3.401611328125, 4.26416015625, 5.126708984375, 5.9892578125, 6.851806640625, 7.71435546875, 8.576904296875, 9.439453125, 10.302001953125, 11.16455078125, 12.027099609375, 12.8896484375, 13.752197265625, 14.61474609375, 15.477294921875, 16.33984375, 17.202392578125, 18.06494140625, 18.927490234375, 19.7900390625, 20.652587890625, 21.51513671875, 22.377685546875, 23.240234375, 24.102783203125, 24.96533203125, 25.827880859375, 26.6904296875, 27.552978515625, 28.41552734375, 29.278076171875, 30.140625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 7.0, 16.0, 41.0, 57.0, 97.0, 180.0, 278.0, 490.0, 833.0, 1297.0, 2189.0, 3690.0, 5940.0, 9439.0, 15027.0, 23497.0, 35960.0, 53630.0, 77549.0, 110396.0, 149884.0, 196326.0, 246677.0, 297622.0, 339310.0, 366745.0, 375410.0, 363799.0, 333264.0, 290457.0, 240090.0, 188820.0, 143323.0, 104294.0, 74053.0, 50528.0, 33590.0, 22296.0, 14192.0, 8863.0, 5552.0, 3435.0, 2075.0, 1264.0, 707.0, 453.0, 275.0, 167.0, 85.0, 52.0, 36.0, 19.0, 10.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.6875, -19.06103515625, -18.4345703125, -17.80810546875, -17.181640625, -16.55517578125, -15.9287109375, -15.30224609375, -14.67578125, -14.04931640625, -13.4228515625, -12.79638671875, -12.169921875, -11.54345703125, -10.9169921875, -10.29052734375, -9.6640625, -9.03759765625, -8.4111328125, -7.78466796875, -7.158203125, -6.53173828125, -5.9052734375, -5.27880859375, -4.65234375, -4.02587890625, -3.3994140625, -2.77294921875, -2.146484375, -1.52001953125, -0.8935546875, -0.26708984375, 0.359375, 0.98583984375, 1.6123046875, 2.23876953125, 2.865234375, 3.49169921875, 4.1181640625, 4.74462890625, 5.37109375, 5.99755859375, 6.6240234375, 7.25048828125, 7.876953125, 8.50341796875, 9.1298828125, 9.75634765625, 10.3828125, 11.00927734375, 11.6357421875, 12.26220703125, 12.888671875, 13.51513671875, 14.1416015625, 14.76806640625, 15.39453125, 16.02099609375, 16.6474609375, 17.27392578125, 17.900390625, 18.52685546875, 19.1533203125, 19.77978515625, 20.40625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 7.0, 6.0, 14.0, 19.0, 19.0, 21.0, 25.0, 32.0, 60.0, 60.0, 75.0, 99.0, 90.0, 119.0, 127.0, 143.0, 185.0, 149.0, 181.0, 208.0, 189.0, 231.0, 202.0, 196.0, 180.0, 180.0, 162.0, 169.0, 144.0, 134.0, 134.0, 118.0, 72.0, 63.0, 56.0, 40.0, 40.0, 26.0, 27.0, 20.0, 13.0, 17.0, 9.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2265625, -12.8109130859375, -12.395263671875, -11.9796142578125, -11.56396484375, -11.1483154296875, -10.732666015625, -10.3170166015625, -9.9013671875, -9.4857177734375, -9.070068359375, -8.6544189453125, -8.23876953125, -7.8231201171875, -7.407470703125, -6.9918212890625, -6.576171875, -6.1605224609375, -5.744873046875, -5.3292236328125, -4.91357421875, -4.4979248046875, -4.082275390625, -3.6666259765625, -3.2509765625, -2.8353271484375, -2.419677734375, -2.0040283203125, -1.58837890625, -1.1727294921875, -0.757080078125, -0.3414306640625, 0.07421875, 0.4898681640625, 0.905517578125, 1.3211669921875, 1.73681640625, 2.1524658203125, 2.568115234375, 2.9837646484375, 3.3994140625, 3.8150634765625, 4.230712890625, 4.6463623046875, 5.06201171875, 5.4776611328125, 5.893310546875, 6.3089599609375, 6.724609375, 7.1402587890625, 7.555908203125, 7.9715576171875, 8.38720703125, 8.8028564453125, 9.218505859375, 9.6341552734375, 10.0498046875, 10.4654541015625, 10.881103515625, 11.2967529296875, 11.71240234375, 12.1280517578125, 12.543701171875, 12.9593505859375, 13.375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 3.0, 8.0, 3.0, 11.0, 21.0, 20.0, 17.0, 25.0, 28.0, 31.0, 31.0, 24.0, 34.0, 41.0, 33.0, 37.0, 47.0, 48.0, 41.0, 46.0, 40.0, 48.0, 38.0, 43.0, 39.0, 24.0, 41.0, 34.0, 25.0, 11.0, 23.0, 15.0, 13.0, 12.0, 12.0, 4.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.273366928100586, -30.314577102661133, -29.355789184570312, -28.39699935913086, -27.43821144104004, -26.479421615600586, -25.520633697509766, -24.561843872070312, -23.60305404663086, -22.644264221191406, -21.685476303100586, -20.726686477661133, -19.767898559570312, -18.80910873413086, -17.850318908691406, -16.891530990600586, -15.932743072509766, -14.973954200744629, -14.015165328979492, -13.056375503540039, -12.097587585449219, -11.138797760009766, -10.180008888244629, -9.221220016479492, -8.262431144714355, -7.303642272949219, -6.344853401184082, -5.386064052581787, -4.42727518081665, -3.4684863090515137, -2.5096969604492188, -1.550908088684082, -0.5921192169189453, 0.36666977405548096, 1.3254587650299072, 2.284247875213623, 3.2430367469787598, 4.2018256187438965, 5.160614967346191, 6.119403839111328, 7.078192710876465, 8.036981582641602, 8.995770454406738, 9.954559326171875, 10.913349151611328, 11.872137069702148, 12.830926895141602, 13.789715766906738, 14.748504638671875, 15.707293510437012, 16.66608238220215, 17.6248722076416, 18.583660125732422, 19.542449951171875, 20.501239776611328, 21.46002769470215, 22.41881561279297, 23.377605438232422, 24.336393356323242, 25.295183181762695, 26.253971099853516, 27.21276092529297, 28.171550750732422, 29.130338668823242, 30.089128494262695]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 4.0, 8.0, 5.0, 5.0, 15.0, 17.0, 17.0, 19.0, 15.0, 25.0, 23.0, 17.0, 24.0, 29.0, 28.0, 30.0, 41.0, 31.0, 45.0, 40.0, 40.0, 44.0, 53.0, 51.0, 38.0, 34.0, 29.0, 31.0, 24.0, 24.0, 31.0, 26.0, 19.0, 30.0, 16.0, 11.0, 10.0, 11.0, 9.0, 5.0, 8.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.164623260498047, -28.139732360839844, -27.114843368530273, -26.089954376220703, -25.0650634765625, -24.040172576904297, -23.015283584594727, -21.990394592285156, -20.965503692626953, -19.94061279296875, -18.91572380065918, -17.89083480834961, -16.865943908691406, -15.84105396270752, -14.816164016723633, -13.791274070739746, -12.76638412475586, -11.741494178771973, -10.716604232788086, -9.6917142868042, -8.666824340820312, -7.641934394836426, -6.617044448852539, -5.592154502868652, -4.567264556884766, -3.542374610900879, -2.517484664916992, -1.4925947189331055, -0.46770477294921875, 0.557185173034668, 1.5820751190185547, 2.6069650650024414, 3.631855010986328, 4.656744956970215, 5.681634902954102, 6.706524848937988, 7.731414794921875, 8.756304740905762, 9.781194686889648, 10.806084632873535, 11.830974578857422, 12.855864524841309, 13.880754470825195, 14.905644416809082, 15.930534362792969, 16.955425262451172, 17.980314254760742, 19.005203247070312, 20.030094146728516, 21.05498504638672, 22.07987403869629, 23.10476303100586, 24.129653930664062, 25.154544830322266, 26.179433822631836, 27.204322814941406, 28.22921371459961, 29.254104614257812, 30.278993606567383, 31.303882598876953, 32.328773498535156, 33.35366439819336, 34.37855529785156, 35.4034423828125, 36.4283332824707]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 11.0, 17.0, 23.0, 48.0, 71.0, 78.0, 140.0, 227.0, 379.0, 523.0, 842.0, 1405.0, 2080.0, 3377.0, 5309.0, 8279.0, 12716.0, 19372.0, 28495.0, 41227.0, 56595.0, 74345.0, 92573.0, 106586.0, 112012.0, 109481.0, 96285.0, 79170.0, 60553.0, 44285.0, 31302.0, 21429.0, 14229.0, 9050.0, 5868.0, 3753.0, 2376.0, 1500.0, 906.0, 626.0, 392.0, 228.0, 134.0, 101.0, 62.0, 35.0, 24.0, 8.0, 9.0, 7.0, 6.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.03515625, -3.90753173828125, -3.7799072265625, -3.65228271484375, -3.524658203125, -3.39703369140625, -3.2694091796875, -3.14178466796875, -3.01416015625, -2.88653564453125, -2.7589111328125, -2.63128662109375, -2.503662109375, -2.37603759765625, -2.2484130859375, -2.12078857421875, -1.9931640625, -1.86553955078125, -1.7379150390625, -1.61029052734375, -1.482666015625, -1.35504150390625, -1.2274169921875, -1.09979248046875, -0.97216796875, -0.84454345703125, -0.7169189453125, -0.58929443359375, -0.461669921875, -0.33404541015625, -0.2064208984375, -0.07879638671875, 0.048828125, 0.17645263671875, 0.3040771484375, 0.43170166015625, 0.559326171875, 0.68695068359375, 0.8145751953125, 0.94219970703125, 1.06982421875, 1.19744873046875, 1.3250732421875, 1.45269775390625, 1.580322265625, 1.70794677734375, 1.8355712890625, 1.96319580078125, 2.0908203125, 2.21844482421875, 2.3460693359375, 2.47369384765625, 2.601318359375, 2.72894287109375, 2.8565673828125, 2.98419189453125, 3.11181640625, 3.23944091796875, 3.3670654296875, 3.49468994140625, 3.622314453125, 3.74993896484375, 3.8775634765625, 4.00518798828125, 4.1328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 3.0, 5.0, 7.0, 5.0, 6.0, 14.0, 18.0, 15.0, 21.0, 14.0, 27.0, 22.0, 16.0, 24.0, 27.0, 28.0, 31.0, 39.0, 33.0, 44.0, 41.0, 40.0, 43.0, 54.0, 51.0, 39.0, 33.0, 30.0, 28.0, 27.0, 23.0, 30.0, 29.0, 17.0, 29.0, 18.0, 10.0, 11.0, 10.0, 10.0, 5.0, 8.0, 6.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.15625, -28.13037109375, -27.1044921875, -26.07861328125, -25.052734375, -24.02685546875, -23.0009765625, -21.97509765625, -20.94921875, -19.92333984375, -18.8974609375, -17.87158203125, -16.845703125, -15.81982421875, -14.7939453125, -13.76806640625, -12.7421875, -11.71630859375, -10.6904296875, -9.66455078125, -8.638671875, -7.61279296875, -6.5869140625, -5.56103515625, -4.53515625, -3.50927734375, -2.4833984375, -1.45751953125, -0.431640625, 0.59423828125, 1.6201171875, 2.64599609375, 3.671875, 4.69775390625, 5.7236328125, 6.74951171875, 7.775390625, 8.80126953125, 9.8271484375, 10.85302734375, 11.87890625, 12.90478515625, 13.9306640625, 14.95654296875, 15.982421875, 17.00830078125, 18.0341796875, 19.06005859375, 20.0859375, 21.11181640625, 22.1376953125, 23.16357421875, 24.189453125, 25.21533203125, 26.2412109375, 27.26708984375, 28.29296875, 29.31884765625, 30.3447265625, 31.37060546875, 32.396484375, 33.42236328125, 34.4482421875, 35.47412109375, 36.5]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 14.0, 11.0, 19.0, 26.0, 56.0, 59.0, 105.0, 162.0, 241.0, 381.0, 531.0, 798.0, 1080.0, 1683.0, 2337.0, 3325.0, 4958.0, 7206.0, 10599.0, 16337.0, 27789.0, 153345.0, 702867.0, 50568.0, 21850.0, 13548.0, 8919.0, 6143.0, 4172.0, 2982.0, 2045.0, 1376.0, 973.0, 640.0, 452.0, 328.0, 216.0, 140.0, 96.0, 69.0, 38.0, 16.0, 22.0, 14.0, 13.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.9296875, -8.6614990234375, -8.393310546875, -8.1251220703125, -7.85693359375, -7.5887451171875, -7.320556640625, -7.0523681640625, -6.7841796875, -6.5159912109375, -6.247802734375, -5.9796142578125, -5.71142578125, -5.4432373046875, -5.175048828125, -4.9068603515625, -4.638671875, -4.3704833984375, -4.102294921875, -3.8341064453125, -3.56591796875, -3.2977294921875, -3.029541015625, -2.7613525390625, -2.4931640625, -2.2249755859375, -1.956787109375, -1.6885986328125, -1.42041015625, -1.1522216796875, -0.884033203125, -0.6158447265625, -0.34765625, -0.0794677734375, 0.188720703125, 0.4569091796875, 0.72509765625, 0.9932861328125, 1.261474609375, 1.5296630859375, 1.7978515625, 2.0660400390625, 2.334228515625, 2.6024169921875, 2.87060546875, 3.1387939453125, 3.406982421875, 3.6751708984375, 3.943359375, 4.2115478515625, 4.479736328125, 4.7479248046875, 5.01611328125, 5.2843017578125, 5.552490234375, 5.8206787109375, 6.0888671875, 6.3570556640625, 6.625244140625, 6.8934326171875, 7.16162109375, 7.4298095703125, 7.697998046875, 7.9661865234375, 8.234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 3.0, 11.0, 10.0, 11.0, 13.0, 21.0, 21.0, 20.0, 18.0, 36.0, 29.0, 27.0, 31.0, 25.0, 33.0, 41.0, 40.0, 45.0, 30.0, 34.0, 43.0, 33.0, 43.0, 47.0, 39.0, 37.0, 31.0, 17.0, 23.0, 33.0, 20.0, 29.0, 18.0, 12.0, 14.0, 12.0, 8.0, 7.0, 7.0, 10.0, 4.0, 2.0, 4.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.53125, -21.847900390625, -21.16455078125, -20.481201171875, -19.7978515625, -19.114501953125, -18.43115234375, -17.747802734375, -17.064453125, -16.381103515625, -15.69775390625, -15.014404296875, -14.3310546875, -13.647705078125, -12.96435546875, -12.281005859375, -11.59765625, -10.914306640625, -10.23095703125, -9.547607421875, -8.8642578125, -8.180908203125, -7.49755859375, -6.814208984375, -6.130859375, -5.447509765625, -4.76416015625, -4.080810546875, -3.3974609375, -2.714111328125, -2.03076171875, -1.347412109375, -0.6640625, 0.019287109375, 0.70263671875, 1.385986328125, 2.0693359375, 2.752685546875, 3.43603515625, 4.119384765625, 4.802734375, 5.486083984375, 6.16943359375, 6.852783203125, 7.5361328125, 8.219482421875, 8.90283203125, 9.586181640625, 10.26953125, 10.952880859375, 11.63623046875, 12.319580078125, 13.0029296875, 13.686279296875, 14.36962890625, 15.052978515625, 15.736328125, 16.419677734375, 17.10302734375, 17.786376953125, 18.4697265625, 19.153076171875, 19.83642578125, 20.519775390625, 21.203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 8.0, 1.0, 4.0, 2.0, 4.0, 5.0, 10.0, 16.0, 17.0, 23.0, 33.0, 44.0, 46.0, 82.0, 117.0, 143.0, 252.0, 323.0, 451.0, 687.0, 968.0, 1304.0, 1939.0, 2735.0, 3938.0, 5960.0, 8724.0, 13102.0, 20535.0, 36309.0, 753660.0, 121359.0, 25940.0, 16174.0, 10599.0, 7095.0, 4772.0, 3383.0, 2400.0, 1620.0, 1096.0, 767.0, 566.0, 383.0, 266.0, 187.0, 151.0, 82.0, 73.0, 54.0, 43.0, 38.0, 27.0, 16.0, 7.0, 6.0, 10.0, 4.0, 3.0, 4.0, 3.0, 1.0], "bins": [-1.0185546875, -0.9874420166015625, -0.956329345703125, -0.9252166748046875, -0.89410400390625, -0.8629913330078125, -0.831878662109375, -0.8007659912109375, -0.7696533203125, -0.7385406494140625, -0.707427978515625, -0.6763153076171875, -0.64520263671875, -0.6140899658203125, -0.582977294921875, -0.5518646240234375, -0.520751953125, -0.4896392822265625, -0.458526611328125, -0.4274139404296875, -0.39630126953125, -0.3651885986328125, -0.334075927734375, -0.3029632568359375, -0.2718505859375, -0.2407379150390625, -0.209625244140625, -0.1785125732421875, -0.14739990234375, -0.1162872314453125, -0.085174560546875, -0.0540618896484375, -0.02294921875, 0.0081634521484375, 0.039276123046875, 0.0703887939453125, 0.10150146484375, 0.1326141357421875, 0.163726806640625, 0.1948394775390625, 0.2259521484375, 0.2570648193359375, 0.288177490234375, 0.3192901611328125, 0.35040283203125, 0.3815155029296875, 0.412628173828125, 0.4437408447265625, 0.474853515625, 0.5059661865234375, 0.537078857421875, 0.5681915283203125, 0.59930419921875, 0.6304168701171875, 0.661529541015625, 0.6926422119140625, 0.7237548828125, 0.7548675537109375, 0.785980224609375, 0.8170928955078125, 0.84820556640625, 0.8793182373046875, 0.910430908203125, 0.9415435791015625, 0.97265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 8.0, 14.0, 18.0, 20.0, 17.0, 22.0, 30.0, 36.0, 37.0, 43.0, 50.0, 55.0, 62.0, 47.0, 46.0, 49.0, 58.0, 57.0, 51.0, 39.0, 32.0, 26.0, 28.0, 22.0, 15.0, 30.0, 16.0, 12.0, 5.0, 13.0, 10.0, 4.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.314018249511719e-05, -3.213062882423401e-05, -3.112107515335083e-05, -3.011152148246765e-05, -2.9101967811584473e-05, -2.8092414140701294e-05, -2.7082860469818115e-05, -2.6073306798934937e-05, -2.5063753128051758e-05, -2.405419945716858e-05, -2.30446457862854e-05, -2.203509211540222e-05, -2.1025538444519043e-05, -2.0015984773635864e-05, -1.9006431102752686e-05, -1.7996877431869507e-05, -1.6987323760986328e-05, -1.597777009010315e-05, -1.496821641921997e-05, -1.3958662748336792e-05, -1.2949109077453613e-05, -1.1939555406570435e-05, -1.0930001735687256e-05, -9.920448064804077e-06, -8.910894393920898e-06, -7.90134072303772e-06, -6.891787052154541e-06, -5.882233381271362e-06, -4.872679710388184e-06, -3.863126039505005e-06, -2.853572368621826e-06, -1.8440186977386475e-06, -8.344650268554688e-07, 1.7508864402770996e-07, 1.1846423149108887e-06, 2.1941959857940674e-06, 3.203749656677246e-06, 4.213303327560425e-06, 5.2228569984436035e-06, 6.232410669326782e-06, 7.241964340209961e-06, 8.25151801109314e-06, 9.261071681976318e-06, 1.0270625352859497e-05, 1.1280179023742676e-05, 1.2289732694625854e-05, 1.3299286365509033e-05, 1.4308840036392212e-05, 1.531839370727539e-05, 1.632794737815857e-05, 1.7337501049041748e-05, 1.8347054719924927e-05, 1.9356608390808105e-05, 2.0366162061691284e-05, 2.1375715732574463e-05, 2.238526940345764e-05, 2.339482307434082e-05, 2.4404376745224e-05, 2.5413930416107178e-05, 2.6423484086990356e-05, 2.7433037757873535e-05, 2.8442591428756714e-05, 2.9452145099639893e-05, 3.046169877052307e-05, 3.147125244140625e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 8.0, 16.0, 31.0, 47.0, 66.0, 103.0, 146.0, 226.0, 381.0, 539.0, 862.0, 1327.0, 2147.0, 3293.0, 4826.0, 7381.0, 11009.0, 16835.0, 24967.0, 36315.0, 53595.0, 77299.0, 106062.0, 131355.0, 141280.0, 123869.0, 94554.0, 67314.0, 46987.0, 31917.0, 21516.0, 14391.0, 9571.0, 6462.0, 4149.0, 2773.0, 1731.0, 1161.0, 708.0, 480.0, 283.0, 204.0, 137.0, 93.0, 53.0, 26.0, 23.0, 17.0, 5.0, 9.0, 4.0, 4.0, 3.0, 1.0], "bins": [-0.9873046875, -0.9585342407226562, -0.9297637939453125, -0.9009933471679688, -0.872222900390625, -0.8434524536132812, -0.8146820068359375, -0.7859115600585938, -0.75714111328125, -0.7283706665039062, -0.6996002197265625, -0.6708297729492188, -0.642059326171875, -0.6132888793945312, -0.5845184326171875, -0.5557479858398438, -0.5269775390625, -0.49820709228515625, -0.4694366455078125, -0.44066619873046875, -0.411895751953125, -0.38312530517578125, -0.3543548583984375, -0.32558441162109375, -0.29681396484375, -0.26804351806640625, -0.2392730712890625, -0.21050262451171875, -0.181732177734375, -0.15296173095703125, -0.1241912841796875, -0.09542083740234375, -0.066650390625, -0.03787994384765625, -0.0091094970703125, 0.01966094970703125, 0.048431396484375, 0.07720184326171875, 0.1059722900390625, 0.13474273681640625, 0.16351318359375, 0.19228363037109375, 0.2210540771484375, 0.24982452392578125, 0.278594970703125, 0.30736541748046875, 0.3361358642578125, 0.36490631103515625, 0.3936767578125, 0.42244720458984375, 0.4512176513671875, 0.47998809814453125, 0.508758544921875, 0.5375289916992188, 0.5662994384765625, 0.5950698852539062, 0.62384033203125, 0.6526107788085938, 0.6813812255859375, 0.7101516723632812, 0.738922119140625, 0.7676925659179688, 0.7964630126953125, 0.8252334594726562, 0.85400390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 4.0, 8.0, 6.0, 12.0, 6.0, 9.0, 13.0, 14.0, 14.0, 17.0, 22.0, 25.0, 27.0, 30.0, 33.0, 39.0, 53.0, 48.0, 58.0, 62.0, 76.0, 47.0, 55.0, 39.0, 51.0, 39.0, 25.0, 18.0, 16.0, 11.0, 14.0, 16.0, 18.0, 10.0, 12.0, 10.0, 9.0, 7.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.50927734375, -0.49341583251953125, -0.4775543212890625, -0.46169281005859375, -0.445831298828125, -0.42996978759765625, -0.4141082763671875, -0.39824676513671875, -0.38238525390625, -0.36652374267578125, -0.3506622314453125, -0.33480072021484375, -0.318939208984375, -0.30307769775390625, -0.2872161865234375, -0.27135467529296875, -0.2554931640625, -0.23963165283203125, -0.2237701416015625, -0.20790863037109375, -0.192047119140625, -0.17618560791015625, -0.1603240966796875, -0.14446258544921875, -0.12860107421875, -0.11273956298828125, -0.0968780517578125, -0.08101654052734375, -0.065155029296875, -0.04929351806640625, -0.0334320068359375, -0.01757049560546875, -0.001708984375, 0.01415252685546875, 0.0300140380859375, 0.04587554931640625, 0.061737060546875, 0.07759857177734375, 0.0934600830078125, 0.10932159423828125, 0.12518310546875, 0.14104461669921875, 0.1569061279296875, 0.17276763916015625, 0.188629150390625, 0.20449066162109375, 0.2203521728515625, 0.23621368408203125, 0.2520751953125, 0.26793670654296875, 0.2837982177734375, 0.29965972900390625, 0.315521240234375, 0.33138275146484375, 0.3472442626953125, 0.36310577392578125, 0.37896728515625, 0.39482879638671875, 0.4106903076171875, 0.42655181884765625, 0.442413330078125, 0.45827484130859375, 0.4741363525390625, 0.48999786376953125, 0.505859375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 8.0, 8.0, 16.0, 21.0, 24.0, 31.0, 21.0, 35.0, 29.0, 31.0, 35.0, 35.0, 36.0, 44.0, 41.0, 50.0, 42.0, 40.0, 44.0, 50.0, 42.0, 36.0, 37.0, 26.0, 42.0, 27.0, 25.0, 17.0, 18.0, 15.0, 8.0, 15.0, 6.0, 7.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.252750396728516, -30.284765243530273, -29.31678009033203, -28.34879493713379, -27.380809783935547, -26.412822723388672, -25.44483757019043, -24.476852416992188, -23.508867263793945, -22.540882110595703, -21.57289695739746, -20.60491180419922, -19.636924743652344, -18.668941497802734, -17.70095443725586, -16.732969284057617, -15.764984130859375, -14.796998977661133, -13.82901382446289, -12.861027717590332, -11.89304256439209, -10.925057411193848, -9.957071304321289, -8.989086151123047, -8.021100997924805, -7.0531158447265625, -6.085130214691162, -5.117144584655762, -4.1491594314575195, -3.1811742782592773, -2.213188648223877, -1.2452030181884766, -0.2772197723388672, 0.6907656192779541, 1.6587510108947754, 2.6267364025115967, 3.594721794128418, 4.56270694732666, 5.5306925773620605, 6.498678207397461, 7.466663360595703, 8.434648513793945, 9.402633666992188, 10.370619773864746, 11.338604927062988, 12.30659008026123, 13.274576187133789, 14.242561340332031, 15.210546493530273, 16.178531646728516, 17.146516799926758, 18.114501953125, 19.082489013671875, 20.050472259521484, 21.01845932006836, 21.9864444732666, 22.954429626464844, 23.922414779663086, 24.890399932861328, 25.85838508605957, 26.826370239257812, 27.794357299804688, 28.76234245300293, 29.730327606201172, 30.698312759399414]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 8.0, 13.0, 16.0, 17.0, 18.0, 17.0, 21.0, 27.0, 16.0, 17.0, 31.0, 30.0, 28.0, 39.0, 34.0, 39.0, 41.0, 43.0, 44.0, 56.0, 49.0, 38.0, 38.0, 27.0, 29.0, 30.0, 22.0, 31.0, 27.0, 20.0, 28.0, 19.0, 10.0, 15.0, 8.0, 11.0, 4.0, 6.0, 8.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.467607498168945, -28.4381046295166, -27.408601760864258, -26.379098892211914, -25.34959602355957, -24.320093154907227, -23.290592193603516, -22.261089324951172, -21.231586456298828, -20.202083587646484, -19.17258071899414, -18.143077850341797, -17.113574981689453, -16.08407211303711, -15.054570198059082, -14.025067329406738, -12.995563507080078, -11.966060638427734, -10.93655776977539, -9.907054901123047, -8.877552032470703, -7.848049640655518, -6.818547248840332, -5.789044380187988, -4.7595415115356445, -3.730038642883301, -2.700536012649536, -1.6710333824157715, -0.6415305137634277, 0.387972354888916, 1.4174747467041016, 2.4469776153564453, 3.476482391357422, 4.505985260009766, 5.535488128662109, 6.564990520477295, 7.594493389129639, 8.62399673461914, 9.653498649597168, 10.683001518249512, 11.712504386901855, 12.7420072555542, 13.771510124206543, 14.80101203918457, 15.830514907836914, 16.860017776489258, 17.8895206451416, 18.919023513793945, 19.94852638244629, 20.978029251098633, 22.007532119750977, 23.03703498840332, 24.066537857055664, 25.096040725708008, 26.12554168701172, 27.155044555664062, 28.184547424316406, 29.21405029296875, 30.243553161621094, 31.273056030273438, 32.30255889892578, 33.332061767578125, 34.36156463623047, 35.39106750488281, 36.420570373535156]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 7.0, 18.0, 18.0, 31.0, 61.0, 91.0, 126.0, 185.0, 304.0, 489.0, 772.0, 1213.0, 1738.0, 2556.0, 3819.0, 5673.0, 8008.0, 11178.0, 15381.0, 21221.0, 27580.0, 34915.0, 43988.0, 52118.0, 61226.0, 69252.0, 75115.0, 78171.0, 78784.0, 75963.0, 70931.0, 63082.0, 54761.0, 45802.0, 36723.0, 28936.0, 22091.0, 16805.0, 12107.0, 8557.0, 6233.0, 4245.0, 2717.0, 1988.0, 1246.0, 806.0, 577.0, 372.0, 229.0, 131.0, 79.0, 57.0, 36.0, 25.0, 11.0, 7.0, 3.0, 5.0, 1.0, 3.0, 1.0], "bins": [-13.265625, -12.8392333984375, -12.412841796875, -11.9864501953125, -11.56005859375, -11.1336669921875, -10.707275390625, -10.2808837890625, -9.8544921875, -9.4281005859375, -9.001708984375, -8.5753173828125, -8.14892578125, -7.7225341796875, -7.296142578125, -6.8697509765625, -6.443359375, -6.0169677734375, -5.590576171875, -5.1641845703125, -4.73779296875, -4.3114013671875, -3.885009765625, -3.4586181640625, -3.0322265625, -2.6058349609375, -2.179443359375, -1.7530517578125, -1.32666015625, -0.9002685546875, -0.473876953125, -0.0474853515625, 0.37890625, 0.8052978515625, 1.231689453125, 1.6580810546875, 2.08447265625, 2.5108642578125, 2.937255859375, 3.3636474609375, 3.7900390625, 4.2164306640625, 4.642822265625, 5.0692138671875, 5.49560546875, 5.9219970703125, 6.348388671875, 6.7747802734375, 7.201171875, 7.6275634765625, 8.053955078125, 8.4803466796875, 8.90673828125, 9.3331298828125, 9.759521484375, 10.1859130859375, 10.6123046875, 11.0386962890625, 11.465087890625, 11.8914794921875, 12.31787109375, 12.7442626953125, 13.170654296875, 13.5970458984375, 14.0234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 7.0, 11.0, 16.0, 16.0, 19.0, 19.0, 17.0, 27.0, 18.0, 17.0, 28.0, 30.0, 31.0, 35.0, 37.0, 37.0, 42.0, 45.0, 36.0, 65.0, 41.0, 44.0, 38.0, 27.0, 35.0, 29.0, 20.0, 30.0, 29.0, 19.0, 30.0, 20.0, 10.0, 13.0, 8.0, 12.0, 5.0, 6.0, 8.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.0, -27.9921875, -26.984375, -25.9765625, -24.96875, -23.9609375, -22.953125, -21.9453125, -20.9375, -19.9296875, -18.921875, -17.9140625, -16.90625, -15.8984375, -14.890625, -13.8828125, -12.875, -11.8671875, -10.859375, -9.8515625, -8.84375, -7.8359375, -6.828125, -5.8203125, -4.8125, -3.8046875, -2.796875, -1.7890625, -0.78125, 0.2265625, 1.234375, 2.2421875, 3.25, 4.2578125, 5.265625, 6.2734375, 7.28125, 8.2890625, 9.296875, 10.3046875, 11.3125, 12.3203125, 13.328125, 14.3359375, 15.34375, 16.3515625, 17.359375, 18.3671875, 19.375, 20.3828125, 21.390625, 22.3984375, 23.40625, 24.4140625, 25.421875, 26.4296875, 27.4375, 28.4453125, 29.453125, 30.4609375, 31.46875, 32.4765625, 33.484375, 34.4921875, 35.5]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 5.0, 7.0, 10.0, 13.0, 33.0, 46.0, 71.0, 129.0, 217.0, 346.0, 547.0, 817.0, 1324.0, 2123.0, 3238.0, 5088.0, 7508.0, 11011.0, 15864.0, 22176.0, 29870.0, 39317.0, 50295.0, 61151.0, 71063.0, 80059.0, 85549.0, 87526.0, 84743.0, 78554.0, 70192.0, 59557.0, 48064.0, 37718.0, 28675.0, 20590.0, 14575.0, 10411.0, 7059.0, 4683.0, 3082.0, 1952.0, 1251.0, 800.0, 515.0, 295.0, 193.0, 91.0, 76.0, 39.0, 25.0, 12.0, 12.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.6015625, -14.13671875, -13.671875, -13.20703125, -12.7421875, -12.27734375, -11.8125, -11.34765625, -10.8828125, -10.41796875, -9.953125, -9.48828125, -9.0234375, -8.55859375, -8.09375, -7.62890625, -7.1640625, -6.69921875, -6.234375, -5.76953125, -5.3046875, -4.83984375, -4.375, -3.91015625, -3.4453125, -2.98046875, -2.515625, -2.05078125, -1.5859375, -1.12109375, -0.65625, -0.19140625, 0.2734375, 0.73828125, 1.203125, 1.66796875, 2.1328125, 2.59765625, 3.0625, 3.52734375, 3.9921875, 4.45703125, 4.921875, 5.38671875, 5.8515625, 6.31640625, 6.78125, 7.24609375, 7.7109375, 8.17578125, 8.640625, 9.10546875, 9.5703125, 10.03515625, 10.5, 10.96484375, 11.4296875, 11.89453125, 12.359375, 12.82421875, 13.2890625, 13.75390625, 14.21875, 14.68359375, 15.1484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 8.0, 1.0, 4.0, 6.0, 3.0, 8.0, 9.0, 16.0, 16.0, 9.0, 24.0, 22.0, 14.0, 26.0, 26.0, 32.0, 34.0, 37.0, 37.0, 48.0, 39.0, 36.0, 44.0, 33.0, 43.0, 46.0, 32.0, 45.0, 36.0, 32.0, 37.0, 25.0, 27.0, 23.0, 20.0, 25.0, 17.0, 11.0, 6.0, 9.0, 7.0, 7.0, 9.0, 3.0, 3.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.84375, -19.150390625, -18.45703125, -17.763671875, -17.0703125, -16.376953125, -15.68359375, -14.990234375, -14.296875, -13.603515625, -12.91015625, -12.216796875, -11.5234375, -10.830078125, -10.13671875, -9.443359375, -8.75, -8.056640625, -7.36328125, -6.669921875, -5.9765625, -5.283203125, -4.58984375, -3.896484375, -3.203125, -2.509765625, -1.81640625, -1.123046875, -0.4296875, 0.263671875, 0.95703125, 1.650390625, 2.34375, 3.037109375, 3.73046875, 4.423828125, 5.1171875, 5.810546875, 6.50390625, 7.197265625, 7.890625, 8.583984375, 9.27734375, 9.970703125, 10.6640625, 11.357421875, 12.05078125, 12.744140625, 13.4375, 14.130859375, 14.82421875, 15.517578125, 16.2109375, 16.904296875, 17.59765625, 18.291015625, 18.984375, 19.677734375, 20.37109375, 21.064453125, 21.7578125, 22.451171875, 23.14453125, 23.837890625, 24.53125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 3.0, 13.0, 23.0, 51.0, 62.0, 108.0, 168.0, 261.0, 438.0, 677.0, 1120.0, 1820.0, 2877.0, 4600.0, 7022.0, 10785.0, 16128.0, 23429.0, 33271.0, 45359.0, 59183.0, 72651.0, 85820.0, 94886.0, 98597.0, 96456.0, 88686.0, 77044.0, 62990.0, 49193.0, 36326.0, 26099.0, 18069.0, 12363.0, 7934.0, 5198.0, 3253.0, 2095.0, 1307.0, 841.0, 533.0, 316.0, 181.0, 128.0, 71.0, 43.0, 28.0, 22.0, 11.0, 8.0, 3.0, 3.0, 1.0, 3.0], "bins": [-8.2578125, -8.01947021484375, -7.7811279296875, -7.54278564453125, -7.304443359375, -7.06610107421875, -6.8277587890625, -6.58941650390625, -6.35107421875, -6.11273193359375, -5.8743896484375, -5.63604736328125, -5.397705078125, -5.15936279296875, -4.9210205078125, -4.68267822265625, -4.4443359375, -4.20599365234375, -3.9676513671875, -3.72930908203125, -3.490966796875, -3.25262451171875, -3.0142822265625, -2.77593994140625, -2.53759765625, -2.29925537109375, -2.0609130859375, -1.82257080078125, -1.584228515625, -1.34588623046875, -1.1075439453125, -0.86920166015625, -0.630859375, -0.39251708984375, -0.1541748046875, 0.08416748046875, 0.322509765625, 0.56085205078125, 0.7991943359375, 1.03753662109375, 1.27587890625, 1.51422119140625, 1.7525634765625, 1.99090576171875, 2.229248046875, 2.46759033203125, 2.7059326171875, 2.94427490234375, 3.1826171875, 3.42095947265625, 3.6593017578125, 3.89764404296875, 4.135986328125, 4.37432861328125, 4.6126708984375, 4.85101318359375, 5.08935546875, 5.32769775390625, 5.5660400390625, 5.80438232421875, 6.042724609375, 6.28106689453125, 6.5194091796875, 6.75775146484375, 6.99609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 10.0, 16.0, 14.0, 17.0, 17.0, 27.0, 42.0, 41.0, 50.0, 41.0, 46.0, 48.0, 55.0, 65.0, 53.0, 70.0, 62.0, 52.0, 49.0, 49.0, 35.0, 25.0, 29.0, 23.0, 9.0, 10.0, 11.0, 10.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001735687255859375, -0.0016918033361434937, -0.0016479194164276123, -0.001604035496711731, -0.0015601515769958496, -0.0015162676572799683, -0.001472383737564087, -0.0014284998178482056, -0.0013846158981323242, -0.0013407319784164429, -0.0012968480587005615, -0.0012529641389846802, -0.0012090802192687988, -0.0011651962995529175, -0.0011213123798370361, -0.0010774284601211548, -0.0010335445404052734, -0.000989660620689392, -0.0009457767009735107, -0.0009018927812576294, -0.000858008861541748, -0.0008141249418258667, -0.0007702410221099854, -0.000726357102394104, -0.0006824731826782227, -0.0006385892629623413, -0.00059470534324646, -0.0005508214235305786, -0.0005069375038146973, -0.0004630535840988159, -0.00041916966438293457, -0.0003752857446670532, -0.0003314018249511719, -0.00028751790523529053, -0.00024363398551940918, -0.00019975006580352783, -0.00015586614608764648, -0.00011198222637176514, -6.809830665588379e-05, -2.421438694000244e-05, 1.9669532775878906e-05, 6.355345249176025e-05, 0.0001074373722076416, 0.00015132129192352295, 0.0001952052116394043, 0.00023908913135528564, 0.000282973051071167, 0.00032685697078704834, 0.0003707408905029297, 0.00041462481021881104, 0.0004585087299346924, 0.0005023926496505737, 0.0005462765693664551, 0.0005901604890823364, 0.0006340444087982178, 0.0006779283285140991, 0.0007218122482299805, 0.0007656961679458618, 0.0008095800876617432, 0.0008534640073776245, 0.0008973479270935059, 0.0009412318468093872, 0.0009851157665252686, 0.00102899968624115, 0.0010728836059570312]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 9.0, 16.0, 24.0, 18.0, 32.0, 78.0, 115.0, 204.0, 287.0, 489.0, 842.0, 1435.0, 2378.0, 4032.0, 6629.0, 10667.0, 16940.0, 26498.0, 38864.0, 54822.0, 72862.0, 91347.0, 105606.0, 111836.0, 110944.0, 100362.0, 84217.0, 66166.0, 48407.0, 33604.0, 22387.0, 14366.0, 8737.0, 5409.0, 3112.0, 1985.0, 1097.0, 693.0, 395.0, 251.0, 155.0, 87.0, 55.0, 32.0, 20.0, 16.0, 12.0, 4.0, 6.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.25, -8.94970703125, -8.6494140625, -8.34912109375, -8.048828125, -7.74853515625, -7.4482421875, -7.14794921875, -6.84765625, -6.54736328125, -6.2470703125, -5.94677734375, -5.646484375, -5.34619140625, -5.0458984375, -4.74560546875, -4.4453125, -4.14501953125, -3.8447265625, -3.54443359375, -3.244140625, -2.94384765625, -2.6435546875, -2.34326171875, -2.04296875, -1.74267578125, -1.4423828125, -1.14208984375, -0.841796875, -0.54150390625, -0.2412109375, 0.05908203125, 0.359375, 0.65966796875, 0.9599609375, 1.26025390625, 1.560546875, 1.86083984375, 2.1611328125, 2.46142578125, 2.76171875, 3.06201171875, 3.3623046875, 3.66259765625, 3.962890625, 4.26318359375, 4.5634765625, 4.86376953125, 5.1640625, 5.46435546875, 5.7646484375, 6.06494140625, 6.365234375, 6.66552734375, 6.9658203125, 7.26611328125, 7.56640625, 7.86669921875, 8.1669921875, 8.46728515625, 8.767578125, 9.06787109375, 9.3681640625, 9.66845703125, 9.96875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 7.0, 6.0, 7.0, 14.0, 11.0, 21.0, 13.0, 13.0, 27.0, 23.0, 28.0, 24.0, 24.0, 37.0, 36.0, 35.0, 43.0, 46.0, 31.0, 43.0, 65.0, 42.0, 43.0, 31.0, 38.0, 35.0, 31.0, 27.0, 28.0, 19.0, 28.0, 12.0, 21.0, 18.0, 8.0, 8.0, 13.0, 4.0, 9.0, 2.0, 4.0, 5.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0], "bins": [-3.818359375, -3.70050048828125, -3.5826416015625, -3.46478271484375, -3.346923828125, -3.22906494140625, -3.1112060546875, -2.99334716796875, -2.87548828125, -2.75762939453125, -2.6397705078125, -2.52191162109375, -2.404052734375, -2.28619384765625, -2.1683349609375, -2.05047607421875, -1.9326171875, -1.81475830078125, -1.6968994140625, -1.57904052734375, -1.461181640625, -1.34332275390625, -1.2254638671875, -1.10760498046875, -0.98974609375, -0.87188720703125, -0.7540283203125, -0.63616943359375, -0.518310546875, -0.40045166015625, -0.2825927734375, -0.16473388671875, -0.046875, 0.07098388671875, 0.1888427734375, 0.30670166015625, 0.424560546875, 0.54241943359375, 0.6602783203125, 0.77813720703125, 0.89599609375, 1.01385498046875, 1.1317138671875, 1.24957275390625, 1.367431640625, 1.48529052734375, 1.6031494140625, 1.72100830078125, 1.8388671875, 1.95672607421875, 2.0745849609375, 2.19244384765625, 2.310302734375, 2.42816162109375, 2.5460205078125, 2.66387939453125, 2.78173828125, 2.89959716796875, 3.0174560546875, 3.13531494140625, 3.253173828125, 3.37103271484375, 3.4888916015625, 3.60675048828125, 3.724609375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 8.0, 3.0, 9.0, 10.0, 10.0, 12.0, 24.0, 18.0, 16.0, 26.0, 35.0, 25.0, 32.0, 30.0, 49.0, 33.0, 34.0, 34.0, 48.0, 48.0, 41.0, 50.0, 39.0, 49.0, 42.0, 41.0, 37.0, 25.0, 35.0, 19.0, 24.0, 20.0, 12.0, 12.0, 9.0, 14.0, 13.0, 8.0, 3.0, 2.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.63239860534668, -29.672460556030273, -28.712522506713867, -27.75258445739746, -26.792648315429688, -25.83271026611328, -24.872772216796875, -23.91283416748047, -22.952896118164062, -21.992958068847656, -21.03302001953125, -20.073081970214844, -19.113143920898438, -18.15320587158203, -17.193269729614258, -16.23333168029785, -15.273393630981445, -14.313455581665039, -13.353517532348633, -12.393580436706543, -11.433642387390137, -10.47370433807373, -9.51376724243164, -8.553829193115234, -7.593891143798828, -6.633953094482422, -5.674015522003174, -4.714077949523926, -3.7541399002075195, -2.7942018508911133, -1.8342642784118652, -0.8743267059326172, 0.08561134338378906, 1.0455491542816162, 2.0054869651794434, 2.9654247760772705, 3.9253625869750977, 4.885300636291504, 5.845238208770752, 6.80517578125, 7.765113830566406, 8.725051879882812, 9.684989929199219, 10.644927024841309, 11.604865074157715, 12.564803123474121, 13.524740219116211, 14.484678268432617, 15.444616317749023, 16.40455436706543, 17.364492416381836, 18.324430465698242, 19.284366607666016, 20.244304656982422, 21.204242706298828, 22.164180755615234, 23.12411880493164, 24.084056854248047, 25.043994903564453, 26.00393295288086, 26.963871002197266, 27.923809051513672, 28.883745193481445, 29.84368324279785, 30.803621292114258]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 7.0, 7.0, 12.0, 10.0, 19.0, 16.0, 17.0, 31.0, 18.0, 26.0, 25.0, 27.0, 35.0, 31.0, 34.0, 34.0, 47.0, 34.0, 32.0, 44.0, 39.0, 39.0, 47.0, 44.0, 26.0, 41.0, 36.0, 22.0, 23.0, 27.0, 25.0, 18.0, 18.0, 9.0, 10.0, 10.0, 10.0, 9.0, 11.0, 1.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.79273223876953, -32.674896240234375, -31.55706024169922, -30.439224243164062, -29.321388244628906, -28.20355224609375, -27.08571434020996, -25.967878341674805, -24.85004234313965, -23.732206344604492, -22.614370346069336, -21.49653434753418, -20.37869644165039, -19.260860443115234, -18.143024444580078, -17.025188446044922, -15.907352447509766, -14.78951644897461, -13.671680450439453, -12.55384349822998, -11.436007499694824, -10.318171501159668, -9.200334548950195, -8.082498550415039, -6.964662551879883, -5.846826553344727, -4.728990077972412, -3.6111538410186768, -2.4933176040649414, -1.3754816055297852, -0.2576451301574707, 0.8601913452148438, 1.9780235290527344, 3.0958597660064697, 4.213696002960205, 5.3315324783325195, 6.449368476867676, 7.567204475402832, 8.685041427612305, 9.802877426147461, 10.920713424682617, 12.038549423217773, 13.15638542175293, 14.274222373962402, 15.392058372497559, 16.50989532470703, 17.627731323242188, 18.745567321777344, 19.8634033203125, 20.981239318847656, 22.099075317382812, 23.21691131591797, 24.334747314453125, 25.45258331298828, 26.57042121887207, 27.688257217407227, 28.806093215942383, 29.92392921447754, 31.041765213012695, 32.159603118896484, 33.27743911743164, 34.3952751159668, 35.51311111450195, 36.63094711303711, 37.748783111572266]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 9.0, 10.0, 31.0, 37.0, 69.0, 137.0, 199.0, 364.0, 606.0, 1040.0, 1804.0, 3122.0, 5314.0, 8825.0, 14667.0, 23818.0, 37827.0, 59367.0, 90597.0, 132809.0, 189355.0, 254453.0, 325252.0, 387667.0, 429624.0, 439385.0, 415462.0, 364408.0, 295840.0, 227598.0, 164561.0, 113473.0, 76269.0, 49437.0, 31511.0, 19637.0, 12032.0, 7134.0, 4331.0, 2601.0, 1479.0, 931.0, 496.0, 286.0, 156.0, 114.0, 68.0, 38.0, 18.0, 13.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.875, -21.176025390625, -20.47705078125, -19.778076171875, -19.0791015625, -18.380126953125, -17.68115234375, -16.982177734375, -16.283203125, -15.584228515625, -14.88525390625, -14.186279296875, -13.4873046875, -12.788330078125, -12.08935546875, -11.390380859375, -10.69140625, -9.992431640625, -9.29345703125, -8.594482421875, -7.8955078125, -7.196533203125, -6.49755859375, -5.798583984375, -5.099609375, -4.400634765625, -3.70166015625, -3.002685546875, -2.3037109375, -1.604736328125, -0.90576171875, -0.206787109375, 0.4921875, 1.191162109375, 1.89013671875, 2.589111328125, 3.2880859375, 3.987060546875, 4.68603515625, 5.385009765625, 6.083984375, 6.782958984375, 7.48193359375, 8.180908203125, 8.8798828125, 9.578857421875, 10.27783203125, 10.976806640625, 11.67578125, 12.374755859375, 13.07373046875, 13.772705078125, 14.4716796875, 15.170654296875, 15.86962890625, 16.568603515625, 17.267578125, 17.966552734375, 18.66552734375, 19.364501953125, 20.0634765625, 20.762451171875, 21.46142578125, 22.160400390625, 22.859375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 7.0, 12.0, 12.0, 19.0, 18.0, 20.0, 23.0, 20.0, 26.0, 22.0, 28.0, 39.0, 30.0, 35.0, 34.0, 48.0, 29.0, 36.0, 41.0, 38.0, 43.0, 48.0, 38.0, 30.0, 43.0, 32.0, 20.0, 29.0, 25.0, 27.0, 12.0, 22.0, 8.0, 9.0, 10.0, 9.0, 11.0, 10.0, 2.0, 4.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.34375, -31.28173828125, -30.2197265625, -29.15771484375, -28.095703125, -27.03369140625, -25.9716796875, -24.90966796875, -23.84765625, -22.78564453125, -21.7236328125, -20.66162109375, -19.599609375, -18.53759765625, -17.4755859375, -16.41357421875, -15.3515625, -14.28955078125, -13.2275390625, -12.16552734375, -11.103515625, -10.04150390625, -8.9794921875, -7.91748046875, -6.85546875, -5.79345703125, -4.7314453125, -3.66943359375, -2.607421875, -1.54541015625, -0.4833984375, 0.57861328125, 1.640625, 2.70263671875, 3.7646484375, 4.82666015625, 5.888671875, 6.95068359375, 8.0126953125, 9.07470703125, 10.13671875, 11.19873046875, 12.2607421875, 13.32275390625, 14.384765625, 15.44677734375, 16.5087890625, 17.57080078125, 18.6328125, 19.69482421875, 20.7568359375, 21.81884765625, 22.880859375, 23.94287109375, 25.0048828125, 26.06689453125, 27.12890625, 28.19091796875, 29.2529296875, 30.31494140625, 31.376953125, 32.43896484375, 33.5009765625, 34.56298828125, 35.625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 11.0, 24.0, 37.0, 58.0, 105.0, 182.0, 314.0, 576.0, 1061.0, 1796.0, 3141.0, 5255.0, 8995.0, 14810.0, 23542.0, 37715.0, 57690.0, 87580.0, 125035.0, 173995.0, 230552.0, 290179.0, 345954.0, 386996.0, 404723.0, 399495.0, 367766.0, 318629.0, 260263.0, 200640.0, 148161.0, 104890.0, 71260.0, 47225.0, 29624.0, 18448.0, 11273.0, 6827.0, 3992.0, 2247.0, 1417.0, 800.0, 470.0, 231.0, 150.0, 66.0, 39.0, 24.0, 12.0, 10.0, 1.0, 3.0, 0.0, 3.0, 2.0], "bins": [-24.015625, -23.303955078125, -22.59228515625, -21.880615234375, -21.1689453125, -20.457275390625, -19.74560546875, -19.033935546875, -18.322265625, -17.610595703125, -16.89892578125, -16.187255859375, -15.4755859375, -14.763916015625, -14.05224609375, -13.340576171875, -12.62890625, -11.917236328125, -11.20556640625, -10.493896484375, -9.7822265625, -9.070556640625, -8.35888671875, -7.647216796875, -6.935546875, -6.223876953125, -5.51220703125, -4.800537109375, -4.0888671875, -3.377197265625, -2.66552734375, -1.953857421875, -1.2421875, -0.530517578125, 0.18115234375, 0.892822265625, 1.6044921875, 2.316162109375, 3.02783203125, 3.739501953125, 4.451171875, 5.162841796875, 5.87451171875, 6.586181640625, 7.2978515625, 8.009521484375, 8.72119140625, 9.432861328125, 10.14453125, 10.856201171875, 11.56787109375, 12.279541015625, 12.9912109375, 13.702880859375, 14.41455078125, 15.126220703125, 15.837890625, 16.549560546875, 17.26123046875, 17.972900390625, 18.6845703125, 19.396240234375, 20.10791015625, 20.819580078125, 21.53125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 8.0, 9.0, 18.0, 18.0, 24.0, 24.0, 39.0, 40.0, 64.0, 70.0, 71.0, 103.0, 119.0, 132.0, 164.0, 172.0, 184.0, 192.0, 200.0, 205.0, 216.0, 194.0, 229.0, 198.0, 194.0, 168.0, 155.0, 131.0, 126.0, 116.0, 118.0, 88.0, 67.0, 55.0, 47.0, 32.0, 24.0, 13.0, 9.0, 7.0, 9.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.5703125, -14.0916748046875, -13.613037109375, -13.1343994140625, -12.65576171875, -12.1771240234375, -11.698486328125, -11.2198486328125, -10.7412109375, -10.2625732421875, -9.783935546875, -9.3052978515625, -8.82666015625, -8.3480224609375, -7.869384765625, -7.3907470703125, -6.912109375, -6.4334716796875, -5.954833984375, -5.4761962890625, -4.99755859375, -4.5189208984375, -4.040283203125, -3.5616455078125, -3.0830078125, -2.6043701171875, -2.125732421875, -1.6470947265625, -1.16845703125, -0.6898193359375, -0.211181640625, 0.2674560546875, 0.74609375, 1.2247314453125, 1.703369140625, 2.1820068359375, 2.66064453125, 3.1392822265625, 3.617919921875, 4.0965576171875, 4.5751953125, 5.0538330078125, 5.532470703125, 6.0111083984375, 6.48974609375, 6.9683837890625, 7.447021484375, 7.9256591796875, 8.404296875, 8.8829345703125, 9.361572265625, 9.8402099609375, 10.31884765625, 10.7974853515625, 11.276123046875, 11.7547607421875, 12.2333984375, 12.7120361328125, 13.190673828125, 13.6693115234375, 14.14794921875, 14.6265869140625, 15.105224609375, 15.5838623046875, 16.0625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 5.0, 0.0, 8.0, 3.0, 3.0, 6.0, 8.0, 11.0, 9.0, 8.0, 17.0, 15.0, 23.0, 27.0, 27.0, 30.0, 26.0, 27.0, 33.0, 36.0, 29.0, 38.0, 33.0, 46.0, 36.0, 39.0, 27.0, 45.0, 37.0, 29.0, 28.0, 40.0, 31.0, 41.0, 25.0, 18.0, 26.0, 19.0, 15.0, 14.0, 13.0, 10.0, 7.0, 5.0, 7.0, 7.0, 5.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.797842025756836, -24.91282844543457, -24.027814865112305, -23.14280128479004, -22.25778579711914, -21.372772216796875, -20.48775863647461, -19.602745056152344, -18.717731475830078, -17.832717895507812, -16.947704315185547, -16.06269073486328, -15.1776762008667, -14.292662620544434, -13.407648086547852, -12.522634506225586, -11.63762092590332, -10.752607345581055, -9.867593765258789, -8.982579231262207, -8.097565650939941, -7.212552070617676, -6.327538013458252, -5.442523956298828, -4.5575103759765625, -3.6724965572357178, -2.787482738494873, -1.9024689197540283, -1.0174551010131836, -0.13244152069091797, 0.7525725364685059, 1.6375865936279297, 2.5226001739501953, 3.40761399269104, 4.292627811431885, 5.177641868591309, 6.062655448913574, 6.94766902923584, 7.832683086395264, 8.717697143554688, 9.602710723876953, 10.487724304199219, 11.372737884521484, 12.257752418518066, 13.142765998840332, 14.027779579162598, 14.91279411315918, 15.797807693481445, 16.68282127380371, 17.567834854125977, 18.452848434448242, 19.337862014770508, 20.222877502441406, 21.107891082763672, 21.992904663085938, 22.877918243408203, 23.76293182373047, 24.647945404052734, 25.532958984375, 26.417972564697266, 27.30298614501953, 28.187999725341797, 29.073015213012695, 29.95802879333496, 30.843042373657227]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 0.0, 7.0, 8.0, 2.0, 13.0, 14.0, 16.0, 14.0, 21.0, 23.0, 22.0, 20.0, 21.0, 30.0, 29.0, 27.0, 31.0, 38.0, 35.0, 40.0, 40.0, 34.0, 40.0, 45.0, 49.0, 31.0, 33.0, 33.0, 39.0, 36.0, 19.0, 23.0, 29.0, 23.0, 17.0, 21.0, 14.0, 9.0, 10.0, 5.0, 9.0, 3.0, 9.0, 3.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-36.66719055175781, -35.495819091796875, -34.32444763183594, -33.153076171875, -31.981704711914062, -30.810333251953125, -29.63896369934082, -28.467592239379883, -27.296220779418945, -26.124849319458008, -24.95347785949707, -23.782106399536133, -22.610736846923828, -21.43936538696289, -20.267993927001953, -19.096622467041016, -17.925251007080078, -16.75387954711914, -15.582508087158203, -14.411137580871582, -13.239766120910645, -12.068394660949707, -10.897024154663086, -9.725652694702148, -8.554281234741211, -7.382909774780273, -6.211538791656494, -5.040167808532715, -3.8687963485717773, -2.69742488861084, -1.5260539054870605, -0.35468292236328125, 0.8166923522949219, 1.9880635738372803, 3.1594347953796387, 4.330805778503418, 5.5021772384643555, 6.673548698425293, 7.844919681549072, 9.016290664672852, 10.187662124633789, 11.359033584594727, 12.530405044555664, 13.701775550842285, 14.873147010803223, 16.044517517089844, 17.21588897705078, 18.38726043701172, 19.558631896972656, 20.730003356933594, 21.90137481689453, 23.07274627685547, 24.244117736816406, 25.415489196777344, 26.58685874938965, 27.758230209350586, 28.929601669311523, 30.10097312927246, 31.2723445892334, 32.4437141418457, 33.61508560180664, 34.78645706176758, 35.957828521728516, 37.12919998168945, 38.30057144165039]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 0.0, 5.0, 5.0, 5.0, 14.0, 16.0, 41.0, 40.0, 71.0, 94.0, 138.0, 253.0, 330.0, 487.0, 755.0, 1127.0, 1773.0, 2873.0, 4349.0, 6614.0, 9969.0, 15157.0, 22238.0, 32429.0, 45904.0, 62891.0, 81064.0, 99572.0, 112137.0, 113902.0, 105863.0, 88937.0, 70299.0, 52537.0, 37850.0, 26140.0, 17757.0, 11920.0, 7926.0, 5199.0, 3445.0, 2210.0, 1546.0, 946.0, 604.0, 393.0, 229.0, 167.0, 109.0, 81.0, 61.0, 21.0, 26.0, 21.0, 9.0, 7.0, 4.0, 6.0, 1.0, 2.0], "bins": [-5.13671875, -4.9820556640625, -4.827392578125, -4.6727294921875, -4.51806640625, -4.3634033203125, -4.208740234375, -4.0540771484375, -3.8994140625, -3.7447509765625, -3.590087890625, -3.4354248046875, -3.28076171875, -3.1260986328125, -2.971435546875, -2.8167724609375, -2.662109375, -2.5074462890625, -2.352783203125, -2.1981201171875, -2.04345703125, -1.8887939453125, -1.734130859375, -1.5794677734375, -1.4248046875, -1.2701416015625, -1.115478515625, -0.9608154296875, -0.80615234375, -0.6514892578125, -0.496826171875, -0.3421630859375, -0.1875, -0.0328369140625, 0.121826171875, 0.2764892578125, 0.43115234375, 0.5858154296875, 0.740478515625, 0.8951416015625, 1.0498046875, 1.2044677734375, 1.359130859375, 1.5137939453125, 1.66845703125, 1.8231201171875, 1.977783203125, 2.1324462890625, 2.287109375, 2.4417724609375, 2.596435546875, 2.7510986328125, 2.90576171875, 3.0604248046875, 3.215087890625, 3.3697509765625, 3.5244140625, 3.6790771484375, 3.833740234375, 3.9884033203125, 4.14306640625, 4.2977294921875, 4.452392578125, 4.6070556640625, 4.76171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 8.0, 5.0, 11.0, 18.0, 12.0, 15.0, 24.0, 24.0, 17.0, 24.0, 21.0, 32.0, 29.0, 28.0, 33.0, 35.0, 33.0, 41.0, 41.0, 37.0, 34.0, 49.0, 46.0, 31.0, 33.0, 39.0, 31.0, 37.0, 20.0, 19.0, 30.0, 23.0, 18.0, 21.0, 12.0, 9.0, 10.0, 4.0, 9.0, 4.0, 9.0, 3.0, 2.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-36.25, -35.07568359375, -33.9013671875, -32.72705078125, -31.552734375, -30.37841796875, -29.2041015625, -28.02978515625, -26.85546875, -25.68115234375, -24.5068359375, -23.33251953125, -22.158203125, -20.98388671875, -19.8095703125, -18.63525390625, -17.4609375, -16.28662109375, -15.1123046875, -13.93798828125, -12.763671875, -11.58935546875, -10.4150390625, -9.24072265625, -8.06640625, -6.89208984375, -5.7177734375, -4.54345703125, -3.369140625, -2.19482421875, -1.0205078125, 0.15380859375, 1.328125, 2.50244140625, 3.6767578125, 4.85107421875, 6.025390625, 7.19970703125, 8.3740234375, 9.54833984375, 10.72265625, 11.89697265625, 13.0712890625, 14.24560546875, 15.419921875, 16.59423828125, 17.7685546875, 18.94287109375, 20.1171875, 21.29150390625, 22.4658203125, 23.64013671875, 24.814453125, 25.98876953125, 27.1630859375, 28.33740234375, 29.51171875, 30.68603515625, 31.8603515625, 33.03466796875, 34.208984375, 35.38330078125, 36.5576171875, 37.73193359375, 38.90625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 8.0, 10.0, 11.0, 13.0, 22.0, 37.0, 48.0, 74.0, 107.0, 180.0, 252.0, 427.0, 611.0, 894.0, 1379.0, 2106.0, 3141.0, 4581.0, 6923.0, 10538.0, 17267.0, 31898.0, 349669.0, 531194.0, 35647.0, 18471.0, 11203.0, 7299.0, 4875.0, 3263.0, 2130.0, 1436.0, 952.0, 665.0, 420.0, 268.0, 185.0, 119.0, 71.0, 53.0, 41.0, 24.0, 18.0, 12.0, 9.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.015625, -11.640869140625, -11.26611328125, -10.891357421875, -10.5166015625, -10.141845703125, -9.76708984375, -9.392333984375, -9.017578125, -8.642822265625, -8.26806640625, -7.893310546875, -7.5185546875, -7.143798828125, -6.76904296875, -6.394287109375, -6.01953125, -5.644775390625, -5.27001953125, -4.895263671875, -4.5205078125, -4.145751953125, -3.77099609375, -3.396240234375, -3.021484375, -2.646728515625, -2.27197265625, -1.897216796875, -1.5224609375, -1.147705078125, -0.77294921875, -0.398193359375, -0.0234375, 0.351318359375, 0.72607421875, 1.100830078125, 1.4755859375, 1.850341796875, 2.22509765625, 2.599853515625, 2.974609375, 3.349365234375, 3.72412109375, 4.098876953125, 4.4736328125, 4.848388671875, 5.22314453125, 5.597900390625, 5.97265625, 6.347412109375, 6.72216796875, 7.096923828125, 7.4716796875, 7.846435546875, 8.22119140625, 8.595947265625, 8.970703125, 9.345458984375, 9.72021484375, 10.094970703125, 10.4697265625, 10.844482421875, 11.21923828125, 11.593994140625, 11.96875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 7.0, 7.0, 10.0, 11.0, 17.0, 20.0, 18.0, 25.0, 15.0, 27.0, 22.0, 28.0, 31.0, 34.0, 37.0, 38.0, 44.0, 48.0, 55.0, 34.0, 46.0, 33.0, 23.0, 35.0, 33.0, 24.0, 19.0, 39.0, 27.0, 29.0, 25.0, 18.0, 17.0, 19.0, 9.0, 8.0, 12.0, 8.0, 8.0, 9.0, 3.0, 7.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-25.734375, -24.944580078125, -24.15478515625, -23.364990234375, -22.5751953125, -21.785400390625, -20.99560546875, -20.205810546875, -19.416015625, -18.626220703125, -17.83642578125, -17.046630859375, -16.2568359375, -15.467041015625, -14.67724609375, -13.887451171875, -13.09765625, -12.307861328125, -11.51806640625, -10.728271484375, -9.9384765625, -9.148681640625, -8.35888671875, -7.569091796875, -6.779296875, -5.989501953125, -5.19970703125, -4.409912109375, -3.6201171875, -2.830322265625, -2.04052734375, -1.250732421875, -0.4609375, 0.328857421875, 1.11865234375, 1.908447265625, 2.6982421875, 3.488037109375, 4.27783203125, 5.067626953125, 5.857421875, 6.647216796875, 7.43701171875, 8.226806640625, 9.0166015625, 9.806396484375, 10.59619140625, 11.385986328125, 12.17578125, 12.965576171875, 13.75537109375, 14.545166015625, 15.3349609375, 16.124755859375, 16.91455078125, 17.704345703125, 18.494140625, 19.283935546875, 20.07373046875, 20.863525390625, 21.6533203125, 22.443115234375, 23.23291015625, 24.022705078125, 24.8125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 7.0, 11.0, 18.0, 10.0, 34.0, 53.0, 69.0, 99.0, 122.0, 200.0, 304.0, 426.0, 590.0, 966.0, 1405.0, 2178.0, 3287.0, 5240.0, 8033.0, 13060.0, 21221.0, 42021.0, 815539.0, 68973.0, 24390.0, 14453.0, 8983.0, 5782.0, 3758.0, 2491.0, 1621.0, 1008.0, 703.0, 499.0, 305.0, 223.0, 132.0, 119.0, 58.0, 53.0, 30.0, 23.0, 14.0, 15.0, 9.0, 8.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.3173828125, -1.275726318359375, -1.23406982421875, -1.192413330078125, -1.1507568359375, -1.109100341796875, -1.06744384765625, -1.025787353515625, -0.984130859375, -0.942474365234375, -0.90081787109375, -0.859161376953125, -0.8175048828125, -0.775848388671875, -0.73419189453125, -0.692535400390625, -0.65087890625, -0.609222412109375, -0.56756591796875, -0.525909423828125, -0.4842529296875, -0.442596435546875, -0.40093994140625, -0.359283447265625, -0.317626953125, -0.275970458984375, -0.23431396484375, -0.192657470703125, -0.1510009765625, -0.109344482421875, -0.06768798828125, -0.026031494140625, 0.015625, 0.057281494140625, 0.09893798828125, 0.140594482421875, 0.1822509765625, 0.223907470703125, 0.26556396484375, 0.307220458984375, 0.348876953125, 0.390533447265625, 0.43218994140625, 0.473846435546875, 0.5155029296875, 0.557159423828125, 0.59881591796875, 0.640472412109375, 0.68212890625, 0.723785400390625, 0.76544189453125, 0.807098388671875, 0.8487548828125, 0.890411376953125, 0.93206787109375, 0.973724365234375, 1.015380859375, 1.057037353515625, 1.09869384765625, 1.140350341796875, 1.1820068359375, 1.223663330078125, 1.26531982421875, 1.306976318359375, 1.3486328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 6.0, 4.0, 8.0, 18.0, 22.0, 15.0, 27.0, 19.0, 27.0, 33.0, 34.0, 36.0, 37.0, 42.0, 50.0, 42.0, 51.0, 50.0, 57.0, 48.0, 47.0, 45.0, 41.0, 39.0, 31.0, 25.0, 25.0, 18.0, 19.0, 11.0, 15.0, 13.0, 7.0, 5.0, 5.0, 3.0, 7.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.3974647521972656e-05, -3.2806769013404846e-05, -3.1638890504837036e-05, -3.0471011996269226e-05, -2.9303133487701416e-05, -2.8135254979133606e-05, -2.6967376470565796e-05, -2.5799497961997986e-05, -2.4631619453430176e-05, -2.3463740944862366e-05, -2.2295862436294556e-05, -2.1127983927726746e-05, -1.9960105419158936e-05, -1.8792226910591125e-05, -1.7624348402023315e-05, -1.6456469893455505e-05, -1.5288591384887695e-05, -1.4120712876319885e-05, -1.2952834367752075e-05, -1.1784955859184265e-05, -1.0617077350616455e-05, -9.449198842048645e-06, -8.281320333480835e-06, -7.113441824913025e-06, -5.945563316345215e-06, -4.777684807777405e-06, -3.6098062992095947e-06, -2.4419277906417847e-06, -1.2740492820739746e-06, -1.0617077350616455e-07, 1.0617077350616455e-06, 2.2295862436294556e-06, 3.3974647521972656e-06, 4.565343260765076e-06, 5.733221769332886e-06, 6.901100277900696e-06, 8.068978786468506e-06, 9.236857295036316e-06, 1.0404735803604126e-05, 1.1572614312171936e-05, 1.2740492820739746e-05, 1.3908371329307556e-05, 1.5076249837875366e-05, 1.6244128346443176e-05, 1.7412006855010986e-05, 1.8579885363578796e-05, 1.9747763872146606e-05, 2.0915642380714417e-05, 2.2083520889282227e-05, 2.3251399397850037e-05, 2.4419277906417847e-05, 2.5587156414985657e-05, 2.6755034923553467e-05, 2.7922913432121277e-05, 2.9090791940689087e-05, 3.0258670449256897e-05, 3.142654895782471e-05, 3.259442746639252e-05, 3.376230597496033e-05, 3.493018448352814e-05, 3.609806299209595e-05, 3.726594150066376e-05, 3.843382000923157e-05, 3.960169851779938e-05, 4.076957702636719e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 7.0, 15.0, 19.0, 21.0, 38.0, 41.0, 80.0, 134.0, 186.0, 273.0, 500.0, 761.0, 1225.0, 1890.0, 3031.0, 4918.0, 7948.0, 12708.0, 20517.0, 32718.0, 51681.0, 80511.0, 120105.0, 158630.0, 165815.0, 132660.0, 91659.0, 59432.0, 37994.0, 23710.0, 14902.0, 9203.0, 5657.0, 3498.0, 2276.0, 1391.0, 841.0, 558.0, 366.0, 211.0, 144.0, 105.0, 56.0, 53.0, 25.0, 19.0, 8.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-1.2998046875, -1.261749267578125, -1.22369384765625, -1.185638427734375, -1.1475830078125, -1.109527587890625, -1.07147216796875, -1.033416748046875, -0.995361328125, -0.957305908203125, -0.91925048828125, -0.881195068359375, -0.8431396484375, -0.805084228515625, -0.76702880859375, -0.728973388671875, -0.69091796875, -0.652862548828125, -0.61480712890625, -0.576751708984375, -0.5386962890625, -0.500640869140625, -0.46258544921875, -0.424530029296875, -0.386474609375, -0.348419189453125, -0.31036376953125, -0.272308349609375, -0.2342529296875, -0.196197509765625, -0.15814208984375, -0.120086669921875, -0.08203125, -0.043975830078125, -0.00592041015625, 0.032135009765625, 0.0701904296875, 0.108245849609375, 0.14630126953125, 0.184356689453125, 0.222412109375, 0.260467529296875, 0.29852294921875, 0.336578369140625, 0.3746337890625, 0.412689208984375, 0.45074462890625, 0.488800048828125, 0.52685546875, 0.564910888671875, 0.60296630859375, 0.641021728515625, 0.6790771484375, 0.717132568359375, 0.75518798828125, 0.793243408203125, 0.831298828125, 0.869354248046875, 0.90740966796875, 0.945465087890625, 0.9835205078125, 1.021575927734375, 1.05963134765625, 1.097686767578125, 1.1357421875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 2.0, 4.0, 4.0, 5.0, 6.0, 6.0, 9.0, 8.0, 13.0, 20.0, 23.0, 31.0, 42.0, 50.0, 62.0, 67.0, 68.0, 71.0, 65.0, 86.0, 47.0, 54.0, 44.0, 41.0, 34.0, 24.0, 15.0, 28.0, 14.0, 9.0, 13.0, 7.0, 5.0, 3.0, 7.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55859375, -0.537811279296875, -0.51702880859375, -0.496246337890625, -0.4754638671875, -0.454681396484375, -0.43389892578125, -0.413116455078125, -0.392333984375, -0.371551513671875, -0.35076904296875, -0.329986572265625, -0.3092041015625, -0.288421630859375, -0.26763916015625, -0.246856689453125, -0.22607421875, -0.205291748046875, -0.18450927734375, -0.163726806640625, -0.1429443359375, -0.122161865234375, -0.10137939453125, -0.080596923828125, -0.059814453125, -0.039031982421875, -0.01824951171875, 0.002532958984375, 0.0233154296875, 0.044097900390625, 0.06488037109375, 0.085662841796875, 0.1064453125, 0.127227783203125, 0.14801025390625, 0.168792724609375, 0.1895751953125, 0.210357666015625, 0.23114013671875, 0.251922607421875, 0.272705078125, 0.293487548828125, 0.31427001953125, 0.335052490234375, 0.3558349609375, 0.376617431640625, 0.39739990234375, 0.418182373046875, 0.43896484375, 0.459747314453125, 0.48052978515625, 0.501312255859375, 0.5220947265625, 0.542877197265625, 0.56365966796875, 0.584442138671875, 0.605224609375, 0.626007080078125, 0.64678955078125, 0.667572021484375, 0.6883544921875, 0.709136962890625, 0.72991943359375, 0.750701904296875, 0.771484375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 4.0, 6.0, 2.0, 7.0, 3.0, 6.0, 10.0, 11.0, 17.0, 14.0, 16.0, 30.0, 20.0, 34.0, 27.0, 28.0, 32.0, 27.0, 35.0, 44.0, 29.0, 41.0, 37.0, 39.0, 37.0, 36.0, 38.0, 36.0, 34.0, 34.0, 30.0, 38.0, 34.0, 23.0, 24.0, 17.0, 15.0, 20.0, 10.0, 7.0, 7.0, 6.0, 13.0, 5.0, 8.0, 2.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.750097274780273, -25.847896575927734, -24.945693969726562, -24.04349136352539, -23.14129066467285, -22.239089965820312, -21.33688735961914, -20.43468475341797, -19.53248405456543, -18.63028335571289, -17.72808074951172, -16.825878143310547, -15.923677444458008, -15.021475791931152, -14.119274139404297, -13.217072486877441, -12.314870834350586, -11.41266918182373, -10.510467529296875, -9.60826587677002, -8.706064224243164, -7.803862571716309, -6.901660919189453, -5.999459266662598, -5.097257614135742, -4.195055961608887, -3.2928543090820312, -2.390652656555176, -1.4884510040283203, -0.5862493515014648, 0.3159523010253906, 1.218153953552246, 2.1203575134277344, 3.02255916595459, 3.9247608184814453, 4.826962471008301, 5.729164123535156, 6.631365776062012, 7.533567428588867, 8.435769081115723, 9.337970733642578, 10.240172386169434, 11.142374038696289, 12.044575691223145, 12.94677734375, 13.848978996276855, 14.751180648803711, 15.653382301330566, 16.555583953857422, 17.457786560058594, 18.359987258911133, 19.262187957763672, 20.164390563964844, 21.066593170166016, 21.968793869018555, 22.870994567871094, 23.773197174072266, 24.675399780273438, 25.577600479125977, 26.479801177978516, 27.382003784179688, 28.28420639038086, 29.1864070892334, 30.088607788085938, 30.99081039428711]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 1.0, 6.0, 8.0, 2.0, 13.0, 17.0, 13.0, 14.0, 23.0, 23.0, 20.0, 21.0, 22.0, 31.0, 29.0, 26.0, 34.0, 37.0, 35.0, 38.0, 42.0, 36.0, 41.0, 49.0, 40.0, 34.0, 36.0, 34.0, 34.0, 33.0, 20.0, 23.0, 33.0, 18.0, 24.0, 16.0, 12.0, 9.0, 11.0, 5.0, 8.0, 4.0, 9.0, 2.0, 2.0, 8.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-36.592384338378906, -35.40847396850586, -34.22455978393555, -33.0406494140625, -31.856739044189453, -30.672826766967773, -29.488914489746094, -28.305004119873047, -27.121091842651367, -25.937179565429688, -24.75326919555664, -23.56935691833496, -22.38544464111328, -21.201534271240234, -20.017621994018555, -18.833709716796875, -17.649799346923828, -16.46588706970215, -15.281976699829102, -14.098064422607422, -12.914153099060059, -11.730241775512695, -10.546329498291016, -9.362418174743652, -8.178506851196289, -6.994595527648926, -5.810683727264404, -4.626771926879883, -3.4428606033325195, -2.2589492797851562, -1.0750374794006348, 0.10887432098388672, 1.2927818298339844, 2.4766933917999268, 3.660604953765869, 4.844516754150391, 6.028428077697754, 7.212339401245117, 8.396251678466797, 9.58016300201416, 10.764074325561523, 11.947985649108887, 13.13189697265625, 14.31580924987793, 15.499720573425293, 16.683631896972656, 17.867544174194336, 19.051456451416016, 20.235366821289062, 21.419279098510742, 22.60318946838379, 23.78710174560547, 24.971012115478516, 26.154924392700195, 27.338836669921875, 28.522747039794922, 29.7066593170166, 30.89057159423828, 32.07448196411133, 33.258392333984375, 34.44230651855469, 35.626216888427734, 36.81012725830078, 37.994041442871094, 39.17795181274414]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 20.0, 12.0, 34.0, 49.0, 67.0, 121.0, 158.0, 250.0, 416.0, 632.0, 1026.0, 1536.0, 2295.0, 3624.0, 5300.0, 8016.0, 11692.0, 16834.0, 23720.0, 31866.0, 41574.0, 53282.0, 64967.0, 76181.0, 84158.0, 89399.0, 89227.0, 85669.0, 77192.0, 66871.0, 55094.0, 43665.0, 33322.0, 24825.0, 17670.0, 12428.0, 8635.0, 5728.0, 3858.0, 2509.0, 1660.0, 1046.0, 656.0, 482.0, 267.0, 185.0, 151.0, 79.0, 38.0, 25.0, 23.0, 13.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-16.125, -15.606201171875, -15.08740234375, -14.568603515625, -14.0498046875, -13.531005859375, -13.01220703125, -12.493408203125, -11.974609375, -11.455810546875, -10.93701171875, -10.418212890625, -9.8994140625, -9.380615234375, -8.86181640625, -8.343017578125, -7.82421875, -7.305419921875, -6.78662109375, -6.267822265625, -5.7490234375, -5.230224609375, -4.71142578125, -4.192626953125, -3.673828125, -3.155029296875, -2.63623046875, -2.117431640625, -1.5986328125, -1.079833984375, -0.56103515625, -0.042236328125, 0.4765625, 0.995361328125, 1.51416015625, 2.032958984375, 2.5517578125, 3.070556640625, 3.58935546875, 4.108154296875, 4.626953125, 5.145751953125, 5.66455078125, 6.183349609375, 6.7021484375, 7.220947265625, 7.73974609375, 8.258544921875, 8.77734375, 9.296142578125, 9.81494140625, 10.333740234375, 10.8525390625, 11.371337890625, 11.89013671875, 12.408935546875, 12.927734375, 13.446533203125, 13.96533203125, 14.484130859375, 15.0029296875, 15.521728515625, 16.04052734375, 16.559326171875, 17.078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 7.0, 5.0, 10.0, 19.0, 14.0, 14.0, 23.0, 23.0, 18.0, 22.0, 27.0, 31.0, 28.0, 27.0, 33.0, 38.0, 32.0, 40.0, 44.0, 33.0, 44.0, 44.0, 40.0, 35.0, 37.0, 36.0, 30.0, 34.0, 20.0, 22.0, 30.0, 19.0, 24.0, 16.0, 11.0, 9.0, 10.0, 5.0, 10.0, 2.0, 9.0, 2.0, 2.0, 9.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-35.875, -34.708984375, -33.54296875, -32.376953125, -31.2109375, -30.044921875, -28.87890625, -27.712890625, -26.546875, -25.380859375, -24.21484375, -23.048828125, -21.8828125, -20.716796875, -19.55078125, -18.384765625, -17.21875, -16.052734375, -14.88671875, -13.720703125, -12.5546875, -11.388671875, -10.22265625, -9.056640625, -7.890625, -6.724609375, -5.55859375, -4.392578125, -3.2265625, -2.060546875, -0.89453125, 0.271484375, 1.4375, 2.603515625, 3.76953125, 4.935546875, 6.1015625, 7.267578125, 8.43359375, 9.599609375, 10.765625, 11.931640625, 13.09765625, 14.263671875, 15.4296875, 16.595703125, 17.76171875, 18.927734375, 20.09375, 21.259765625, 22.42578125, 23.591796875, 24.7578125, 25.923828125, 27.08984375, 28.255859375, 29.421875, 30.587890625, 31.75390625, 32.919921875, 34.0859375, 35.251953125, 36.41796875, 37.583984375, 38.75]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 12.0, 32.0, 47.0, 55.0, 73.0, 145.0, 208.0, 376.0, 585.0, 926.0, 1513.0, 2426.0, 3733.0, 5890.0, 9137.0, 14058.0, 20517.0, 30524.0, 43245.0, 58414.0, 75248.0, 90907.0, 102497.0, 106880.0, 104152.0, 93707.0, 78302.0, 61802.0, 45760.0, 32732.0, 22628.0, 15059.0, 9726.0, 6386.0, 4022.0, 2551.0, 1542.0, 1007.0, 642.0, 406.0, 229.0, 177.0, 98.0, 67.0, 33.0, 25.0, 15.0, 13.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-22.75, -22.052001953125, -21.35400390625, -20.656005859375, -19.9580078125, -19.260009765625, -18.56201171875, -17.864013671875, -17.166015625, -16.468017578125, -15.77001953125, -15.072021484375, -14.3740234375, -13.676025390625, -12.97802734375, -12.280029296875, -11.58203125, -10.884033203125, -10.18603515625, -9.488037109375, -8.7900390625, -8.092041015625, -7.39404296875, -6.696044921875, -5.998046875, -5.300048828125, -4.60205078125, -3.904052734375, -3.2060546875, -2.508056640625, -1.81005859375, -1.112060546875, -0.4140625, 0.283935546875, 0.98193359375, 1.679931640625, 2.3779296875, 3.075927734375, 3.77392578125, 4.471923828125, 5.169921875, 5.867919921875, 6.56591796875, 7.263916015625, 7.9619140625, 8.659912109375, 9.35791015625, 10.055908203125, 10.75390625, 11.451904296875, 12.14990234375, 12.847900390625, 13.5458984375, 14.243896484375, 14.94189453125, 15.639892578125, 16.337890625, 17.035888671875, 17.73388671875, 18.431884765625, 19.1298828125, 19.827880859375, 20.52587890625, 21.223876953125, 21.921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 5.0, 13.0, 10.0, 10.0, 16.0, 18.0, 21.0, 20.0, 23.0, 42.0, 33.0, 35.0, 41.0, 40.0, 42.0, 49.0, 44.0, 35.0, 50.0, 35.0, 52.0, 51.0, 47.0, 39.0, 30.0, 29.0, 24.0, 19.0, 18.0, 20.0, 16.0, 21.0, 10.0, 13.0, 7.0, 7.0, 5.0, 1.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.546875, -28.582763671875, -27.61865234375, -26.654541015625, -25.6904296875, -24.726318359375, -23.76220703125, -22.798095703125, -21.833984375, -20.869873046875, -19.90576171875, -18.941650390625, -17.9775390625, -17.013427734375, -16.04931640625, -15.085205078125, -14.12109375, -13.156982421875, -12.19287109375, -11.228759765625, -10.2646484375, -9.300537109375, -8.33642578125, -7.372314453125, -6.408203125, -5.444091796875, -4.47998046875, -3.515869140625, -2.5517578125, -1.587646484375, -0.62353515625, 0.340576171875, 1.3046875, 2.268798828125, 3.23291015625, 4.197021484375, 5.1611328125, 6.125244140625, 7.08935546875, 8.053466796875, 9.017578125, 9.981689453125, 10.94580078125, 11.909912109375, 12.8740234375, 13.838134765625, 14.80224609375, 15.766357421875, 16.73046875, 17.694580078125, 18.65869140625, 19.622802734375, 20.5869140625, 21.551025390625, 22.51513671875, 23.479248046875, 24.443359375, 25.407470703125, 26.37158203125, 27.335693359375, 28.2998046875, 29.263916015625, 30.22802734375, 31.192138671875, 32.15625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 22.0, 35.0, 60.0, 60.0, 119.0, 207.0, 297.0, 508.0, 900.0, 1329.0, 2223.0, 3549.0, 5505.0, 8760.0, 13238.0, 20186.0, 28743.0, 40052.0, 54061.0, 68936.0, 83114.0, 94313.0, 100846.0, 100802.0, 94252.0, 82835.0, 67980.0, 52988.0, 39331.0, 27861.0, 19540.0, 13029.0, 8408.0, 5372.0, 3455.0, 2105.0, 1336.0, 857.0, 494.0, 347.0, 198.0, 120.0, 69.0, 39.0, 32.0, 18.0, 9.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.0, -6.76641845703125, -6.5328369140625, -6.29925537109375, -6.065673828125, -5.83209228515625, -5.5985107421875, -5.36492919921875, -5.13134765625, -4.89776611328125, -4.6641845703125, -4.43060302734375, -4.197021484375, -3.96343994140625, -3.7298583984375, -3.49627685546875, -3.2626953125, -3.02911376953125, -2.7955322265625, -2.56195068359375, -2.328369140625, -2.09478759765625, -1.8612060546875, -1.62762451171875, -1.39404296875, -1.16046142578125, -0.9268798828125, -0.69329833984375, -0.459716796875, -0.22613525390625, 0.0074462890625, 0.24102783203125, 0.474609375, 0.70819091796875, 0.9417724609375, 1.17535400390625, 1.408935546875, 1.64251708984375, 1.8760986328125, 2.10968017578125, 2.34326171875, 2.57684326171875, 2.8104248046875, 3.04400634765625, 3.277587890625, 3.51116943359375, 3.7447509765625, 3.97833251953125, 4.2119140625, 4.44549560546875, 4.6790771484375, 4.91265869140625, 5.146240234375, 5.37982177734375, 5.6134033203125, 5.84698486328125, 6.08056640625, 6.31414794921875, 6.5477294921875, 6.78131103515625, 7.014892578125, 7.24847412109375, 7.4820556640625, 7.71563720703125, 7.94921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 6.0, 7.0, 7.0, 13.0, 13.0, 10.0, 14.0, 15.0, 24.0, 28.0, 23.0, 30.0, 43.0, 35.0, 35.0, 44.0, 50.0, 58.0, 51.0, 46.0, 49.0, 45.0, 49.0, 46.0, 48.0, 27.0, 18.0, 24.0, 40.0, 15.0, 23.0, 18.0, 10.0, 6.0, 4.0, 5.0, 2.0, 6.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.0011224746704101562, -0.001089334487915039, -0.0010561943054199219, -0.0010230541229248047, -0.0009899139404296875, -0.0009567737579345703, -0.0009236335754394531, -0.0008904933929443359, -0.0008573532104492188, -0.0008242130279541016, -0.0007910728454589844, -0.0007579326629638672, -0.00072479248046875, -0.0006916522979736328, -0.0006585121154785156, -0.0006253719329833984, -0.0005922317504882812, -0.0005590915679931641, -0.0005259513854980469, -0.0004928112030029297, -0.0004596710205078125, -0.0004265308380126953, -0.0003933906555175781, -0.00036025047302246094, -0.00032711029052734375, -0.00029397010803222656, -0.0002608299255371094, -0.0002276897430419922, -0.000194549560546875, -0.0001614093780517578, -0.00012826919555664062, -9.512901306152344e-05, -6.198883056640625e-05, -2.8848648071289062e-05, 4.291534423828125e-06, 3.743171691894531e-05, 7.05718994140625e-05, 0.00010371208190917969, 0.00013685226440429688, 0.00016999244689941406, 0.00020313262939453125, 0.00023627281188964844, 0.0002694129943847656, 0.0003025531768798828, 0.000335693359375, 0.0003688335418701172, 0.0004019737243652344, 0.00043511390686035156, 0.00046825408935546875, 0.0005013942718505859, 0.0005345344543457031, 0.0005676746368408203, 0.0006008148193359375, 0.0006339550018310547, 0.0006670951843261719, 0.0007002353668212891, 0.0007333755493164062, 0.0007665157318115234, 0.0007996559143066406, 0.0008327960968017578, 0.000865936279296875, 0.0008990764617919922, 0.0009322166442871094, 0.0009653568267822266, 0.0009984970092773438]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 8.0, 16.0, 16.0, 41.0, 60.0, 83.0, 161.0, 278.0, 484.0, 822.0, 1294.0, 1955.0, 3088.0, 4748.0, 7143.0, 10640.0, 15368.0, 21883.0, 29552.0, 38852.0, 50424.0, 61257.0, 71746.0, 80893.0, 86499.0, 88318.0, 85892.0, 79778.0, 70101.0, 59040.0, 48083.0, 37695.0, 28624.0, 20581.0, 14310.0, 10063.0, 6689.0, 4381.0, 2923.0, 1818.0, 1167.0, 755.0, 405.0, 255.0, 146.0, 81.0, 64.0, 30.0, 18.0, 12.0, 5.0, 9.0, 4.0, 2.0, 2.0, 1.0], "bins": [-7.08984375, -6.877685546875, -6.66552734375, -6.453369140625, -6.2412109375, -6.029052734375, -5.81689453125, -5.604736328125, -5.392578125, -5.180419921875, -4.96826171875, -4.756103515625, -4.5439453125, -4.331787109375, -4.11962890625, -3.907470703125, -3.6953125, -3.483154296875, -3.27099609375, -3.058837890625, -2.8466796875, -2.634521484375, -2.42236328125, -2.210205078125, -1.998046875, -1.785888671875, -1.57373046875, -1.361572265625, -1.1494140625, -0.937255859375, -0.72509765625, -0.512939453125, -0.30078125, -0.088623046875, 0.12353515625, 0.335693359375, 0.5478515625, 0.760009765625, 0.97216796875, 1.184326171875, 1.396484375, 1.608642578125, 1.82080078125, 2.032958984375, 2.2451171875, 2.457275390625, 2.66943359375, 2.881591796875, 3.09375, 3.305908203125, 3.51806640625, 3.730224609375, 3.9423828125, 4.154541015625, 4.36669921875, 4.578857421875, 4.791015625, 5.003173828125, 5.21533203125, 5.427490234375, 5.6396484375, 5.851806640625, 6.06396484375, 6.276123046875, 6.48828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 8.0, 10.0, 7.0, 15.0, 8.0, 10.0, 19.0, 22.0, 16.0, 24.0, 32.0, 20.0, 32.0, 33.0, 33.0, 35.0, 35.0, 30.0, 36.0, 42.0, 32.0, 35.0, 41.0, 43.0, 39.0, 32.0, 30.0, 31.0, 32.0, 29.0, 16.0, 24.0, 18.0, 17.0, 11.0, 17.0, 19.0, 11.0, 10.0, 10.0, 12.0, 6.0, 3.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.5234375, -3.4136962890625, -3.303955078125, -3.1942138671875, -3.08447265625, -2.9747314453125, -2.864990234375, -2.7552490234375, -2.6455078125, -2.5357666015625, -2.426025390625, -2.3162841796875, -2.20654296875, -2.0968017578125, -1.987060546875, -1.8773193359375, -1.767578125, -1.6578369140625, -1.548095703125, -1.4383544921875, -1.32861328125, -1.2188720703125, -1.109130859375, -0.9993896484375, -0.8896484375, -0.7799072265625, -0.670166015625, -0.5604248046875, -0.45068359375, -0.3409423828125, -0.231201171875, -0.1214599609375, -0.01171875, 0.0980224609375, 0.207763671875, 0.3175048828125, 0.42724609375, 0.5369873046875, 0.646728515625, 0.7564697265625, 0.8662109375, 0.9759521484375, 1.085693359375, 1.1954345703125, 1.30517578125, 1.4149169921875, 1.524658203125, 1.6343994140625, 1.744140625, 1.8538818359375, 1.963623046875, 2.0733642578125, 2.18310546875, 2.2928466796875, 2.402587890625, 2.5123291015625, 2.6220703125, 2.7318115234375, 2.841552734375, 2.9512939453125, 3.06103515625, 3.1707763671875, 3.280517578125, 3.3902587890625, 3.5]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 7.0, 1.0, 1.0, 5.0, 8.0, 4.0, 9.0, 10.0, 13.0, 23.0, 16.0, 20.0, 29.0, 29.0, 35.0, 24.0, 37.0, 29.0, 39.0, 43.0, 42.0, 31.0, 32.0, 31.0, 39.0, 42.0, 34.0, 44.0, 38.0, 37.0, 39.0, 19.0, 29.0, 25.0, 16.0, 29.0, 15.0, 17.0, 10.0, 10.0, 11.0, 6.0, 6.0, 10.0, 3.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-29.699382781982422, -28.756195068359375, -27.813005447387695, -26.86981773376465, -25.9266300201416, -24.983440399169922, -24.040252685546875, -23.097064971923828, -22.15387725830078, -21.210689544677734, -20.267499923706055, -19.324312210083008, -18.38112449645996, -17.43793487548828, -16.494747161865234, -15.551559448242188, -14.608369827270508, -13.665181159973145, -12.721993446350098, -11.778804779052734, -10.835617065429688, -9.892428398132324, -8.949239730834961, -8.006052017211914, -7.062863349914551, -6.119675159454346, -5.176486968994141, -4.233298301696777, -3.2901101112365723, -2.346921920776367, -1.403733253479004, -0.46054506301879883, 0.48264122009277344, 1.425829529762268, 2.3690178394317627, 3.312206268310547, 4.255394458770752, 5.198582649230957, 6.14177131652832, 7.084959506988525, 8.02814769744873, 8.971336364746094, 9.91452407836914, 10.857712745666504, 11.800901412963867, 12.744089126586914, 13.687277793884277, 14.63046646118164, 15.573654174804688, 16.516841888427734, 17.460031509399414, 18.40321922302246, 19.346406936645508, 20.289596557617188, 21.232784271240234, 22.17597198486328, 23.119159698486328, 24.062347412109375, 25.005537033081055, 25.9487247467041, 26.89191246032715, 27.835102081298828, 28.778289794921875, 29.721477508544922, 30.6646671295166]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 1.0, 3.0, 3.0, 2.0, 2.0, 13.0, 12.0, 12.0, 18.0, 18.0, 27.0, 21.0, 16.0, 25.0, 26.0, 24.0, 53.0, 38.0, 38.0, 46.0, 38.0, 39.0, 33.0, 41.0, 31.0, 29.0, 44.0, 34.0, 41.0, 32.0, 29.0, 29.0, 22.0, 21.0, 20.0, 22.0, 13.0, 13.0, 14.0, 12.0, 9.0, 11.0, 4.0, 10.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-48.507598876953125, -47.037899017333984, -45.56820297241211, -44.09850311279297, -42.62880325317383, -41.15910339355469, -39.68940734863281, -38.21970748901367, -36.75000762939453, -35.28030776977539, -33.810611724853516, -32.340911865234375, -30.871212005615234, -29.401514053344727, -27.93181610107422, -26.462116241455078, -24.992420196533203, -23.522722244262695, -22.053022384643555, -20.583324432373047, -19.113624572753906, -17.6439266204834, -16.17422866821289, -14.704529762268066, -13.234830856323242, -11.765131950378418, -10.295433044433594, -8.825735092163086, -7.356036186218262, -5.8863372802734375, -4.41663932800293, -2.9469404220581055, -1.4772377014160156, -0.007539033889770508, 1.4621596336364746, 2.9318580627441406, 4.401556968688965, 5.871255874633789, 7.340953826904297, 8.810652732849121, 10.280351638793945, 11.75005054473877, 13.219749450683594, 14.689447402954102, 16.15914535522461, 17.62884521484375, 19.098543167114258, 20.568241119384766, 22.037940979003906, 23.507638931274414, 24.977338790893555, 26.447036743164062, 27.916736602783203, 29.38643455505371, 30.85613250732422, 32.32583236694336, 33.7955322265625, 35.26523208618164, 36.734928131103516, 38.204627990722656, 39.6743278503418, 41.14402770996094, 42.61372375488281, 44.08342361450195, 45.55311965942383]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 10.0, 13.0, 18.0, 23.0, 27.0, 40.0, 55.0, 84.0, 112.0, 113.0, 156.0, 234.0, 312.0, 396.0, 501.0, 668.0, 925.0, 1101.0, 1478.0, 1953.0, 2512.0, 3283.0, 4769.0, 6644.0, 998793.0, 6936.0, 4849.0, 3538.0, 2551.0, 1979.0, 1495.0, 1171.0, 906.0, 758.0, 550.0, 425.0, 300.0, 235.0, 161.0, 145.0, 113.0, 83.0, 47.0, 39.0, 30.0, 24.0, 13.0, 18.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-253.26527404785156, -245.48699951171875, -237.708740234375, -229.9304656982422, -222.15219116210938, -214.37393188476562, -206.5956573486328, -198.8173828125, -191.03912353515625, -183.26084899902344, -175.4825897216797, -167.70431518554688, -159.92605590820312, -152.1477813720703, -144.3695068359375, -136.59124755859375, -128.81297302246094, -121.03470611572266, -113.25643920898438, -105.47816467285156, -97.69989776611328, -89.921630859375, -82.14335632324219, -74.3650894165039, -66.58682250976562, -58.808555603027344, -51.0302848815918, -43.25201416015625, -35.47374725341797, -27.695480346679688, -19.91720962524414, -12.138938903808594, -4.360687255859375, 3.417581558227539, 11.195850372314453, 18.974119186401367, 26.75238800048828, 34.53065490722656, 42.30892562866211, 50.087196350097656, 57.86546325683594, 65.64373016357422, 73.4219970703125, 81.20027160644531, 88.9785385131836, 96.75680541992188, 104.53507995605469, 112.31334686279297, 120.09161376953125, 127.86988067626953, 135.6481475830078, 143.42642211914062, 151.20468139648438, 158.9829559326172, 166.76123046875, 174.53948974609375, 182.31776428222656, 190.09603881835938, 197.87429809570312, 205.65257263183594, 213.43084716796875, 221.2091064453125, 228.9873809814453, 236.76565551757812, 244.54391479492188]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 10.0, 9.0, 13.0, 10.0, 27.0, 46.0, 64.0, 71.0, 104.0, 144.0, 203.0, 271.0, 387.0, 467.0, 621.0, 840.0, 1105.0, 1487.0, 1928.0, 2588.0, 3425.0, 4996.0, 7646.0, 14104.0, 31745.0, 51302640.0, 48362.0, 18123.0, 9058.0, 5583.0, 3834.0, 2903.0, 2123.0, 1548.0, 1180.0, 933.0, 686.0, 550.0, 390.0, 290.0, 245.0, 174.0, 113.0, 96.0, 67.0, 50.0, 37.0, 19.0, 11.0, 14.0, 8.0, 7.0, 4.0, 1.0, 1.0], "bins": [-298.9438781738281, -290.31976318359375, -281.6956787109375, -273.0715637207031, -264.44744873046875, -255.82333374023438, -247.19923400878906, -238.57513427734375, -229.95101928710938, -221.326904296875, -212.7028045654297, -204.07870483398438, -195.45458984375, -186.83047485351562, -178.2063751220703, -169.582275390625, -160.95816040039062, -152.33404541015625, -143.70994567871094, -135.08584594726562, -126.46173095703125, -117.8376235961914, -109.21351623535156, -100.58940887451172, -91.96530151367188, -83.34119415283203, -74.71708679199219, -66.09297943115234, -57.4688720703125, -48.844764709472656, -40.22065734863281, -31.59654998779297, -22.972457885742188, -14.348350524902344, -5.7242431640625, 2.8998641967773438, 11.523971557617188, 20.14807891845703, 28.772186279296875, 37.39629364013672, 46.02040100097656, 54.644508361816406, 63.26861572265625, 71.8927230834961, 80.51683044433594, 89.14093780517578, 97.76504516601562, 106.38915252685547, 115.01325988769531, 123.63736724853516, 132.261474609375, 140.88558959960938, 149.5096893310547, 158.1337890625, 166.75790405273438, 175.38201904296875, 184.00611877441406, 192.63021850585938, 201.25433349609375, 209.87844848632812, 218.50254821777344, 227.12664794921875, 235.75076293945312, 244.3748779296875, 252.9989776611328]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 8.0, 6.0, 12.0, 6.0, 14.0, 18.0, 14.0, 18.0, 20.0, 28.0, 36.0, 34.0, 30.0, 48.0, 37.0, 49.0, 55.0, 56.0, 41.0, 50.0, 45.0, 41.0, 40.0, 40.0, 35.0, 26.0, 29.0, 20.0, 19.0, 18.0, 11.0, 10.0, 16.0, 9.0, 11.0, 7.0, 10.0, 4.0, 2.0, 2.0, 4.0, 3.0, 1.0], "bins": [-281.85919189453125, -274.5696716308594, -267.2801513671875, -259.9906311035156, -252.7011260986328, -245.41160583496094, -238.12210083007812, -230.83258056640625, -223.54306030273438, -216.2535400390625, -208.96401977539062, -201.6745147705078, -194.38499450683594, -187.09547424316406, -179.80596923828125, -172.51644897460938, -165.2269287109375, -157.93740844726562, -150.64788818359375, -143.35838317871094, -136.06886291503906, -128.7793426513672, -121.48983001708984, -114.2003173828125, -106.91079711914062, -99.62127685546875, -92.3317642211914, -85.04225158691406, -77.75273132324219, -70.46321105957031, -63.17369842529297, -55.88418197631836, -48.59468078613281, -41.3051643371582, -34.015647888183594, -26.726131439208984, -19.436614990234375, -12.147098541259766, -4.857582092285156, 2.431934356689453, 9.721450805664062, 17.010967254638672, 24.30048370361328, 31.59000015258789, 38.8795166015625, 46.16903305053711, 53.45854949951172, 60.74806594848633, 68.03758239746094, 75.32710266113281, 82.61661529541016, 89.9061279296875, 97.19564819335938, 104.48516845703125, 111.7746810913086, 119.06419372558594, 126.35371398925781, 133.6432342529297, 140.9327392578125, 148.22225952148438, 155.51177978515625, 162.80130004882812, 170.0908203125, 177.3803253173828, 184.6698455810547]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 0.0, 2.0, 3.0, 6.0, 7.0, 10.0, 4.0, 6.0, 15.0, 14.0, 11.0, 21.0, 16.0, 19.0, 25.0, 27.0, 40.0, 45.0, 40.0, 50.0, 52.0, 55.0, 80.0, 55.0, 43.0, 41.0, 42.0, 26.0, 35.0, 26.0, 26.0, 15.0, 26.0, 20.0, 9.0, 14.0, 13.0, 12.0, 14.0, 8.0, 8.0, 4.0, 3.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-339.97601318359375, -329.10198974609375, -318.22796630859375, -307.35394287109375, -296.4798889160156, -285.6058654785156, -274.7318420410156, -263.8578186035156, -252.98377990722656, -242.10975646972656, -231.2357177734375, -220.3616943359375, -209.4876708984375, -198.61363220214844, -187.73960876464844, -176.86557006835938, -165.99154663085938, -155.11752319335938, -144.2434844970703, -133.3694610595703, -122.49542999267578, -111.62139892578125, -100.74737548828125, -89.87334442138672, -78.99931335449219, -68.12528228759766, -57.25125503540039, -46.377227783203125, -35.503196716308594, -24.629165649414062, -13.755142211914062, -2.8811111450195312, 7.992919921875, 18.8669490814209, 29.740978240966797, 40.61500549316406, 51.489036560058594, 62.363067626953125, 73.23709106445312, 84.11112213134766, 94.98515319824219, 105.85918426513672, 116.73321533203125, 127.60723876953125, 138.48126220703125, 149.3553009033203, 160.2293243408203, 171.10336303710938, 181.97738647460938, 192.85140991210938, 203.72544860839844, 214.59947204589844, 225.4735107421875, 236.3475341796875, 247.2215576171875, 258.0955810546875, 268.9696044921875, 279.8436279296875, 290.7176513671875, 301.5916748046875, 312.4657287597656, 323.3397521972656, 334.2137756347656, 345.0877990722656, 355.96185302734375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 13.0, 24.0, 21.0, 28.0, 33.0, 46.0, 70.0, 100.0, 121.0, 173.0, 183.0, 278.0, 385.0, 514.0, 699.0, 1039.0, 1451.0, 2148.0, 3258.0, 5132.0, 8346.0, 14144.0, 26139.0, 51729.0, 116317.0, 350089.0, 2687356.0, 607702.0, 172616.0, 68434.0, 32045.0, 16948.0, 9517.0, 5820.0, 3585.0, 2508.0, 1611.0, 1119.0, 813.0, 559.0, 352.0, 277.0, 175.0, 126.0, 89.0, 48.0, 38.0, 30.0, 13.0, 8.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.4375, -11.097900390625, -10.75830078125, -10.418701171875, -10.0791015625, -9.739501953125, -9.39990234375, -9.060302734375, -8.720703125, -8.381103515625, -8.04150390625, -7.701904296875, -7.3623046875, -7.022705078125, -6.68310546875, -6.343505859375, -6.00390625, -5.664306640625, -5.32470703125, -4.985107421875, -4.6455078125, -4.305908203125, -3.96630859375, -3.626708984375, -3.287109375, -2.947509765625, -2.60791015625, -2.268310546875, -1.9287109375, -1.589111328125, -1.24951171875, -0.909912109375, -0.5703125, -0.230712890625, 0.10888671875, 0.448486328125, 0.7880859375, 1.127685546875, 1.46728515625, 1.806884765625, 2.146484375, 2.486083984375, 2.82568359375, 3.165283203125, 3.5048828125, 3.844482421875, 4.18408203125, 4.523681640625, 4.86328125, 5.202880859375, 5.54248046875, 5.882080078125, 6.2216796875, 6.561279296875, 6.90087890625, 7.240478515625, 7.580078125, 7.919677734375, 8.25927734375, 8.598876953125, 8.9384765625, 9.278076171875, 9.61767578125, 9.957275390625, 10.296875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 4.0, 10.0, 12.0, 12.0, 8.0, 15.0, 19.0, 25.0, 38.0, 47.0, 68.0, 75.0, 92.0, 123.0, 86.0, 92.0, 76.0, 54.0, 34.0, 29.0, 20.0, 17.0, 8.0, 3.0, 9.0, 1.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.57421875, -1.53094482421875, -1.4876708984375, -1.44439697265625, -1.401123046875, -1.35784912109375, -1.3145751953125, -1.27130126953125, -1.22802734375, -1.18475341796875, -1.1414794921875, -1.09820556640625, -1.054931640625, -1.01165771484375, -0.9683837890625, -0.92510986328125, -0.8818359375, -0.83856201171875, -0.7952880859375, -0.75201416015625, -0.708740234375, -0.66546630859375, -0.6221923828125, -0.57891845703125, -0.53564453125, -0.49237060546875, -0.4490966796875, -0.40582275390625, -0.362548828125, -0.31927490234375, -0.2760009765625, -0.23272705078125, -0.189453125, -0.14617919921875, -0.1029052734375, -0.05963134765625, -0.016357421875, 0.02691650390625, 0.0701904296875, 0.11346435546875, 0.15673828125, 0.20001220703125, 0.2432861328125, 0.28656005859375, 0.329833984375, 0.37310791015625, 0.4163818359375, 0.45965576171875, 0.5029296875, 0.54620361328125, 0.5894775390625, 0.63275146484375, 0.676025390625, 0.71929931640625, 0.7625732421875, 0.80584716796875, 0.84912109375, 0.89239501953125, 0.9356689453125, 0.97894287109375, 1.022216796875, 1.06549072265625, 1.1087646484375, 1.15203857421875, 1.1953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 10.0, 12.0, 20.0, 25.0, 57.0, 50.0, 92.0, 145.0, 247.0, 474.0, 1138.0, 3043.0, 9867.0, 41348.0, 226570.0, 2563696.0, 1157425.0, 148429.0, 29565.0, 7586.0, 2493.0, 931.0, 404.0, 228.0, 134.0, 82.0, 55.0, 40.0, 25.0, 22.0, 15.0, 8.0, 7.0, 6.0, 6.0, 7.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.1875, -15.645751953125, -15.10400390625, -14.562255859375, -14.0205078125, -13.478759765625, -12.93701171875, -12.395263671875, -11.853515625, -11.311767578125, -10.77001953125, -10.228271484375, -9.6865234375, -9.144775390625, -8.60302734375, -8.061279296875, -7.51953125, -6.977783203125, -6.43603515625, -5.894287109375, -5.3525390625, -4.810791015625, -4.26904296875, -3.727294921875, -3.185546875, -2.643798828125, -2.10205078125, -1.560302734375, -1.0185546875, -0.476806640625, 0.06494140625, 0.606689453125, 1.1484375, 1.690185546875, 2.23193359375, 2.773681640625, 3.3154296875, 3.857177734375, 4.39892578125, 4.940673828125, 5.482421875, 6.024169921875, 6.56591796875, 7.107666015625, 7.6494140625, 8.191162109375, 8.73291015625, 9.274658203125, 9.81640625, 10.358154296875, 10.89990234375, 11.441650390625, 11.9833984375, 12.525146484375, 13.06689453125, 13.608642578125, 14.150390625, 14.692138671875, 15.23388671875, 15.775634765625, 16.3173828125, 16.859130859375, 17.40087890625, 17.942626953125, 18.484375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 2.0, 6.0, 9.0, 14.0, 16.0, 12.0, 29.0, 31.0, 35.0, 39.0, 68.0, 76.0, 86.0, 131.0, 170.0, 268.0, 333.0, 828.0, 586.0, 315.0, 242.0, 185.0, 147.0, 102.0, 80.0, 61.0, 49.0, 28.0, 27.0, 30.0, 16.0, 11.0, 10.0, 12.0, 7.0, 6.0, 7.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4921875, -3.3790283203125, -3.265869140625, -3.1527099609375, -3.03955078125, -2.9263916015625, -2.813232421875, -2.7000732421875, -2.5869140625, -2.4737548828125, -2.360595703125, -2.2474365234375, -2.13427734375, -2.0211181640625, -1.907958984375, -1.7947998046875, -1.681640625, -1.5684814453125, -1.455322265625, -1.3421630859375, -1.22900390625, -1.1158447265625, -1.002685546875, -0.8895263671875, -0.7763671875, -0.6632080078125, -0.550048828125, -0.4368896484375, -0.32373046875, -0.2105712890625, -0.097412109375, 0.0157470703125, 0.12890625, 0.2420654296875, 0.355224609375, 0.4683837890625, 0.58154296875, 0.6947021484375, 0.807861328125, 0.9210205078125, 1.0341796875, 1.1473388671875, 1.260498046875, 1.3736572265625, 1.48681640625, 1.5999755859375, 1.713134765625, 1.8262939453125, 1.939453125, 2.0526123046875, 2.165771484375, 2.2789306640625, 2.39208984375, 2.5052490234375, 2.618408203125, 2.7315673828125, 2.8447265625, 2.9578857421875, 3.071044921875, 3.1842041015625, 3.29736328125, 3.4105224609375, 3.523681640625, 3.6368408203125, 3.75]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 15.0, 56.0, 147.0, 255.0, 268.0, 149.0, 77.0, 24.0, 11.0, 8.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.955406188964844, -23.580018997192383, -21.20462989807129, -18.829242706298828, -16.453853607177734, -14.078466415405273, -11.703079223632812, -9.327690124511719, -6.952302932739258, -4.5769147872924805, -2.2015271186828613, 0.1738605499267578, 2.549248695373535, 4.9246368408203125, 7.300024032592773, 9.675413131713867, 12.050800323486328, 14.426188468933105, 16.801576614379883, 19.176963806152344, 21.552352905273438, 23.9277400970459, 26.30312728881836, 28.678516387939453, 31.053903579711914, 33.429290771484375, 35.80467987060547, 38.18006896972656, 40.55545425415039, 42.930843353271484, 45.30622863769531, 47.681617736816406, 50.0570068359375, 52.432395935058594, 54.80778121948242, 57.183170318603516, 59.55855941772461, 61.93394470214844, 64.30933380126953, 66.68472290039062, 69.06011199951172, 71.43550109863281, 73.8108901977539, 76.186279296875, 78.56166076660156, 80.93704986572266, 83.31243896484375, 85.68782806396484, 88.06321716308594, 90.43860626220703, 92.81399536132812, 95.18937683105469, 97.56476593017578, 99.94015502929688, 102.31554412841797, 104.69093322753906, 107.06631469726562, 109.44170379638672, 111.81709289550781, 114.19247436523438, 116.56786346435547, 118.94325256347656, 121.31864166259766, 123.69403076171875, 126.06941986083984]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 5.0, 7.0, 12.0, 8.0, 20.0, 12.0, 24.0, 30.0, 21.0, 27.0, 35.0, 37.0, 42.0, 36.0, 36.0, 50.0, 39.0, 57.0, 47.0, 38.0, 48.0, 42.0, 41.0, 38.0, 33.0, 25.0, 29.0, 21.0, 23.0, 16.0, 15.0, 11.0, 16.0, 11.0, 12.0, 8.0, 1.0, 5.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.200023651123047, -17.639678955078125, -17.079336166381836, -16.518991470336914, -15.958647727966309, -15.398303985595703, -14.837959289550781, -14.277615547180176, -13.71727180480957, -13.156928062438965, -12.596583366394043, -12.036239624023438, -11.475895881652832, -10.915552139282227, -10.355207443237305, -9.7948637008667, -9.234519004821777, -8.674175262451172, -8.11383056640625, -7.5534868240356445, -6.993143081665039, -6.432798862457275, -5.872454643249512, -5.312110900878906, -4.751766681671143, -4.191422462463379, -3.6310787200927734, -3.0707345008850098, -2.510390520095825, -1.9500465393066406, -1.389702320098877, -0.8293583393096924, -0.2690143585205078, 0.29132968187332153, 0.8516737222671509, 1.412017822265625, 1.9723618030548096, 2.532705783843994, 3.093050003051758, 3.6533939838409424, 4.213737964630127, 4.774082183837891, 5.334425926208496, 5.89477014541626, 6.455114364624023, 7.015458106994629, 7.575802326202393, 8.136146545410156, 8.696490287780762, 9.256834030151367, 9.817178726196289, 10.377522468566895, 10.9378662109375, 11.498210906982422, 12.058554649353027, 12.618898391723633, 13.179243087768555, 13.73958683013916, 14.299931526184082, 14.860275268554688, 15.420619010925293, 15.980962753295898, 16.54130744934082, 17.101652145385742, 17.66199493408203]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 5.0, 7.0, 11.0, 9.0, 21.0, 19.0, 40.0, 52.0, 79.0, 104.0, 173.0, 210.0, 312.0, 412.0, 573.0, 865.0, 1292.0, 1912.0, 3076.0, 5020.0, 8467.0, 16013.0, 31552.0, 68261.0, 158708.0, 297535.0, 242572.0, 109241.0, 48374.0, 23163.0, 11949.0, 6792.0, 4088.0, 2457.0, 1592.0, 1106.0, 731.0, 540.0, 358.0, 245.0, 189.0, 140.0, 86.0, 68.0, 38.0, 25.0, 28.0, 18.0, 7.0, 11.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.9921875, -9.6873779296875, -9.382568359375, -9.0777587890625, -8.77294921875, -8.4681396484375, -8.163330078125, -7.8585205078125, -7.5537109375, -7.2489013671875, -6.944091796875, -6.6392822265625, -6.33447265625, -6.0296630859375, -5.724853515625, -5.4200439453125, -5.115234375, -4.8104248046875, -4.505615234375, -4.2008056640625, -3.89599609375, -3.5911865234375, -3.286376953125, -2.9815673828125, -2.6767578125, -2.3719482421875, -2.067138671875, -1.7623291015625, -1.45751953125, -1.1527099609375, -0.847900390625, -0.5430908203125, -0.23828125, 0.0665283203125, 0.371337890625, 0.6761474609375, 0.98095703125, 1.2857666015625, 1.590576171875, 1.8953857421875, 2.2001953125, 2.5050048828125, 2.809814453125, 3.1146240234375, 3.41943359375, 3.7242431640625, 4.029052734375, 4.3338623046875, 4.638671875, 4.9434814453125, 5.248291015625, 5.5531005859375, 5.85791015625, 6.1627197265625, 6.467529296875, 6.7723388671875, 7.0771484375, 7.3819580078125, 7.686767578125, 7.9915771484375, 8.29638671875, 8.6011962890625, 8.906005859375, 9.2108154296875, 9.515625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 11.0, 13.0, 13.0, 26.0, 24.0, 34.0, 47.0, 59.0, 84.0, 96.0, 97.0, 95.0, 102.0, 74.0, 61.0, 52.0, 23.0, 23.0, 9.0, 11.0, 8.0, 5.0, 10.0, 3.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.126953125, -2.0718841552734375, -2.016815185546875, -1.9617462158203125, -1.90667724609375, -1.8516082763671875, -1.796539306640625, -1.7414703369140625, -1.6864013671875, -1.6313323974609375, -1.576263427734375, -1.5211944580078125, -1.46612548828125, -1.4110565185546875, -1.355987548828125, -1.3009185791015625, -1.245849609375, -1.1907806396484375, -1.135711669921875, -1.0806427001953125, -1.02557373046875, -0.9705047607421875, -0.915435791015625, -0.8603668212890625, -0.8052978515625, -0.7502288818359375, -0.695159912109375, -0.6400909423828125, -0.58502197265625, -0.5299530029296875, -0.474884033203125, -0.4198150634765625, -0.36474609375, -0.3096771240234375, -0.254608154296875, -0.1995391845703125, -0.14447021484375, -0.0894012451171875, -0.034332275390625, 0.0207366943359375, 0.0758056640625, 0.1308746337890625, 0.185943603515625, 0.2410125732421875, 0.29608154296875, 0.3511505126953125, 0.406219482421875, 0.4612884521484375, 0.516357421875, 0.5714263916015625, 0.626495361328125, 0.6815643310546875, 0.73663330078125, 0.7917022705078125, 0.846771240234375, 0.9018402099609375, 0.9569091796875, 1.0119781494140625, 1.067047119140625, 1.1221160888671875, 1.17718505859375, 1.2322540283203125, 1.287322998046875, 1.3423919677734375, 1.3974609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 15.0, 12.0, 16.0, 25.0, 33.0, 51.0, 72.0, 109.0, 252.0, 400.0, 778.0, 1478.0, 2957.0, 6326.0, 14603.0, 44449.0, 243129.0, 571886.0, 115213.0, 26931.0, 10272.0, 4696.0, 2262.0, 1155.0, 627.0, 321.0, 173.0, 115.0, 45.0, 41.0, 20.0, 17.0, 15.0, 12.0, 8.0, 6.0, 4.0, 5.0, 4.0, 1.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.049072265625, -16.50439453125, -15.959716796875, -15.4150390625, -14.870361328125, -14.32568359375, -13.781005859375, -13.236328125, -12.691650390625, -12.14697265625, -11.602294921875, -11.0576171875, -10.512939453125, -9.96826171875, -9.423583984375, -8.87890625, -8.334228515625, -7.78955078125, -7.244873046875, -6.7001953125, -6.155517578125, -5.61083984375, -5.066162109375, -4.521484375, -3.976806640625, -3.43212890625, -2.887451171875, -2.3427734375, -1.798095703125, -1.25341796875, -0.708740234375, -0.1640625, 0.380615234375, 0.92529296875, 1.469970703125, 2.0146484375, 2.559326171875, 3.10400390625, 3.648681640625, 4.193359375, 4.738037109375, 5.28271484375, 5.827392578125, 6.3720703125, 6.916748046875, 7.46142578125, 8.006103515625, 8.55078125, 9.095458984375, 9.64013671875, 10.184814453125, 10.7294921875, 11.274169921875, 11.81884765625, 12.363525390625, 12.908203125, 13.452880859375, 13.99755859375, 14.542236328125, 15.0869140625, 15.631591796875, 16.17626953125, 16.720947265625, 17.265625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 0.0, 4.0, 10.0, 6.0, 5.0, 11.0, 16.0, 10.0, 18.0, 24.0, 17.0, 23.0, 34.0, 25.0, 24.0, 31.0, 44.0, 33.0, 48.0, 42.0, 37.0, 39.0, 44.0, 47.0, 49.0, 34.0, 40.0, 36.0, 27.0, 31.0, 35.0, 21.0, 21.0, 20.0, 17.0, 11.0, 9.0, 12.0, 12.0, 1.0, 8.0, 4.0, 6.0, 3.0, 1.0, 0.0, 4.0, 0.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.5546875, -8.2862548828125, -8.017822265625, -7.7493896484375, -7.48095703125, -7.2125244140625, -6.944091796875, -6.6756591796875, -6.4072265625, -6.1387939453125, -5.870361328125, -5.6019287109375, -5.33349609375, -5.0650634765625, -4.796630859375, -4.5281982421875, -4.259765625, -3.9913330078125, -3.722900390625, -3.4544677734375, -3.18603515625, -2.9176025390625, -2.649169921875, -2.3807373046875, -2.1123046875, -1.8438720703125, -1.575439453125, -1.3070068359375, -1.03857421875, -0.7701416015625, -0.501708984375, -0.2332763671875, 0.03515625, 0.3035888671875, 0.572021484375, 0.8404541015625, 1.10888671875, 1.3773193359375, 1.645751953125, 1.9141845703125, 2.1826171875, 2.4510498046875, 2.719482421875, 2.9879150390625, 3.25634765625, 3.5247802734375, 3.793212890625, 4.0616455078125, 4.330078125, 4.5985107421875, 4.866943359375, 5.1353759765625, 5.40380859375, 5.6722412109375, 5.940673828125, 6.2091064453125, 6.4775390625, 6.7459716796875, 7.014404296875, 7.2828369140625, 7.55126953125, 7.8197021484375, 8.088134765625, 8.3565673828125, 8.625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 12.0, 14.0, 24.0, 39.0, 59.0, 79.0, 148.0, 200.0, 379.0, 593.0, 1118.0, 2244.0, 4933.0, 12559.0, 42811.0, 285708.0, 589483.0, 76172.0, 18930.0, 6839.0, 2819.0, 1455.0, 809.0, 433.0, 231.0, 157.0, 113.0, 68.0, 30.0, 28.0, 10.0, 11.0, 12.0, 6.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.0625, -24.232177734375, -23.40185546875, -22.571533203125, -21.7412109375, -20.910888671875, -20.08056640625, -19.250244140625, -18.419921875, -17.589599609375, -16.75927734375, -15.928955078125, -15.0986328125, -14.268310546875, -13.43798828125, -12.607666015625, -11.77734375, -10.947021484375, -10.11669921875, -9.286376953125, -8.4560546875, -7.625732421875, -6.79541015625, -5.965087890625, -5.134765625, -4.304443359375, -3.47412109375, -2.643798828125, -1.8134765625, -0.983154296875, -0.15283203125, 0.677490234375, 1.5078125, 2.338134765625, 3.16845703125, 3.998779296875, 4.8291015625, 5.659423828125, 6.48974609375, 7.320068359375, 8.150390625, 8.980712890625, 9.81103515625, 10.641357421875, 11.4716796875, 12.302001953125, 13.13232421875, 13.962646484375, 14.79296875, 15.623291015625, 16.45361328125, 17.283935546875, 18.1142578125, 18.944580078125, 19.77490234375, 20.605224609375, 21.435546875, 22.265869140625, 23.09619140625, 23.926513671875, 24.7568359375, 25.587158203125, 26.41748046875, 27.247802734375, 28.078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 5.0, 2.0, 3.0, 8.0, 16.0, 17.0, 30.0, 34.0, 73.0, 112.0, 173.0, 184.0, 141.0, 69.0, 45.0, 26.0, 20.0, 11.0, 6.0, 12.0, 5.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00402069091796875, -0.003909289836883545, -0.00379788875579834, -0.0036864876747131348, -0.0035750865936279297, -0.0034636855125427246, -0.0033522844314575195, -0.0032408833503723145, -0.0031294822692871094, -0.0030180811882019043, -0.0029066801071166992, -0.002795279026031494, -0.002683877944946289, -0.002572476863861084, -0.002461075782775879, -0.002349674701690674, -0.0022382736206054688, -0.0021268725395202637, -0.0020154714584350586, -0.0019040703773498535, -0.0017926692962646484, -0.0016812682151794434, -0.0015698671340942383, -0.0014584660530090332, -0.0013470649719238281, -0.001235663890838623, -0.001124262809753418, -0.0010128617286682129, -0.0009014606475830078, -0.0007900595664978027, -0.0006786584854125977, -0.0005672574043273926, -0.0004558563232421875, -0.0003444552421569824, -0.00023305416107177734, -0.00012165307998657227, -1.0251998901367188e-05, 0.00010114908218383789, 0.00021255016326904297, 0.00032395124435424805, 0.0004353523254394531, 0.0005467534065246582, 0.0006581544876098633, 0.0007695555686950684, 0.0008809566497802734, 0.0009923577308654785, 0.0011037588119506836, 0.0012151598930358887, 0.0013265609741210938, 0.0014379620552062988, 0.001549363136291504, 0.001660764217376709, 0.001772165298461914, 0.0018835663795471191, 0.0019949674606323242, 0.0021063685417175293, 0.0022177696228027344, 0.0023291707038879395, 0.0024405717849731445, 0.0025519728660583496, 0.0026633739471435547, 0.0027747750282287598, 0.002886176109313965, 0.00299757719039917, 0.003108978271484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 8.0, 22.0, 29.0, 39.0, 68.0, 115.0, 205.0, 405.0, 778.0, 1648.0, 3674.0, 9445.0, 30815.0, 221249.0, 672411.0, 78970.0, 17413.0, 6252.0, 2568.0, 1195.0, 571.0, 275.0, 147.0, 98.0, 65.0, 27.0, 13.0, 13.0, 13.0, 4.0, 5.0, 0.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.765625, -24.021484375, -23.27734375, -22.533203125, -21.7890625, -21.044921875, -20.30078125, -19.556640625, -18.8125, -18.068359375, -17.32421875, -16.580078125, -15.8359375, -15.091796875, -14.34765625, -13.603515625, -12.859375, -12.115234375, -11.37109375, -10.626953125, -9.8828125, -9.138671875, -8.39453125, -7.650390625, -6.90625, -6.162109375, -5.41796875, -4.673828125, -3.9296875, -3.185546875, -2.44140625, -1.697265625, -0.953125, -0.208984375, 0.53515625, 1.279296875, 2.0234375, 2.767578125, 3.51171875, 4.255859375, 5.0, 5.744140625, 6.48828125, 7.232421875, 7.9765625, 8.720703125, 9.46484375, 10.208984375, 10.953125, 11.697265625, 12.44140625, 13.185546875, 13.9296875, 14.673828125, 15.41796875, 16.162109375, 16.90625, 17.650390625, 18.39453125, 19.138671875, 19.8828125, 20.626953125, 21.37109375, 22.115234375, 22.859375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 13.0, 7.0, 12.0, 17.0, 24.0, 31.0, 40.0, 50.0, 52.0, 55.0, 67.0, 62.0, 78.0, 88.0, 78.0, 54.0, 59.0, 46.0, 39.0, 29.0, 29.0, 15.0, 11.0, 14.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3046875, -9.9866943359375, -9.668701171875, -9.3507080078125, -9.03271484375, -8.7147216796875, -8.396728515625, -8.0787353515625, -7.7607421875, -7.4427490234375, -7.124755859375, -6.8067626953125, -6.48876953125, -6.1707763671875, -5.852783203125, -5.5347900390625, -5.216796875, -4.8988037109375, -4.580810546875, -4.2628173828125, -3.94482421875, -3.6268310546875, -3.308837890625, -2.9908447265625, -2.6728515625, -2.3548583984375, -2.036865234375, -1.7188720703125, -1.40087890625, -1.0828857421875, -0.764892578125, -0.4468994140625, -0.12890625, 0.1890869140625, 0.507080078125, 0.8250732421875, 1.14306640625, 1.4610595703125, 1.779052734375, 2.0970458984375, 2.4150390625, 2.7330322265625, 3.051025390625, 3.3690185546875, 3.68701171875, 4.0050048828125, 4.322998046875, 4.6409912109375, 4.958984375, 5.2769775390625, 5.594970703125, 5.9129638671875, 6.23095703125, 6.5489501953125, 6.866943359375, 7.1849365234375, 7.5029296875, 7.8209228515625, 8.138916015625, 8.4569091796875, 8.77490234375, 9.0928955078125, 9.410888671875, 9.7288818359375, 10.046875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 11.0, 22.0, 18.0, 39.0, 153.0, 400.0, 225.0, 66.0, 24.0, 16.0, 11.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-353.36859130859375, -342.2578125, -331.14703369140625, -320.0362548828125, -308.9255065917969, -297.8147277832031, -286.7039489746094, -275.5931701660156, -264.4823913574219, -253.37161254882812, -242.26084899902344, -231.1500701904297, -220.03929138183594, -208.92852783203125, -197.8177490234375, -186.70697021484375, -175.59620666503906, -164.4854278564453, -153.37466430664062, -142.26388549804688, -131.15310668945312, -120.0423355102539, -108.93156433105469, -97.82078552246094, -86.71001434326172, -75.5992431640625, -64.48846435546875, -53.37769317626953, -42.26691818237305, -31.156143188476562, -20.045372009277344, -8.934593200683594, 2.176177978515625, 13.286952018737793, 24.39772605895996, 35.50849914550781, 46.6192741394043, 57.73004913330078, 68.8408203125, 79.95159912109375, 91.06237030029297, 102.17314147949219, 113.28392028808594, 124.39469146728516, 135.50546264648438, 146.61624145507812, 157.72702026367188, 168.83779907226562, 179.9485626220703, 191.05934143066406, 202.17010498046875, 213.2808837890625, 224.39166259765625, 235.50244140625, 246.6132049560547, 257.7239990234375, 268.8347473144531, 279.9455261230469, 291.0563049316406, 302.16705322265625, 313.27783203125, 324.38861083984375, 335.4993896484375, 346.61016845703125, 357.720947265625]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 6.0, 4.0, 7.0, 7.0, 10.0, 17.0, 20.0, 32.0, 46.0, 96.0, 128.0, 146.0, 128.0, 122.0, 71.0, 47.0, 19.0, 13.0, 17.0, 9.0, 6.0, 7.0, 3.0, 1.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.73660278320312, -150.3291778564453, -144.9217529296875, -139.51431274414062, -134.1068878173828, -128.699462890625, -123.29203796386719, -117.88461303710938, -112.47718811035156, -107.06976318359375, -101.6623306274414, -96.2549057006836, -90.84748077392578, -85.44004821777344, -80.03262329101562, -74.62519836425781, -69.21776580810547, -63.81033706665039, -58.40291213989258, -52.9954833984375, -47.58805847167969, -42.18062973022461, -36.77320098876953, -31.36577606201172, -25.95834732055664, -20.550920486450195, -15.143492698669434, -9.736064910888672, -4.328638076782227, 1.0787887573242188, 6.486217498779297, 11.89364242553711, 17.301071166992188, 22.708498001098633, 28.115924835205078, 33.523353576660156, 38.93077850341797, 44.33820724487305, 49.745635986328125, 55.15306091308594, 60.560489654541016, 65.9679183959961, 71.3753433227539, 76.78277587890625, 82.19020080566406, 87.59762573242188, 93.00505065917969, 98.4124755859375, 103.81990814208984, 109.22733306884766, 114.634765625, 120.04219055175781, 125.44961547851562, 130.85704040527344, 136.26446533203125, 141.67190551757812, 147.07933044433594, 152.48675537109375, 157.89418029785156, 163.30160522460938, 168.70904541015625, 174.11647033691406, 179.52389526367188, 184.9313201904297, 190.3387451171875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 5.0, 5.0, 16.0, 18.0, 42.0, 63.0, 108.0, 187.0, 265.0, 493.0, 965.0, 2008.0, 4697.0, 13668.0, 53639.0, 488710.0, 3491201.0, 104933.0, 21619.0, 6664.0, 2526.0, 1075.0, 583.0, 321.0, 162.0, 101.0, 76.0, 45.0, 29.0, 27.0, 11.0, 9.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.625, -40.09423828125, -38.5634765625, -37.03271484375, -35.501953125, -33.97119140625, -32.4404296875, -30.90966796875, -29.37890625, -27.84814453125, -26.3173828125, -24.78662109375, -23.255859375, -21.72509765625, -20.1943359375, -18.66357421875, -17.1328125, -15.60205078125, -14.0712890625, -12.54052734375, -11.009765625, -9.47900390625, -7.9482421875, -6.41748046875, -4.88671875, -3.35595703125, -1.8251953125, -0.29443359375, 1.236328125, 2.76708984375, 4.2978515625, 5.82861328125, 7.359375, 8.89013671875, 10.4208984375, 11.95166015625, 13.482421875, 15.01318359375, 16.5439453125, 18.07470703125, 19.60546875, 21.13623046875, 22.6669921875, 24.19775390625, 25.728515625, 27.25927734375, 28.7900390625, 30.32080078125, 31.8515625, 33.38232421875, 34.9130859375, 36.44384765625, 37.974609375, 39.50537109375, 41.0361328125, 42.56689453125, 44.09765625, 45.62841796875, 47.1591796875, 48.68994140625, 50.220703125, 51.75146484375, 53.2822265625, 54.81298828125, 56.34375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 9.0, 14.0, 9.0, 24.0, 17.0, 25.0, 40.0, 49.0, 62.0, 57.0, 94.0, 97.0, 77.0, 76.0, 78.0, 54.0, 64.0, 38.0, 26.0, 17.0, 15.0, 10.0, 6.0, 7.0, 9.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.9072265625, -1.8523101806640625, -1.797393798828125, -1.7424774169921875, -1.68756103515625, -1.6326446533203125, -1.577728271484375, -1.5228118896484375, -1.4678955078125, -1.4129791259765625, -1.358062744140625, -1.3031463623046875, -1.24822998046875, -1.1933135986328125, -1.138397216796875, -1.0834808349609375, -1.028564453125, -0.9736480712890625, -0.918731689453125, -0.8638153076171875, -0.80889892578125, -0.7539825439453125, -0.699066162109375, -0.6441497802734375, -0.5892333984375, -0.5343170166015625, -0.479400634765625, -0.4244842529296875, -0.36956787109375, -0.3146514892578125, -0.259735107421875, -0.2048187255859375, -0.14990234375, -0.0949859619140625, -0.040069580078125, 0.0148468017578125, 0.06976318359375, 0.1246795654296875, 0.179595947265625, 0.2345123291015625, 0.2894287109375, 0.3443450927734375, 0.399261474609375, 0.4541778564453125, 0.50909423828125, 0.5640106201171875, 0.618927001953125, 0.6738433837890625, 0.728759765625, 0.7836761474609375, 0.838592529296875, 0.8935089111328125, 0.94842529296875, 1.0033416748046875, 1.058258056640625, 1.1131744384765625, 1.1680908203125, 1.2230072021484375, 1.277923583984375, 1.3328399658203125, 1.38775634765625, 1.4426727294921875, 1.497589111328125, 1.5525054931640625, 1.607421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 6.0, 3.0, 11.0, 14.0, 21.0, 26.0, 37.0, 80.0, 103.0, 179.0, 338.0, 635.0, 1292.0, 2827.0, 7229.0, 21769.0, 81146.0, 425508.0, 2997040.0, 522910.0, 95006.0, 24379.0, 7778.0, 3017.0, 1384.0, 665.0, 337.0, 202.0, 126.0, 74.0, 42.0, 34.0, 21.0, 10.0, 8.0, 3.0, 3.0, 5.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-29.8125, -28.996826171875, -28.18115234375, -27.365478515625, -26.5498046875, -25.734130859375, -24.91845703125, -24.102783203125, -23.287109375, -22.471435546875, -21.65576171875, -20.840087890625, -20.0244140625, -19.208740234375, -18.39306640625, -17.577392578125, -16.76171875, -15.946044921875, -15.13037109375, -14.314697265625, -13.4990234375, -12.683349609375, -11.86767578125, -11.052001953125, -10.236328125, -9.420654296875, -8.60498046875, -7.789306640625, -6.9736328125, -6.157958984375, -5.34228515625, -4.526611328125, -3.7109375, -2.895263671875, -2.07958984375, -1.263916015625, -0.4482421875, 0.367431640625, 1.18310546875, 1.998779296875, 2.814453125, 3.630126953125, 4.44580078125, 5.261474609375, 6.0771484375, 6.892822265625, 7.70849609375, 8.524169921875, 9.33984375, 10.155517578125, 10.97119140625, 11.786865234375, 12.6025390625, 13.418212890625, 14.23388671875, 15.049560546875, 15.865234375, 16.680908203125, 17.49658203125, 18.312255859375, 19.1279296875, 19.943603515625, 20.75927734375, 21.574951171875, 22.390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 11.0, 16.0, 23.0, 39.0, 46.0, 62.0, 115.0, 174.0, 297.0, 558.0, 1278.0, 542.0, 301.0, 216.0, 140.0, 80.0, 50.0, 45.0, 13.0, 12.0, 13.0, 12.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.53125, -4.3828125, -4.234375, -4.0859375, -3.9375, -3.7890625, -3.640625, -3.4921875, -3.34375, -3.1953125, -3.046875, -2.8984375, -2.75, -2.6015625, -2.453125, -2.3046875, -2.15625, -2.0078125, -1.859375, -1.7109375, -1.5625, -1.4140625, -1.265625, -1.1171875, -0.96875, -0.8203125, -0.671875, -0.5234375, -0.375, -0.2265625, -0.078125, 0.0703125, 0.21875, 0.3671875, 0.515625, 0.6640625, 0.8125, 0.9609375, 1.109375, 1.2578125, 1.40625, 1.5546875, 1.703125, 1.8515625, 2.0, 2.1484375, 2.296875, 2.4453125, 2.59375, 2.7421875, 2.890625, 3.0390625, 3.1875, 3.3359375, 3.484375, 3.6328125, 3.78125, 3.9296875, 4.078125, 4.2265625, 4.375, 4.5234375, 4.671875, 4.8203125, 4.96875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 13.0, 32.0, 66.0, 167.0, 321.0, 250.0, 95.0, 33.0, 12.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.17215347290039, -51.10664749145508, -49.04114532470703, -46.97563934326172, -44.910133361816406, -42.844627380371094, -40.77912139892578, -38.713619232177734, -36.64811325073242, -34.58260726928711, -32.51710510253906, -30.45159912109375, -28.386093139648438, -26.320587158203125, -24.255083084106445, -22.189579010009766, -20.124073028564453, -18.05856704711914, -15.993062973022461, -13.927557945251465, -11.862052917480469, -9.796547889709473, -7.731042861938477, -5.6655378341674805, -3.6000328063964844, -1.5345277786254883, 0.5309772491455078, 2.596482276916504, 4.6619873046875, 6.727492332458496, 8.792997360229492, 10.858502388000488, 12.924003601074219, 14.989508628845215, 17.05501365661621, 19.12051773071289, 21.186023712158203, 23.251529693603516, 25.317033767700195, 27.382537841796875, 29.448043823242188, 31.5135498046875, 33.57905578613281, 35.64455795288086, 37.71006393432617, 39.775569915771484, 41.84107208251953, 43.906578063964844, 45.972084045410156, 48.03759002685547, 50.10309600830078, 52.16859817504883, 54.23410415649414, 56.29961013793945, 58.3651123046875, 60.43061828613281, 62.496124267578125, 64.56163024902344, 66.62713623046875, 68.69264221191406, 70.75814819335938, 72.82364654541016, 74.88915252685547, 76.95465850830078, 79.0201644897461]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 3.0, 7.0, 4.0, 14.0, 8.0, 19.0, 21.0, 32.0, 40.0, 51.0, 73.0, 57.0, 67.0, 77.0, 70.0, 70.0, 59.0, 69.0, 41.0, 46.0, 34.0, 26.0, 24.0, 21.0, 8.0, 12.0, 4.0, 6.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.335447311401367, -18.68726348876953, -18.039077758789062, -17.390893936157227, -16.74271011352539, -16.094524383544922, -15.446340560913086, -14.798155784606934, -14.149971008300781, -13.501786231994629, -12.853601455688477, -12.20541763305664, -11.557232856750488, -10.909048080444336, -10.2608642578125, -9.612679481506348, -8.964494705200195, -8.316309928894043, -7.668125629425049, -7.019941329956055, -6.371756553649902, -5.72357177734375, -5.075387477874756, -4.427203178405762, -3.7790184020996094, -3.130833864212036, -2.482649326324463, -1.8344647884368896, -1.1862802505493164, -0.5380957126617432, 0.11008882522583008, 0.7582731246948242, 1.4064559936523438, 2.054640531539917, 2.7028250694274902, 3.3510096073150635, 3.9991941452026367, 4.647378921508789, 5.295563220977783, 5.943747520446777, 6.59193229675293, 7.240117073059082, 7.888301372528076, 8.53648567199707, 9.184670448303223, 9.832855224609375, 10.481039047241211, 11.129223823547363, 11.777408599853516, 12.425593376159668, 13.07377815246582, 13.721961975097656, 14.370146751403809, 15.018331527709961, 15.666515350341797, 16.314701080322266, 16.9628849029541, 17.611068725585938, 18.259254455566406, 18.907438278198242, 19.555622100830078, 20.203807830810547, 20.851991653442383, 21.50017547607422, 22.148361206054688]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 8.0, 5.0, 14.0, 8.0, 9.0, 31.0, 26.0, 42.0, 52.0, 109.0, 280.0, 1797.0, 17639.0, 307383.0, 673021.0, 43483.0, 3767.0, 553.0, 136.0, 53.0, 29.0, 33.0, 16.0, 15.0, 15.0, 7.0, 7.0, 3.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-45.375, -44.154296875, -42.93359375, -41.712890625, -40.4921875, -39.271484375, -38.05078125, -36.830078125, -35.609375, -34.388671875, -33.16796875, -31.947265625, -30.7265625, -29.505859375, -28.28515625, -27.064453125, -25.84375, -24.623046875, -23.40234375, -22.181640625, -20.9609375, -19.740234375, -18.51953125, -17.298828125, -16.078125, -14.857421875, -13.63671875, -12.416015625, -11.1953125, -9.974609375, -8.75390625, -7.533203125, -6.3125, -5.091796875, -3.87109375, -2.650390625, -1.4296875, -0.208984375, 1.01171875, 2.232421875, 3.453125, 4.673828125, 5.89453125, 7.115234375, 8.3359375, 9.556640625, 10.77734375, 11.998046875, 13.21875, 14.439453125, 15.66015625, 16.880859375, 18.1015625, 19.322265625, 20.54296875, 21.763671875, 22.984375, 24.205078125, 25.42578125, 26.646484375, 27.8671875, 29.087890625, 30.30859375, 31.529296875, 32.75]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 5.0, 11.0, 11.0, 13.0, 33.0, 35.0, 43.0, 47.0, 61.0, 82.0, 78.0, 78.0, 108.0, 80.0, 75.0, 64.0, 61.0, 40.0, 28.0, 18.0, 13.0, 7.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2010040283203125, -1.143218994140625, -1.0854339599609375, -1.02764892578125, -0.9698638916015625, -0.912078857421875, -0.8542938232421875, -0.7965087890625, -0.7387237548828125, -0.680938720703125, -0.6231536865234375, -0.56536865234375, -0.5075836181640625, -0.449798583984375, -0.3920135498046875, -0.334228515625, -0.2764434814453125, -0.218658447265625, -0.1608734130859375, -0.10308837890625, -0.0453033447265625, 0.012481689453125, 0.0702667236328125, 0.1280517578125, 0.1858367919921875, 0.243621826171875, 0.3014068603515625, 0.35919189453125, 0.4169769287109375, 0.474761962890625, 0.5325469970703125, 0.59033203125, 0.6481170654296875, 0.705902099609375, 0.7636871337890625, 0.82147216796875, 0.8792572021484375, 0.937042236328125, 0.9948272705078125, 1.0526123046875, 1.1103973388671875, 1.168182373046875, 1.2259674072265625, 1.28375244140625, 1.3415374755859375, 1.399322509765625, 1.4571075439453125, 1.514892578125, 1.5726776123046875, 1.630462646484375, 1.6882476806640625, 1.74603271484375, 1.8038177490234375, 1.861602783203125, 1.9193878173828125, 1.9771728515625, 2.0349578857421875, 2.092742919921875, 2.1505279541015625, 2.20831298828125, 2.2660980224609375, 2.323883056640625, 2.3816680908203125, 2.439453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 6.0, 16.0, 20.0, 27.0, 74.0, 175.0, 293.0, 718.0, 1884.0, 5455.0, 18714.0, 80539.0, 373433.0, 436505.0, 99056.0, 21930.0, 6202.0, 2083.0, 716.0, 345.0, 155.0, 84.0, 33.0, 33.0, 14.0, 5.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.6695556640625, -11.221923828125, -10.7742919921875, -10.32666015625, -9.8790283203125, -9.431396484375, -8.9837646484375, -8.5361328125, -8.0885009765625, -7.640869140625, -7.1932373046875, -6.74560546875, -6.2979736328125, -5.850341796875, -5.4027099609375, -4.955078125, -4.5074462890625, -4.059814453125, -3.6121826171875, -3.16455078125, -2.7169189453125, -2.269287109375, -1.8216552734375, -1.3740234375, -0.9263916015625, -0.478759765625, -0.0311279296875, 0.41650390625, 0.8641357421875, 1.311767578125, 1.7593994140625, 2.20703125, 2.6546630859375, 3.102294921875, 3.5499267578125, 3.99755859375, 4.4451904296875, 4.892822265625, 5.3404541015625, 5.7880859375, 6.2357177734375, 6.683349609375, 7.1309814453125, 7.57861328125, 8.0262451171875, 8.473876953125, 8.9215087890625, 9.369140625, 9.8167724609375, 10.264404296875, 10.7120361328125, 11.15966796875, 11.6072998046875, 12.054931640625, 12.5025634765625, 12.9501953125, 13.3978271484375, 13.845458984375, 14.2930908203125, 14.74072265625, 15.1883544921875, 15.635986328125, 16.0836181640625, 16.53125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 9.0, 4.0, 8.0, 13.0, 14.0, 8.0, 18.0, 26.0, 24.0, 29.0, 30.0, 39.0, 38.0, 39.0, 40.0, 50.0, 34.0, 51.0, 57.0, 51.0, 39.0, 38.0, 52.0, 44.0, 31.0, 25.0, 42.0, 30.0, 20.0, 19.0, 20.0, 9.0, 15.0, 11.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.9085693359375, -5.707763671875, -5.5069580078125, -5.30615234375, -5.1053466796875, -4.904541015625, -4.7037353515625, -4.5029296875, -4.3021240234375, -4.101318359375, -3.9005126953125, -3.69970703125, -3.4989013671875, -3.298095703125, -3.0972900390625, -2.896484375, -2.6956787109375, -2.494873046875, -2.2940673828125, -2.09326171875, -1.8924560546875, -1.691650390625, -1.4908447265625, -1.2900390625, -1.0892333984375, -0.888427734375, -0.6876220703125, -0.48681640625, -0.2860107421875, -0.085205078125, 0.1156005859375, 0.31640625, 0.5172119140625, 0.718017578125, 0.9188232421875, 1.11962890625, 1.3204345703125, 1.521240234375, 1.7220458984375, 1.9228515625, 2.1236572265625, 2.324462890625, 2.5252685546875, 2.72607421875, 2.9268798828125, 3.127685546875, 3.3284912109375, 3.529296875, 3.7301025390625, 3.930908203125, 4.1317138671875, 4.33251953125, 4.5333251953125, 4.734130859375, 4.9349365234375, 5.1357421875, 5.3365478515625, 5.537353515625, 5.7381591796875, 5.93896484375, 6.1397705078125, 6.340576171875, 6.5413818359375, 6.7421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 10.0, 18.0, 28.0, 47.0, 89.0, 229.0, 420.0, 1258.0, 4130.0, 19607.0, 198796.0, 728111.0, 80707.0, 10904.0, 2689.0, 889.0, 312.0, 151.0, 84.0, 32.0, 16.0, 10.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.0625, -36.165771484375, -35.26904296875, -34.372314453125, -33.4755859375, -32.578857421875, -31.68212890625, -30.785400390625, -29.888671875, -28.991943359375, -28.09521484375, -27.198486328125, -26.3017578125, -25.405029296875, -24.50830078125, -23.611572265625, -22.71484375, -21.818115234375, -20.92138671875, -20.024658203125, -19.1279296875, -18.231201171875, -17.33447265625, -16.437744140625, -15.541015625, -14.644287109375, -13.74755859375, -12.850830078125, -11.9541015625, -11.057373046875, -10.16064453125, -9.263916015625, -8.3671875, -7.470458984375, -6.57373046875, -5.677001953125, -4.7802734375, -3.883544921875, -2.98681640625, -2.090087890625, -1.193359375, -0.296630859375, 0.60009765625, 1.496826171875, 2.3935546875, 3.290283203125, 4.18701171875, 5.083740234375, 5.98046875, 6.877197265625, 7.77392578125, 8.670654296875, 9.5673828125, 10.464111328125, 11.36083984375, 12.257568359375, 13.154296875, 14.051025390625, 14.94775390625, 15.844482421875, 16.7412109375, 17.637939453125, 18.53466796875, 19.431396484375, 20.328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 5.0, 9.0, 6.0, 21.0, 11.0, 16.0, 30.0, 28.0, 33.0, 41.0, 55.0, 49.0, 70.0, 63.0, 98.0, 63.0, 78.0, 56.0, 51.0, 47.0, 24.0, 27.0, 16.0, 20.0, 13.0, 10.0, 6.0, 5.0, 6.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0007228851318359375, -0.0007006004452705383, -0.0006783157587051392, -0.00065603107213974, -0.0006337463855743408, -0.0006114616990089417, -0.0005891770124435425, -0.0005668923258781433, -0.0005446076393127441, -0.000522322952747345, -0.0005000382661819458, -0.00047775357961654663, -0.00045546889305114746, -0.0004331842064857483, -0.0004108995199203491, -0.00038861483335494995, -0.0003663301467895508, -0.0003440454602241516, -0.00032176077365875244, -0.00029947608709335327, -0.0002771914005279541, -0.00025490671396255493, -0.00023262202739715576, -0.0002103373408317566, -0.00018805265426635742, -0.00016576796770095825, -0.00014348328113555908, -0.00012119859457015991, -9.891390800476074e-05, -7.662922143936157e-05, -5.43445348739624e-05, -3.205984830856323e-05, -9.775161743164062e-06, 1.2509524822235107e-05, 3.479421138763428e-05, 5.707889795303345e-05, 7.936358451843262e-05, 0.00010164827108383179, 0.00012393295764923096, 0.00014621764421463013, 0.0001685023307800293, 0.00019078701734542847, 0.00021307170391082764, 0.0002353563904762268, 0.000257641077041626, 0.00027992576360702515, 0.0003022104501724243, 0.0003244951367378235, 0.00034677982330322266, 0.0003690645098686218, 0.000391349196434021, 0.00041363388299942017, 0.00043591856956481934, 0.0004582032561302185, 0.0004804879426956177, 0.0005027726292610168, 0.000525057315826416, 0.0005473420023918152, 0.0005696266889572144, 0.0005919113755226135, 0.0006141960620880127, 0.0006364807486534119, 0.000658765435218811, 0.0006810501217842102, 0.0007033348083496094]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 10.0, 14.0, 17.0, 27.0, 31.0, 55.0, 79.0, 104.0, 189.0, 306.0, 518.0, 959.0, 1824.0, 3751.0, 8369.0, 21800.0, 64982.0, 217440.0, 424899.0, 204985.0, 61878.0, 20578.0, 8171.0, 3521.0, 1791.0, 925.0, 511.0, 307.0, 183.0, 114.0, 61.0, 37.0, 26.0, 29.0, 16.0, 13.0, 7.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.4375, -14.041748046875, -13.64599609375, -13.250244140625, -12.8544921875, -12.458740234375, -12.06298828125, -11.667236328125, -11.271484375, -10.875732421875, -10.47998046875, -10.084228515625, -9.6884765625, -9.292724609375, -8.89697265625, -8.501220703125, -8.10546875, -7.709716796875, -7.31396484375, -6.918212890625, -6.5224609375, -6.126708984375, -5.73095703125, -5.335205078125, -4.939453125, -4.543701171875, -4.14794921875, -3.752197265625, -3.3564453125, -2.960693359375, -2.56494140625, -2.169189453125, -1.7734375, -1.377685546875, -0.98193359375, -0.586181640625, -0.1904296875, 0.205322265625, 0.60107421875, 0.996826171875, 1.392578125, 1.788330078125, 2.18408203125, 2.579833984375, 2.9755859375, 3.371337890625, 3.76708984375, 4.162841796875, 4.55859375, 4.954345703125, 5.35009765625, 5.745849609375, 6.1416015625, 6.537353515625, 6.93310546875, 7.328857421875, 7.724609375, 8.120361328125, 8.51611328125, 8.911865234375, 9.3076171875, 9.703369140625, 10.09912109375, 10.494873046875, 10.890625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 2.0, 6.0, 11.0, 14.0, 20.0, 24.0, 32.0, 51.0, 77.0, 70.0, 78.0, 84.0, 91.0, 78.0, 75.0, 77.0, 45.0, 47.0, 33.0, 17.0, 14.0, 13.0, 10.0, 9.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0], "bins": [-10.84375, -10.60003662109375, -10.3563232421875, -10.11260986328125, -9.868896484375, -9.62518310546875, -9.3814697265625, -9.13775634765625, -8.89404296875, -8.65032958984375, -8.4066162109375, -8.16290283203125, -7.919189453125, -7.67547607421875, -7.4317626953125, -7.18804931640625, -6.9443359375, -6.70062255859375, -6.4569091796875, -6.21319580078125, -5.969482421875, -5.72576904296875, -5.4820556640625, -5.23834228515625, -4.99462890625, -4.75091552734375, -4.5072021484375, -4.26348876953125, -4.019775390625, -3.77606201171875, -3.5323486328125, -3.28863525390625, -3.044921875, -2.80120849609375, -2.5574951171875, -2.31378173828125, -2.070068359375, -1.82635498046875, -1.5826416015625, -1.33892822265625, -1.09521484375, -0.85150146484375, -0.6077880859375, -0.36407470703125, -0.120361328125, 0.12335205078125, 0.3670654296875, 0.61077880859375, 0.8544921875, 1.09820556640625, 1.3419189453125, 1.58563232421875, 1.829345703125, 2.07305908203125, 2.3167724609375, 2.56048583984375, 2.80419921875, 3.04791259765625, 3.2916259765625, 3.53533935546875, 3.779052734375, 4.02276611328125, 4.2664794921875, 4.51019287109375, 4.75390625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 10.0, 21.0, 34.0, 64.0, 113.0, 176.0, 219.0, 170.0, 86.0, 45.0, 24.0, 13.0, 2.0, 2.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-116.05673217773438, -112.68064880371094, -109.30457305908203, -105.9284896850586, -102.55241394042969, -99.17633056640625, -95.80024719238281, -92.4241714477539, -89.04808807373047, -85.67200469970703, -82.29592895507812, -78.91984558105469, -75.54376983642578, -72.16768646240234, -68.79161071777344, -65.41552734375, -62.03944778442383, -58.663368225097656, -55.287288665771484, -51.91120910644531, -48.535125732421875, -45.1590461730957, -41.78296661376953, -38.406883239746094, -35.03080749511719, -31.654727935791016, -28.27864646911621, -24.90256690979004, -21.526485443115234, -18.150405883789062, -14.77432632446289, -11.398244857788086, -8.022163391113281, -4.646082878112793, -1.270002841949463, 2.106077194213867, 5.4821577072143555, 8.858238220214844, 12.234317779541016, 15.61039924621582, 18.986478805541992, 22.362558364868164, 25.73863983154297, 29.11471939086914, 32.49079895019531, 35.86688232421875, 39.242958068847656, 42.619041442871094, 45.995121002197266, 49.37120056152344, 52.74728012084961, 56.12335968017578, 59.49944305419922, 62.87552261352539, 66.25160217285156, 69.627685546875, 73.0037612915039, 76.37984466552734, 79.75592041015625, 83.13200378417969, 86.5080795288086, 89.88416290283203, 93.26023864746094, 96.63632202148438, 100.01240539550781]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 7.0, 6.0, 8.0, 7.0, 9.0, 13.0, 14.0, 19.0, 30.0, 38.0, 44.0, 46.0, 53.0, 77.0, 75.0, 68.0, 74.0, 73.0, 64.0, 58.0, 42.0, 44.0, 33.0, 24.0, 15.0, 13.0, 9.0, 2.0, 3.0, 5.0, 1.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.847251892089844, -42.85832214355469, -40.86939239501953, -38.88045883178711, -36.89152908325195, -34.9025993347168, -32.91366958618164, -30.92473793029785, -28.935806274414062, -26.946876525878906, -24.957944869995117, -22.96901512145996, -20.980083465576172, -18.991153717041016, -17.00222396850586, -15.01329231262207, -13.024362564086914, -11.035431861877441, -9.046501159667969, -7.057570934295654, -5.068640232086182, -3.079710006713867, -1.0907793045043945, 0.8981513977050781, 2.887082099914551, 4.876012802124023, 6.864943504333496, 8.853874206542969, 10.842803955078125, 12.831734657287598, 14.82066535949707, 16.80959701538086, 18.798526763916016, 20.787456512451172, 22.77638816833496, 24.765317916870117, 26.754249572753906, 28.743179321289062, 30.73210906982422, 32.721038818359375, 34.7099723815918, 36.69890213012695, 38.68783187866211, 40.67676544189453, 42.66569519042969, 44.654624938964844, 46.6435546875, 48.632484436035156, 50.62141418457031, 52.61034393310547, 54.599273681640625, 56.58820724487305, 58.5771369934082, 60.56606674194336, 62.554996490478516, 64.54393005371094, 66.5328598022461, 68.52178955078125, 70.5107192993164, 72.49964904785156, 74.48857879638672, 76.47750854492188, 78.46644592285156, 80.45537567138672, 82.44430541992188]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 7.0, 15.0, 41.0, 68.0, 131.0, 278.0, 586.0, 1390.0, 3717.0, 10570.0, 40658.0, 568541.0, 3484132.0, 62766.0, 14216.0, 4346.0, 1523.0, 619.0, 273.0, 135.0, 73.0, 39.0, 29.0, 25.0, 19.0, 12.0, 16.0, 6.0, 8.0, 8.0, 10.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.203125, -28.623779296875, -27.04443359375, -25.465087890625, -23.8857421875, -22.306396484375, -20.72705078125, -19.147705078125, -17.568359375, -15.989013671875, -14.40966796875, -12.830322265625, -11.2509765625, -9.671630859375, -8.09228515625, -6.512939453125, -4.93359375, -3.354248046875, -1.77490234375, -0.195556640625, 1.3837890625, 2.963134765625, 4.54248046875, 6.121826171875, 7.701171875, 9.280517578125, 10.85986328125, 12.439208984375, 14.0185546875, 15.597900390625, 17.17724609375, 18.756591796875, 20.3359375, 21.915283203125, 23.49462890625, 25.073974609375, 26.6533203125, 28.232666015625, 29.81201171875, 31.391357421875, 32.970703125, 34.550048828125, 36.12939453125, 37.708740234375, 39.2880859375, 40.867431640625, 42.44677734375, 44.026123046875, 45.60546875, 47.184814453125, 48.76416015625, 50.343505859375, 51.9228515625, 53.502197265625, 55.08154296875, 56.660888671875, 58.240234375, 59.819580078125, 61.39892578125, 62.978271484375, 64.5576171875, 66.136962890625, 67.71630859375, 69.295654296875, 70.875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 11.0, 14.0, 11.0, 14.0, 18.0, 12.0, 37.0, 54.0, 44.0, 47.0, 52.0, 92.0, 72.0, 73.0, 64.0, 67.0, 54.0, 51.0, 48.0, 42.0, 34.0, 23.0, 15.0, 12.0, 11.0, 7.0, 6.0, 4.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4921875, -1.4427642822265625, -1.393341064453125, -1.3439178466796875, -1.29449462890625, -1.2450714111328125, -1.195648193359375, -1.1462249755859375, -1.0968017578125, -1.0473785400390625, -0.997955322265625, -0.9485321044921875, -0.89910888671875, -0.8496856689453125, -0.800262451171875, -0.7508392333984375, -0.701416015625, -0.6519927978515625, -0.602569580078125, -0.5531463623046875, -0.50372314453125, -0.4542999267578125, -0.404876708984375, -0.3554534912109375, -0.3060302734375, -0.2566070556640625, -0.207183837890625, -0.1577606201171875, -0.10833740234375, -0.0589141845703125, -0.009490966796875, 0.0399322509765625, 0.08935546875, 0.1387786865234375, 0.188201904296875, 0.2376251220703125, 0.28704833984375, 0.3364715576171875, 0.385894775390625, 0.4353179931640625, 0.4847412109375, 0.5341644287109375, 0.583587646484375, 0.6330108642578125, 0.68243408203125, 0.7318572998046875, 0.781280517578125, 0.8307037353515625, 0.880126953125, 0.9295501708984375, 0.978973388671875, 1.0283966064453125, 1.07781982421875, 1.1272430419921875, 1.176666259765625, 1.2260894775390625, 1.2755126953125, 1.3249359130859375, 1.374359130859375, 1.4237823486328125, 1.47320556640625, 1.5226287841796875, 1.572052001953125, 1.6214752197265625, 1.6708984375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 0.0, 2.0, 4.0, 17.0, 11.0, 22.0, 36.0, 52.0, 72.0, 100.0, 206.0, 346.0, 820.0, 2163.0, 6472.0, 23386.0, 120471.0, 2937008.0, 998626.0, 79762.0, 16779.0, 4796.0, 1690.0, 667.0, 341.0, 152.0, 84.0, 61.0, 42.0, 22.0, 27.0, 9.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-29.796875, -28.688720703125, -27.58056640625, -26.472412109375, -25.3642578125, -24.256103515625, -23.14794921875, -22.039794921875, -20.931640625, -19.823486328125, -18.71533203125, -17.607177734375, -16.4990234375, -15.390869140625, -14.28271484375, -13.174560546875, -12.06640625, -10.958251953125, -9.85009765625, -8.741943359375, -7.6337890625, -6.525634765625, -5.41748046875, -4.309326171875, -3.201171875, -2.093017578125, -0.98486328125, 0.123291015625, 1.2314453125, 2.339599609375, 3.44775390625, 4.555908203125, 5.6640625, 6.772216796875, 7.88037109375, 8.988525390625, 10.0966796875, 11.204833984375, 12.31298828125, 13.421142578125, 14.529296875, 15.637451171875, 16.74560546875, 17.853759765625, 18.9619140625, 20.070068359375, 21.17822265625, 22.286376953125, 23.39453125, 24.502685546875, 25.61083984375, 26.718994140625, 27.8271484375, 28.935302734375, 30.04345703125, 31.151611328125, 32.259765625, 33.367919921875, 34.47607421875, 35.584228515625, 36.6923828125, 37.800537109375, 38.90869140625, 40.016845703125, 41.125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 6.0, 9.0, 9.0, 7.0, 18.0, 30.0, 29.0, 42.0, 47.0, 98.0, 140.0, 200.0, 318.0, 703.0, 1172.0, 460.0, 261.0, 141.0, 91.0, 67.0, 40.0, 37.0, 27.0, 20.0, 17.0, 23.0, 10.0, 8.0, 9.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0546875, -3.94549560546875, -3.8363037109375, -3.72711181640625, -3.617919921875, -3.50872802734375, -3.3995361328125, -3.29034423828125, -3.18115234375, -3.07196044921875, -2.9627685546875, -2.85357666015625, -2.744384765625, -2.63519287109375, -2.5260009765625, -2.41680908203125, -2.3076171875, -2.19842529296875, -2.0892333984375, -1.98004150390625, -1.870849609375, -1.76165771484375, -1.6524658203125, -1.54327392578125, -1.43408203125, -1.32489013671875, -1.2156982421875, -1.10650634765625, -0.997314453125, -0.88812255859375, -0.7789306640625, -0.66973876953125, -0.560546875, -0.45135498046875, -0.3421630859375, -0.23297119140625, -0.123779296875, -0.01458740234375, 0.0946044921875, 0.20379638671875, 0.31298828125, 0.42218017578125, 0.5313720703125, 0.64056396484375, 0.749755859375, 0.85894775390625, 0.9681396484375, 1.07733154296875, 1.1865234375, 1.29571533203125, 1.4049072265625, 1.51409912109375, 1.623291015625, 1.73248291015625, 1.8416748046875, 1.95086669921875, 2.06005859375, 2.16925048828125, 2.2784423828125, 2.38763427734375, 2.496826171875, 2.60601806640625, 2.7152099609375, 2.82440185546875, 2.93359375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 5.0, 16.0, 30.0, 41.0, 68.0, 107.0, 161.0, 162.0, 159.0, 97.0, 63.0, 36.0, 16.0, 19.0, 10.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.286975860595703, -18.184234619140625, -17.081491470336914, -15.978750228881836, -14.876008033752441, -13.773265838623047, -12.670524597167969, -11.567782402038574, -10.46504020690918, -9.362298011779785, -8.25955581665039, -7.1568145751953125, -6.054072380065918, -4.951330184936523, -3.848588466644287, -2.745846748352051, -1.6431045532226562, -0.5403625965118408, 0.5623793601989746, 1.66512131690979, 2.7678632736206055, 3.87060546875, 4.973347187042236, 6.076088905334473, 7.178831100463867, 8.281573295593262, 9.384315490722656, 10.487056732177734, 11.589798927307129, 12.692541122436523, 13.795282363891602, 14.898024559020996, 16.000762939453125, 17.103504180908203, 18.206247329711914, 19.308988571166992, 20.411731719970703, 21.51447296142578, 22.61721420288086, 23.719955444335938, 24.82269859313965, 25.925439834594727, 27.028182983398438, 28.130924224853516, 29.233665466308594, 30.336408615112305, 31.439149856567383, 32.541893005371094, 33.64463424682617, 34.74737548828125, 35.85011672973633, 36.95286178588867, 38.05560302734375, 39.15834426879883, 40.261085510253906, 41.363826751708984, 42.46656799316406, 43.56930923461914, 44.67205047607422, 45.77479553222656, 46.87753677368164, 47.98027801513672, 49.0830192565918, 50.185760498046875, 51.28850555419922]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 12.0, 13.0, 15.0, 25.0, 27.0, 45.0, 39.0, 37.0, 60.0, 90.0, 82.0, 76.0, 94.0, 77.0, 67.0, 44.0, 43.0, 34.0, 32.0, 20.0, 20.0, 14.0, 9.0, 8.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.44953155517578, -22.775856018066406, -22.1021785736084, -21.428503036499023, -20.754825592041016, -20.08115005493164, -19.407474517822266, -18.73379898071289, -18.060121536254883, -17.386445999145508, -16.7127685546875, -16.039093017578125, -15.365416526794434, -14.691740036010742, -14.018064498901367, -13.344388008117676, -12.670711517333984, -11.997035026550293, -11.323358535766602, -10.649682998657227, -9.976006507873535, -9.302330017089844, -8.628654479980469, -7.954977989196777, -7.281301498413086, -6.6076250076293945, -5.933948993682861, -5.260272979736328, -4.586596488952637, -3.9129202365875244, -3.239243984222412, -2.565567970275879, -1.8918914794921875, -1.2182152271270752, -0.5445389747619629, 0.12913727760314941, 0.8028135299682617, 1.476489782333374, 2.1501660346984863, 2.8238420486450195, 3.497518539428711, 4.171195030212402, 4.8448710441589355, 5.518547058105469, 6.19222354888916, 6.865900039672852, 7.539576053619385, 8.213252067565918, 8.88692855834961, 9.5606050491333, 10.234281539916992, 10.907957077026367, 11.581633567810059, 12.25531005859375, 12.928985595703125, 13.602662086486816, 14.276338577270508, 14.9500150680542, 15.62369155883789, 16.297367095947266, 16.97104263305664, 17.64472007751465, 18.318395614624023, 18.99207305908203, 19.665748596191406]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 12.0, 10.0, 26.0, 30.0, 51.0, 86.0, 114.0, 226.0, 419.0, 742.0, 1590.0, 3302.0, 7652.0, 17321.0, 42701.0, 106163.0, 238174.0, 314821.0, 183482.0, 77032.0, 30896.0, 12853.0, 5557.0, 2607.0, 1202.0, 665.0, 341.0, 175.0, 106.0, 62.0, 47.0, 22.0, 18.0, 14.0, 10.0, 5.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.6015625, -12.223388671875, -11.84521484375, -11.467041015625, -11.0888671875, -10.710693359375, -10.33251953125, -9.954345703125, -9.576171875, -9.197998046875, -8.81982421875, -8.441650390625, -8.0634765625, -7.685302734375, -7.30712890625, -6.928955078125, -6.55078125, -6.172607421875, -5.79443359375, -5.416259765625, -5.0380859375, -4.659912109375, -4.28173828125, -3.903564453125, -3.525390625, -3.147216796875, -2.76904296875, -2.390869140625, -2.0126953125, -1.634521484375, -1.25634765625, -0.878173828125, -0.5, -0.121826171875, 0.25634765625, 0.634521484375, 1.0126953125, 1.390869140625, 1.76904296875, 2.147216796875, 2.525390625, 2.903564453125, 3.28173828125, 3.659912109375, 4.0380859375, 4.416259765625, 4.79443359375, 5.172607421875, 5.55078125, 5.928955078125, 6.30712890625, 6.685302734375, 7.0634765625, 7.441650390625, 7.81982421875, 8.197998046875, 8.576171875, 8.954345703125, 9.33251953125, 9.710693359375, 10.0888671875, 10.467041015625, 10.84521484375, 11.223388671875, 11.6015625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 5.0, 10.0, 8.0, 11.0, 14.0, 17.0, 15.0, 21.0, 24.0, 36.0, 33.0, 43.0, 53.0, 50.0, 59.0, 74.0, 75.0, 66.0, 62.0, 55.0, 48.0, 44.0, 40.0, 35.0, 24.0, 23.0, 20.0, 14.0, 6.0, 8.0, 4.0, 4.0, 4.0, 1.0, 0.0, 3.0], "bins": [-1.830078125, -1.7885208129882812, -1.7469635009765625, -1.7054061889648438, -1.663848876953125, -1.6222915649414062, -1.5807342529296875, -1.5391769409179688, -1.49761962890625, -1.4560623168945312, -1.4145050048828125, -1.3729476928710938, -1.331390380859375, -1.2898330688476562, -1.2482757568359375, -1.2067184448242188, -1.1651611328125, -1.1236038208007812, -1.0820465087890625, -1.0404891967773438, -0.998931884765625, -0.9573745727539062, -0.9158172607421875, -0.8742599487304688, -0.83270263671875, -0.7911453247070312, -0.7495880126953125, -0.7080307006835938, -0.666473388671875, -0.6249160766601562, -0.5833587646484375, -0.5418014526367188, -0.500244140625, -0.45868682861328125, -0.4171295166015625, -0.37557220458984375, -0.334014892578125, -0.29245758056640625, -0.2509002685546875, -0.20934295654296875, -0.16778564453125, -0.12622833251953125, -0.0846710205078125, -0.04311370849609375, -0.001556396484375, 0.04000091552734375, 0.0815582275390625, 0.12311553955078125, 0.1646728515625, 0.20623016357421875, 0.2477874755859375, 0.28934478759765625, 0.330902099609375, 0.37245941162109375, 0.4140167236328125, 0.45557403564453125, 0.49713134765625, 0.5386886596679688, 0.5802459716796875, 0.6218032836914062, 0.663360595703125, 0.7049179077148438, 0.7464752197265625, 0.7880325317382812, 0.82958984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 6.0, 8.0, 11.0, 9.0, 18.0, 21.0, 26.0, 44.0, 58.0, 79.0, 106.0, 146.0, 163.0, 246.0, 324.0, 496.0, 798.0, 1311.0, 2794.0, 6703.0, 18423.0, 53402.0, 158667.0, 337764.0, 289079.0, 115973.0, 37978.0, 13157.0, 5060.0, 2246.0, 1141.0, 684.0, 437.0, 305.0, 222.0, 182.0, 121.0, 90.0, 68.0, 55.0, 40.0, 17.0, 26.0, 13.0, 12.0, 10.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.8671875, -13.45751953125, -13.0478515625, -12.63818359375, -12.228515625, -11.81884765625, -11.4091796875, -10.99951171875, -10.58984375, -10.18017578125, -9.7705078125, -9.36083984375, -8.951171875, -8.54150390625, -8.1318359375, -7.72216796875, -7.3125, -6.90283203125, -6.4931640625, -6.08349609375, -5.673828125, -5.26416015625, -4.8544921875, -4.44482421875, -4.03515625, -3.62548828125, -3.2158203125, -2.80615234375, -2.396484375, -1.98681640625, -1.5771484375, -1.16748046875, -0.7578125, -0.34814453125, 0.0615234375, 0.47119140625, 0.880859375, 1.29052734375, 1.7001953125, 2.10986328125, 2.51953125, 2.92919921875, 3.3388671875, 3.74853515625, 4.158203125, 4.56787109375, 4.9775390625, 5.38720703125, 5.796875, 6.20654296875, 6.6162109375, 7.02587890625, 7.435546875, 7.84521484375, 8.2548828125, 8.66455078125, 9.07421875, 9.48388671875, 9.8935546875, 10.30322265625, 10.712890625, 11.12255859375, 11.5322265625, 11.94189453125, 12.3515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 5.0, 4.0, 11.0, 5.0, 7.0, 12.0, 12.0, 15.0, 16.0, 22.0, 22.0, 24.0, 30.0, 26.0, 36.0, 35.0, 32.0, 46.0, 41.0, 41.0, 41.0, 42.0, 33.0, 34.0, 49.0, 39.0, 39.0, 39.0, 28.0, 30.0, 24.0, 22.0, 15.0, 19.0, 21.0, 20.0, 11.0, 13.0, 9.0, 4.0, 8.0, 7.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8046875, -5.615234375, -5.42578125, -5.236328125, -5.046875, -4.857421875, -4.66796875, -4.478515625, -4.2890625, -4.099609375, -3.91015625, -3.720703125, -3.53125, -3.341796875, -3.15234375, -2.962890625, -2.7734375, -2.583984375, -2.39453125, -2.205078125, -2.015625, -1.826171875, -1.63671875, -1.447265625, -1.2578125, -1.068359375, -0.87890625, -0.689453125, -0.5, -0.310546875, -0.12109375, 0.068359375, 0.2578125, 0.447265625, 0.63671875, 0.826171875, 1.015625, 1.205078125, 1.39453125, 1.583984375, 1.7734375, 1.962890625, 2.15234375, 2.341796875, 2.53125, 2.720703125, 2.91015625, 3.099609375, 3.2890625, 3.478515625, 3.66796875, 3.857421875, 4.046875, 4.236328125, 4.42578125, 4.615234375, 4.8046875, 4.994140625, 5.18359375, 5.373046875, 5.5625, 5.751953125, 5.94140625, 6.130859375, 6.3203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 10.0, 6.0, 20.0, 33.0, 38.0, 68.0, 107.0, 187.0, 277.0, 592.0, 1269.0, 3362.0, 10131.0, 37018.0, 174068.0, 520893.0, 232276.0, 48684.0, 12539.0, 3917.0, 1553.0, 615.0, 388.0, 180.0, 96.0, 81.0, 41.0, 23.0, 27.0, 12.0, 13.0, 9.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.546875, -19.896484375, -19.24609375, -18.595703125, -17.9453125, -17.294921875, -16.64453125, -15.994140625, -15.34375, -14.693359375, -14.04296875, -13.392578125, -12.7421875, -12.091796875, -11.44140625, -10.791015625, -10.140625, -9.490234375, -8.83984375, -8.189453125, -7.5390625, -6.888671875, -6.23828125, -5.587890625, -4.9375, -4.287109375, -3.63671875, -2.986328125, -2.3359375, -1.685546875, -1.03515625, -0.384765625, 0.265625, 0.916015625, 1.56640625, 2.216796875, 2.8671875, 3.517578125, 4.16796875, 4.818359375, 5.46875, 6.119140625, 6.76953125, 7.419921875, 8.0703125, 8.720703125, 9.37109375, 10.021484375, 10.671875, 11.322265625, 11.97265625, 12.623046875, 13.2734375, 13.923828125, 14.57421875, 15.224609375, 15.875, 16.525390625, 17.17578125, 17.826171875, 18.4765625, 19.126953125, 19.77734375, 20.427734375, 21.078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 10.0, 3.0, 4.0, 11.0, 10.0, 12.0, 21.0, 22.0, 31.0, 31.0, 43.0, 60.0, 68.0, 84.0, 72.0, 79.0, 88.0, 60.0, 52.0, 47.0, 38.0, 24.0, 22.0, 27.0, 22.0, 13.0, 17.0, 10.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014448165893554688, -0.0014014095067977905, -0.0013580024242401123, -0.001314595341682434, -0.0012711882591247559, -0.0012277811765670776, -0.0011843740940093994, -0.0011409670114517212, -0.001097559928894043, -0.0010541528463363647, -0.0010107457637786865, -0.0009673386812210083, -0.0009239315986633301, -0.0008805245161056519, -0.0008371174335479736, -0.0007937103509902954, -0.0007503032684326172, -0.000706896185874939, -0.0006634891033172607, -0.0006200820207595825, -0.0005766749382019043, -0.0005332678556442261, -0.0004898607730865479, -0.00044645369052886963, -0.0004030466079711914, -0.0003596395254135132, -0.00031623244285583496, -0.00027282536029815674, -0.00022941827774047852, -0.0001860111951828003, -0.00014260411262512207, -9.919703006744385e-05, -5.5789947509765625e-05, -1.2382864952087402e-05, 3.102421760559082e-05, 7.443130016326904e-05, 0.00011783838272094727, 0.0001612454652786255, 0.0002046525478363037, 0.00024805963039398193, 0.00029146671295166016, 0.0003348737955093384, 0.0003782808780670166, 0.0004216879606246948, 0.00046509504318237305, 0.0005085021257400513, 0.0005519092082977295, 0.0005953162908554077, 0.0006387233734130859, 0.0006821304559707642, 0.0007255375385284424, 0.0007689446210861206, 0.0008123517036437988, 0.000855758786201477, 0.0008991658687591553, 0.0009425729513168335, 0.0009859800338745117, 0.00102938711643219, 0.0010727941989898682, 0.0011162012815475464, 0.0011596083641052246, 0.0012030154466629028, 0.001246422529220581, 0.0012898296117782593, 0.0013332366943359375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 9.0, 4.0, 10.0, 12.0, 32.0, 38.0, 62.0, 97.0, 186.0, 331.0, 643.0, 1272.0, 3150.0, 8796.0, 33634.0, 188015.0, 582798.0, 181612.0, 33354.0, 8720.0, 3091.0, 1332.0, 605.0, 322.0, 162.0, 109.0, 50.0, 31.0, 28.0, 20.0, 6.0, 9.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-27.734375, -26.952880859375, -26.17138671875, -25.389892578125, -24.6083984375, -23.826904296875, -23.04541015625, -22.263916015625, -21.482421875, -20.700927734375, -19.91943359375, -19.137939453125, -18.3564453125, -17.574951171875, -16.79345703125, -16.011962890625, -15.23046875, -14.448974609375, -13.66748046875, -12.885986328125, -12.1044921875, -11.322998046875, -10.54150390625, -9.760009765625, -8.978515625, -8.197021484375, -7.41552734375, -6.634033203125, -5.8525390625, -5.071044921875, -4.28955078125, -3.508056640625, -2.7265625, -1.945068359375, -1.16357421875, -0.382080078125, 0.3994140625, 1.180908203125, 1.96240234375, 2.743896484375, 3.525390625, 4.306884765625, 5.08837890625, 5.869873046875, 6.6513671875, 7.432861328125, 8.21435546875, 8.995849609375, 9.77734375, 10.558837890625, 11.34033203125, 12.121826171875, 12.9033203125, 13.684814453125, 14.46630859375, 15.247802734375, 16.029296875, 16.810791015625, 17.59228515625, 18.373779296875, 19.1552734375, 19.936767578125, 20.71826171875, 21.499755859375, 22.28125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 2.0, 4.0, 7.0, 7.0, 14.0, 14.0, 17.0, 25.0, 31.0, 43.0, 62.0, 74.0, 63.0, 84.0, 98.0, 83.0, 75.0, 56.0, 64.0, 31.0, 27.0, 28.0, 28.0, 20.0, 11.0, 7.0, 6.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-11.9609375, -11.6561279296875, -11.351318359375, -11.0465087890625, -10.74169921875, -10.4368896484375, -10.132080078125, -9.8272705078125, -9.5224609375, -9.2176513671875, -8.912841796875, -8.6080322265625, -8.30322265625, -7.9984130859375, -7.693603515625, -7.3887939453125, -7.083984375, -6.7791748046875, -6.474365234375, -6.1695556640625, -5.86474609375, -5.5599365234375, -5.255126953125, -4.9503173828125, -4.6455078125, -4.3406982421875, -4.035888671875, -3.7310791015625, -3.42626953125, -3.1214599609375, -2.816650390625, -2.5118408203125, -2.20703125, -1.9022216796875, -1.597412109375, -1.2926025390625, -0.98779296875, -0.6829833984375, -0.378173828125, -0.0733642578125, 0.2314453125, 0.5362548828125, 0.841064453125, 1.1458740234375, 1.45068359375, 1.7554931640625, 2.060302734375, 2.3651123046875, 2.669921875, 2.9747314453125, 3.279541015625, 3.5843505859375, 3.88916015625, 4.1939697265625, 4.498779296875, 4.8035888671875, 5.1083984375, 5.4132080078125, 5.718017578125, 6.0228271484375, 6.32763671875, 6.6324462890625, 6.937255859375, 7.2420654296875, 7.546875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 8.0, 24.0, 29.0, 67.0, 140.0, 201.0, 207.0, 171.0, 86.0, 39.0, 15.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.872802734375, -145.87551879882812, -140.8782501220703, -135.88096618652344, -130.88369750976562, -125.88641357421875, -120.88912963867188, -115.89185333251953, -110.89457702636719, -105.89730072021484, -100.9000244140625, -95.90274047851562, -90.90546417236328, -85.90818786621094, -80.91090393066406, -75.91362762451172, -70.91635131835938, -65.91907501220703, -60.92179489135742, -55.92451477050781, -50.92723846435547, -45.929962158203125, -40.932682037353516, -35.935401916503906, -30.938125610351562, -25.940847396850586, -20.94356918334961, -15.946290969848633, -10.949012756347656, -5.95173454284668, -0.9544563293457031, 4.042823791503906, 9.040115356445312, 14.037393569946289, 19.034671783447266, 24.031949996948242, 29.02922821044922, 34.02650451660156, 39.02378463745117, 44.02106475830078, 49.018341064453125, 54.01561737060547, 59.01289749145508, 64.01017761230469, 69.00745391845703, 74.00473022460938, 79.00201416015625, 83.9992904663086, 88.99656677246094, 93.99384307861328, 98.99111938476562, 103.9884033203125, 108.98567962646484, 113.98295593261719, 118.98023986816406, 123.9775161743164, 128.97479248046875, 133.97207641601562, 138.96934509277344, 143.9666290283203, 148.96389770507812, 153.961181640625, 158.95846557617188, 163.95574951171875, 168.95301818847656]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 6.0, 12.0, 9.0, 13.0, 25.0, 35.0, 37.0, 44.0, 40.0, 44.0, 66.0, 62.0, 49.0, 58.0, 64.0, 64.0, 67.0, 49.0, 44.0, 42.0, 35.0, 27.0, 16.0, 21.0, 16.0, 8.0, 13.0, 10.0, 6.0, 7.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.16239929199219, -47.096717834472656, -45.031036376953125, -42.965354919433594, -40.89967346191406, -38.83399200439453, -36.768310546875, -34.70262908935547, -32.63694763183594, -30.571266174316406, -28.505584716796875, -26.439903259277344, -24.374221801757812, -22.30854034423828, -20.24285888671875, -18.17717742919922, -16.111495971679688, -14.045814514160156, -11.980133056640625, -9.914451599121094, -7.8487701416015625, -5.783088684082031, -3.7174072265625, -1.6517257690429688, 0.4139556884765625, 2.4796371459960938, 4.545318603515625, 6.611000061035156, 8.676681518554688, 10.742362976074219, 12.80804443359375, 14.873725891113281, 16.939407348632812, 19.005088806152344, 21.070770263671875, 23.136451721191406, 25.202133178710938, 27.26781463623047, 29.33349609375, 31.39917755126953, 33.46485900878906, 35.530540466308594, 37.596221923828125, 39.661903381347656, 41.72758483886719, 43.79326629638672, 45.85894775390625, 47.92462921142578, 49.99031066894531, 52.055992126464844, 54.121673583984375, 56.187355041503906, 58.25303649902344, 60.31871795654297, 62.3843994140625, 64.45008087158203, 66.51576232910156, 68.5814437866211, 70.64712524414062, 72.71280670166016, 74.77848815917969, 76.84416961669922, 78.90985107421875, 80.97553253173828, 83.04121398925781]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 7.0, 7.0, 6.0, 19.0, 13.0, 19.0, 33.0, 46.0, 85.0, 137.0, 441.0, 2633.0, 32719.0, 3941370.0, 207385.0, 7946.0, 911.0, 207.0, 107.0, 48.0, 53.0, 27.0, 22.0, 10.0, 14.0, 11.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.75, -66.3583984375, -63.966796875, -61.5751953125, -59.18359375, -56.7919921875, -54.400390625, -52.0087890625, -49.6171875, -47.2255859375, -44.833984375, -42.4423828125, -40.05078125, -37.6591796875, -35.267578125, -32.8759765625, -30.484375, -28.0927734375, -25.701171875, -23.3095703125, -20.91796875, -18.5263671875, -16.134765625, -13.7431640625, -11.3515625, -8.9599609375, -6.568359375, -4.1767578125, -1.78515625, 0.6064453125, 2.998046875, 5.3896484375, 7.78125, 10.1728515625, 12.564453125, 14.9560546875, 17.34765625, 19.7392578125, 22.130859375, 24.5224609375, 26.9140625, 29.3056640625, 31.697265625, 34.0888671875, 36.48046875, 38.8720703125, 41.263671875, 43.6552734375, 46.046875, 48.4384765625, 50.830078125, 53.2216796875, 55.61328125, 58.0048828125, 60.396484375, 62.7880859375, 65.1796875, 67.5712890625, 69.962890625, 72.3544921875, 74.74609375, 77.1376953125, 79.529296875, 81.9208984375, 84.3125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 11.0, 14.0, 18.0, 22.0, 28.0, 40.0, 67.0, 73.0, 61.0, 77.0, 82.0, 75.0, 73.0, 87.0, 64.0, 57.0, 42.0, 35.0, 15.0, 22.0, 12.0, 14.0, 5.0, 3.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0078125, -1.936309814453125, -1.86480712890625, -1.793304443359375, -1.7218017578125, -1.650299072265625, -1.57879638671875, -1.507293701171875, -1.435791015625, -1.364288330078125, -1.29278564453125, -1.221282958984375, -1.1497802734375, -1.078277587890625, -1.00677490234375, -0.935272216796875, -0.86376953125, -0.792266845703125, -0.72076416015625, -0.649261474609375, -0.5777587890625, -0.506256103515625, -0.43475341796875, -0.363250732421875, -0.291748046875, -0.220245361328125, -0.14874267578125, -0.077239990234375, -0.0057373046875, 0.065765380859375, 0.13726806640625, 0.208770751953125, 0.2802734375, 0.351776123046875, 0.42327880859375, 0.494781494140625, 0.5662841796875, 0.637786865234375, 0.70928955078125, 0.780792236328125, 0.852294921875, 0.923797607421875, 0.99530029296875, 1.066802978515625, 1.1383056640625, 1.209808349609375, 1.28131103515625, 1.352813720703125, 1.42431640625, 1.495819091796875, 1.56732177734375, 1.638824462890625, 1.7103271484375, 1.781829833984375, 1.85333251953125, 1.924835205078125, 1.996337890625, 2.067840576171875, 2.13934326171875, 2.210845947265625, 2.2823486328125, 2.353851318359375, 2.42535400390625, 2.496856689453125, 2.568359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 13.0, 4.0, 9.0, 19.0, 21.0, 27.0, 51.0, 66.0, 134.0, 241.0, 670.0, 2157.0, 8714.0, 48394.0, 500016.0, 3433894.0, 170537.0, 22736.0, 4622.0, 1171.0, 386.0, 156.0, 73.0, 50.0, 30.0, 14.0, 9.0, 14.0, 10.0, 7.0, 7.0, 7.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.828125, -26.633544921875, -25.43896484375, -24.244384765625, -23.0498046875, -21.855224609375, -20.66064453125, -19.466064453125, -18.271484375, -17.076904296875, -15.88232421875, -14.687744140625, -13.4931640625, -12.298583984375, -11.10400390625, -9.909423828125, -8.71484375, -7.520263671875, -6.32568359375, -5.131103515625, -3.9365234375, -2.741943359375, -1.54736328125, -0.352783203125, 0.841796875, 2.036376953125, 3.23095703125, 4.425537109375, 5.6201171875, 6.814697265625, 8.00927734375, 9.203857421875, 10.3984375, 11.593017578125, 12.78759765625, 13.982177734375, 15.1767578125, 16.371337890625, 17.56591796875, 18.760498046875, 19.955078125, 21.149658203125, 22.34423828125, 23.538818359375, 24.7333984375, 25.927978515625, 27.12255859375, 28.317138671875, 29.51171875, 30.706298828125, 31.90087890625, 33.095458984375, 34.2900390625, 35.484619140625, 36.67919921875, 37.873779296875, 39.068359375, 40.262939453125, 41.45751953125, 42.652099609375, 43.8466796875, 45.041259765625, 46.23583984375, 47.430419921875, 48.625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 8.0, 5.0, 11.0, 14.0, 17.0, 31.0, 29.0, 56.0, 87.0, 133.0, 241.0, 508.0, 1603.0, 599.0, 283.0, 158.0, 92.0, 57.0, 49.0, 31.0, 17.0, 14.0, 13.0, 13.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.4609375, -8.2752685546875, -8.089599609375, -7.9039306640625, -7.71826171875, -7.5325927734375, -7.346923828125, -7.1612548828125, -6.9755859375, -6.7899169921875, -6.604248046875, -6.4185791015625, -6.23291015625, -6.0472412109375, -5.861572265625, -5.6759033203125, -5.490234375, -5.3045654296875, -5.118896484375, -4.9332275390625, -4.74755859375, -4.5618896484375, -4.376220703125, -4.1905517578125, -4.0048828125, -3.8192138671875, -3.633544921875, -3.4478759765625, -3.26220703125, -3.0765380859375, -2.890869140625, -2.7052001953125, -2.51953125, -2.3338623046875, -2.148193359375, -1.9625244140625, -1.77685546875, -1.5911865234375, -1.405517578125, -1.2198486328125, -1.0341796875, -0.8485107421875, -0.662841796875, -0.4771728515625, -0.29150390625, -0.1058349609375, 0.079833984375, 0.2655029296875, 0.451171875, 0.6368408203125, 0.822509765625, 1.0081787109375, 1.19384765625, 1.3795166015625, 1.565185546875, 1.7508544921875, 1.9365234375, 2.1221923828125, 2.307861328125, 2.4935302734375, 2.67919921875, 2.8648681640625, 3.050537109375, 3.2362060546875, 3.421875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 10.0, 12.0, 27.0, 58.0, 83.0, 101.0, 131.0, 162.0, 138.0, 97.0, 65.0, 45.0, 26.0, 17.0, 13.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-42.3389892578125, -41.02665328979492, -39.71432113647461, -38.40198516845703, -37.08964920043945, -35.777313232421875, -34.46498107910156, -33.152645111083984, -31.840309143066406, -30.52797508239746, -29.215639114379883, -27.903305053710938, -26.59096908569336, -25.278635025024414, -23.96630096435547, -22.65396499633789, -21.341630935668945, -20.029296875, -18.716960906982422, -17.404626846313477, -16.0922908782959, -14.779956817626953, -13.467621803283691, -12.15528678894043, -10.842951774597168, -9.530616760253906, -8.218281745910645, -6.905947208404541, -5.593612194061279, -4.281277179718018, -2.968942642211914, -1.6566076278686523, -0.3442726135253906, 0.9680622816085815, 2.2803971767425537, 3.5927319526672363, 4.905066967010498, 6.21740198135376, 7.529736518859863, 8.842071533203125, 10.154406547546387, 11.466741561889648, 12.77907657623291, 14.091411590576172, 15.403745651245117, 16.716081619262695, 18.02841567993164, 19.34075164794922, 20.653085708618164, 21.96541976928711, 23.277755737304688, 24.590089797973633, 25.90242576599121, 27.214759826660156, 28.527095794677734, 29.83942985534668, 31.151763916015625, 32.4640998840332, 33.776432037353516, 35.088768005371094, 36.40110397338867, 37.71343994140625, 39.02577209472656, 40.33810806274414, 41.65044403076172]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 3.0, 6.0, 18.0, 16.0, 16.0, 17.0, 13.0, 19.0, 27.0, 26.0, 31.0, 26.0, 34.0, 42.0, 39.0, 37.0, 41.0, 41.0, 35.0, 39.0, 47.0, 38.0, 30.0, 35.0, 34.0, 41.0, 30.0, 38.0, 21.0, 22.0, 19.0, 11.0, 21.0, 15.0, 10.0, 10.0, 7.0, 7.0, 9.0, 2.0, 5.0, 2.0, 2.0, 7.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.81633758544922, -16.284326553344727, -15.752313613891602, -15.220301628112793, -14.688289642333984, -14.156278610229492, -13.624266624450684, -13.092254638671875, -12.560242652893066, -12.028230667114258, -11.49621868133545, -10.96420669555664, -10.432195663452148, -9.900182723999023, -9.368171691894531, -8.836159706115723, -8.304147720336914, -7.7721357345581055, -7.240123748779297, -6.7081122398376465, -6.176100254058838, -5.644088268280029, -5.112076759338379, -4.58006477355957, -4.048052787780762, -3.516040802001953, -2.9840290546417236, -2.452017307281494, -1.9200053215026855, -1.387993335723877, -0.8559815883636475, -0.32396984100341797, 0.20804405212402344, 0.7400559186935425, 1.2720677852630615, 1.8040796518325806, 2.3360915184020996, 2.868103504180908, 3.4001152515411377, 3.932126998901367, 4.464138984680176, 4.996150970458984, 5.528162956237793, 6.060174465179443, 6.592186450958252, 7.1241984367370605, 7.656209945678711, 8.18822193145752, 8.720233917236328, 9.252245903015137, 9.784257888793945, 10.316269874572754, 10.848281860351562, 11.380292892456055, 11.912304878234863, 12.444316864013672, 12.97632884979248, 13.508340835571289, 14.040352821350098, 14.572364807128906, 15.104375839233398, 15.636388778686523, 16.168399810791016, 16.70041275024414, 17.232423782348633]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 9.0, 3.0, 8.0, 14.0, 16.0, 12.0, 8.0, 44.0, 68.0, 104.0, 145.0, 247.0, 469.0, 939.0, 2210.0, 5174.0, 13987.0, 41164.0, 119723.0, 302380.0, 340103.0, 143780.0, 49620.0, 17221.0, 6343.0, 2441.0, 1073.0, 516.0, 262.0, 155.0, 99.0, 60.0, 54.0, 24.0, 18.0, 14.0, 10.0, 17.0, 5.0, 6.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5390625, -12.1357421875, -11.732421875, -11.3291015625, -10.92578125, -10.5224609375, -10.119140625, -9.7158203125, -9.3125, -8.9091796875, -8.505859375, -8.1025390625, -7.69921875, -7.2958984375, -6.892578125, -6.4892578125, -6.0859375, -5.6826171875, -5.279296875, -4.8759765625, -4.47265625, -4.0693359375, -3.666015625, -3.2626953125, -2.859375, -2.4560546875, -2.052734375, -1.6494140625, -1.24609375, -0.8427734375, -0.439453125, -0.0361328125, 0.3671875, 0.7705078125, 1.173828125, 1.5771484375, 1.98046875, 2.3837890625, 2.787109375, 3.1904296875, 3.59375, 3.9970703125, 4.400390625, 4.8037109375, 5.20703125, 5.6103515625, 6.013671875, 6.4169921875, 6.8203125, 7.2236328125, 7.626953125, 8.0302734375, 8.43359375, 8.8369140625, 9.240234375, 9.6435546875, 10.046875, 10.4501953125, 10.853515625, 11.2568359375, 11.66015625, 12.0634765625, 12.466796875, 12.8701171875, 13.2734375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 8.0, 13.0, 17.0, 31.0, 35.0, 54.0, 61.0, 64.0, 73.0, 95.0, 98.0, 94.0, 71.0, 75.0, 66.0, 49.0, 40.0, 18.0, 14.0, 9.0, 5.0, 7.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0625, -1.9815673828125, -1.900634765625, -1.8197021484375, -1.73876953125, -1.6578369140625, -1.576904296875, -1.4959716796875, -1.4150390625, -1.3341064453125, -1.253173828125, -1.1722412109375, -1.09130859375, -1.0103759765625, -0.929443359375, -0.8485107421875, -0.767578125, -0.6866455078125, -0.605712890625, -0.5247802734375, -0.44384765625, -0.3629150390625, -0.281982421875, -0.2010498046875, -0.1201171875, -0.0391845703125, 0.041748046875, 0.1226806640625, 0.20361328125, 0.2845458984375, 0.365478515625, 0.4464111328125, 0.52734375, 0.6082763671875, 0.689208984375, 0.7701416015625, 0.85107421875, 0.9320068359375, 1.012939453125, 1.0938720703125, 1.1748046875, 1.2557373046875, 1.336669921875, 1.4176025390625, 1.49853515625, 1.5794677734375, 1.660400390625, 1.7413330078125, 1.822265625, 1.9031982421875, 1.984130859375, 2.0650634765625, 2.14599609375, 2.2269287109375, 2.307861328125, 2.3887939453125, 2.4697265625, 2.5506591796875, 2.631591796875, 2.7125244140625, 2.79345703125, 2.8743896484375, 2.955322265625, 3.0362548828125, 3.1171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 10.0, 14.0, 16.0, 12.0, 20.0, 30.0, 31.0, 45.0, 61.0, 69.0, 124.0, 141.0, 207.0, 319.0, 491.0, 809.0, 1569.0, 3738.0, 10683.0, 38376.0, 152949.0, 467765.0, 273298.0, 68733.0, 18259.0, 5747.0, 2162.0, 1019.0, 610.0, 354.0, 262.0, 161.0, 123.0, 95.0, 66.0, 54.0, 29.0, 21.0, 16.0, 16.0, 12.0, 8.0, 3.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.71875, -14.223388671875, -13.72802734375, -13.232666015625, -12.7373046875, -12.241943359375, -11.74658203125, -11.251220703125, -10.755859375, -10.260498046875, -9.76513671875, -9.269775390625, -8.7744140625, -8.279052734375, -7.78369140625, -7.288330078125, -6.79296875, -6.297607421875, -5.80224609375, -5.306884765625, -4.8115234375, -4.316162109375, -3.82080078125, -3.325439453125, -2.830078125, -2.334716796875, -1.83935546875, -1.343994140625, -0.8486328125, -0.353271484375, 0.14208984375, 0.637451171875, 1.1328125, 1.628173828125, 2.12353515625, 2.618896484375, 3.1142578125, 3.609619140625, 4.10498046875, 4.600341796875, 5.095703125, 5.591064453125, 6.08642578125, 6.581787109375, 7.0771484375, 7.572509765625, 8.06787109375, 8.563232421875, 9.05859375, 9.553955078125, 10.04931640625, 10.544677734375, 11.0400390625, 11.535400390625, 12.03076171875, 12.526123046875, 13.021484375, 13.516845703125, 14.01220703125, 14.507568359375, 15.0029296875, 15.498291015625, 15.99365234375, 16.489013671875, 16.984375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 13.0, 4.0, 6.0, 6.0, 5.0, 7.0, 9.0, 15.0, 24.0, 16.0, 20.0, 26.0, 30.0, 27.0, 33.0, 31.0, 43.0, 38.0, 49.0, 42.0, 36.0, 48.0, 42.0, 50.0, 41.0, 41.0, 37.0, 33.0, 19.0, 28.0, 28.0, 30.0, 19.0, 22.0, 17.0, 13.0, 16.0, 14.0, 4.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.2177734375, -6.986328125, -6.7548828125, -6.5234375, -6.2919921875, -6.060546875, -5.8291015625, -5.59765625, -5.3662109375, -5.134765625, -4.9033203125, -4.671875, -4.4404296875, -4.208984375, -3.9775390625, -3.74609375, -3.5146484375, -3.283203125, -3.0517578125, -2.8203125, -2.5888671875, -2.357421875, -2.1259765625, -1.89453125, -1.6630859375, -1.431640625, -1.2001953125, -0.96875, -0.7373046875, -0.505859375, -0.2744140625, -0.04296875, 0.1884765625, 0.419921875, 0.6513671875, 0.8828125, 1.1142578125, 1.345703125, 1.5771484375, 1.80859375, 2.0400390625, 2.271484375, 2.5029296875, 2.734375, 2.9658203125, 3.197265625, 3.4287109375, 3.66015625, 3.8916015625, 4.123046875, 4.3544921875, 4.5859375, 4.8173828125, 5.048828125, 5.2802734375, 5.51171875, 5.7431640625, 5.974609375, 6.2060546875, 6.4375, 6.6689453125, 6.900390625, 7.1318359375, 7.36328125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 7.0, 13.0, 16.0, 21.0, 32.0, 52.0, 64.0, 112.0, 181.0, 329.0, 520.0, 1023.0, 2149.0, 4861.0, 12306.0, 35475.0, 112198.0, 324873.0, 361553.0, 128021.0, 40654.0, 13880.0, 5337.0, 2214.0, 1188.0, 579.0, 335.0, 202.0, 117.0, 76.0, 43.0, 38.0, 13.0, 11.0, 14.0, 7.0, 7.0, 3.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.7734375, -8.4815673828125, -8.189697265625, -7.8978271484375, -7.60595703125, -7.3140869140625, -7.022216796875, -6.7303466796875, -6.4384765625, -6.1466064453125, -5.854736328125, -5.5628662109375, -5.27099609375, -4.9791259765625, -4.687255859375, -4.3953857421875, -4.103515625, -3.8116455078125, -3.519775390625, -3.2279052734375, -2.93603515625, -2.6441650390625, -2.352294921875, -2.0604248046875, -1.7685546875, -1.4766845703125, -1.184814453125, -0.8929443359375, -0.60107421875, -0.3092041015625, -0.017333984375, 0.2745361328125, 0.56640625, 0.8582763671875, 1.150146484375, 1.4420166015625, 1.73388671875, 2.0257568359375, 2.317626953125, 2.6094970703125, 2.9013671875, 3.1932373046875, 3.485107421875, 3.7769775390625, 4.06884765625, 4.3607177734375, 4.652587890625, 4.9444580078125, 5.236328125, 5.5281982421875, 5.820068359375, 6.1119384765625, 6.40380859375, 6.6956787109375, 6.987548828125, 7.2794189453125, 7.5712890625, 7.8631591796875, 8.155029296875, 8.4468994140625, 8.73876953125, 9.0306396484375, 9.322509765625, 9.6143798828125, 9.90625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 11.0, 7.0, 12.0, 10.0, 8.0, 11.0, 20.0, 30.0, 30.0, 38.0, 54.0, 60.0, 111.0, 90.0, 94.0, 91.0, 76.0, 58.0, 28.0, 37.0, 24.0, 25.0, 24.0, 10.0, 11.0, 7.0, 4.0, 4.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.001331329345703125, -0.0012964680790901184, -0.0012616068124771118, -0.0012267455458641052, -0.0011918842792510986, -0.001157023012638092, -0.0011221617460250854, -0.0010873004794120789, -0.0010524392127990723, -0.0010175779461860657, -0.000982716679573059, -0.0009478554129600525, -0.0009129941463470459, -0.0008781328797340393, -0.0008432716131210327, -0.0008084103465080261, -0.0007735490798950195, -0.0007386878132820129, -0.0007038265466690063, -0.0006689652800559998, -0.0006341040134429932, -0.0005992427468299866, -0.00056438148021698, -0.0005295202136039734, -0.0004946589469909668, -0.0004597976803779602, -0.0004249364137649536, -0.000390075147151947, -0.00035521388053894043, -0.00032035261392593384, -0.00028549134731292725, -0.00025063008069992065, -0.00021576881408691406, -0.00018090754747390747, -0.00014604628086090088, -0.00011118501424789429, -7.63237476348877e-05, -4.1462481021881104e-05, -6.601214408874512e-06, 2.826005220413208e-05, 6.312131881713867e-05, 9.798258543014526e-05, 0.00013284385204315186, 0.00016770511865615845, 0.00020256638526916504, 0.00023742765188217163, 0.0002722889184951782, 0.0003071501851081848, 0.0003420114517211914, 0.000376872718334198, 0.0004117339849472046, 0.0004465952515602112, 0.0004814565181732178, 0.0005163177847862244, 0.000551179051399231, 0.0005860403180122375, 0.0006209015846252441, 0.0006557628512382507, 0.0006906241178512573, 0.0007254853844642639, 0.0007603466510772705, 0.0007952079176902771, 0.0008300691843032837, 0.0008649304509162903, 0.0008997917175292969]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 6.0, 11.0, 20.0, 37.0, 33.0, 88.0, 111.0, 154.0, 299.0, 502.0, 961.0, 2217.0, 5635.0, 17559.0, 66949.0, 291122.0, 479982.0, 134288.0, 32328.0, 9537.0, 3523.0, 1490.0, 683.0, 394.0, 220.0, 120.0, 87.0, 56.0, 35.0, 22.0, 18.0, 10.0, 11.0, 6.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.421875, -11.9970703125, -11.572265625, -11.1474609375, -10.72265625, -10.2978515625, -9.873046875, -9.4482421875, -9.0234375, -8.5986328125, -8.173828125, -7.7490234375, -7.32421875, -6.8994140625, -6.474609375, -6.0498046875, -5.625, -5.2001953125, -4.775390625, -4.3505859375, -3.92578125, -3.5009765625, -3.076171875, -2.6513671875, -2.2265625, -1.8017578125, -1.376953125, -0.9521484375, -0.52734375, -0.1025390625, 0.322265625, 0.7470703125, 1.171875, 1.5966796875, 2.021484375, 2.4462890625, 2.87109375, 3.2958984375, 3.720703125, 4.1455078125, 4.5703125, 4.9951171875, 5.419921875, 5.8447265625, 6.26953125, 6.6943359375, 7.119140625, 7.5439453125, 7.96875, 8.3935546875, 8.818359375, 9.2431640625, 9.66796875, 10.0927734375, 10.517578125, 10.9423828125, 11.3671875, 11.7919921875, 12.216796875, 12.6416015625, 13.06640625, 13.4912109375, 13.916015625, 14.3408203125, 14.765625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 2.0, 0.0, 0.0, 7.0, 6.0, 3.0, 6.0, 8.0, 11.0, 6.0, 19.0, 11.0, 18.0, 23.0, 27.0, 22.0, 30.0, 31.0, 39.0, 40.0, 56.0, 75.0, 68.0, 58.0, 62.0, 65.0, 38.0, 40.0, 36.0, 36.0, 31.0, 26.0, 23.0, 18.0, 9.0, 15.0, 8.0, 5.0, 9.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.6953125, -4.54022216796875, -4.3851318359375, -4.23004150390625, -4.074951171875, -3.91986083984375, -3.7647705078125, -3.60968017578125, -3.45458984375, -3.29949951171875, -3.1444091796875, -2.98931884765625, -2.834228515625, -2.67913818359375, -2.5240478515625, -2.36895751953125, -2.2138671875, -2.05877685546875, -1.9036865234375, -1.74859619140625, -1.593505859375, -1.43841552734375, -1.2833251953125, -1.12823486328125, -0.97314453125, -0.81805419921875, -0.6629638671875, -0.50787353515625, -0.352783203125, -0.19769287109375, -0.0426025390625, 0.11248779296875, 0.267578125, 0.42266845703125, 0.5777587890625, 0.73284912109375, 0.887939453125, 1.04302978515625, 1.1981201171875, 1.35321044921875, 1.50830078125, 1.66339111328125, 1.8184814453125, 1.97357177734375, 2.128662109375, 2.28375244140625, 2.4388427734375, 2.59393310546875, 2.7490234375, 2.90411376953125, 3.0592041015625, 3.21429443359375, 3.369384765625, 3.52447509765625, 3.6795654296875, 3.83465576171875, 3.98974609375, 4.14483642578125, 4.2999267578125, 4.45501708984375, 4.610107421875, 4.76519775390625, 4.9202880859375, 5.07537841796875, 5.23046875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 15.0, 40.0, 72.0, 123.0, 185.0, 183.0, 177.0, 80.0, 54.0, 33.0, 10.0, 12.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.84677124023438, -113.82637786865234, -109.80599212646484, -105.78559875488281, -101.76521301269531, -97.74481964111328, -93.72442626953125, -89.70404052734375, -85.68364715576172, -81.66325378417969, -77.64286804199219, -73.62247467041016, -69.60208129882812, -65.58169555664062, -61.561302185058594, -57.54091262817383, -53.52052307128906, -49.5001335144043, -45.47974395751953, -41.4593505859375, -37.438961029052734, -33.41857147216797, -29.39818000793457, -25.377788543701172, -21.357398986816406, -17.33700942993164, -13.316617965698242, -9.29622745513916, -5.275836944580078, -1.2554473876953125, 2.764944076538086, 6.785335540771484, 10.805709838867188, 14.82610034942627, 18.84649085998535, 22.86688232421875, 26.887271881103516, 30.90766143798828, 34.92805480957031, 38.94844436645508, 42.968833923339844, 46.98922348022461, 51.009613037109375, 55.030006408691406, 59.05039596557617, 63.07078552246094, 67.09117889404297, 71.111572265625, 75.1319580078125, 79.15235137939453, 83.17273712158203, 87.19313049316406, 91.21351623535156, 95.2339096069336, 99.25430297851562, 103.27468872070312, 107.29508209228516, 111.31547546386719, 115.33586120605469, 119.35625457763672, 123.37664794921875, 127.39703369140625, 131.41741943359375, 135.4378204345703, 139.4582061767578]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 5.0, 9.0, 9.0, 17.0, 14.0, 24.0, 22.0, 22.0, 24.0, 43.0, 38.0, 43.0, 38.0, 53.0, 54.0, 66.0, 45.0, 52.0, 50.0, 60.0, 45.0, 40.0, 34.0, 36.0, 29.0, 20.0, 14.0, 17.0, 25.0, 15.0, 4.0, 3.0, 3.0, 8.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-68.23907470703125, -66.34447479248047, -64.44987487792969, -62.55527877807617, -60.66067886352539, -58.76607894897461, -56.871482849121094, -54.97688293457031, -53.08228302001953, -51.18768310546875, -49.29308319091797, -47.39848709106445, -45.50388717651367, -43.60928726196289, -41.714691162109375, -39.820091247558594, -37.92549133300781, -36.03089141845703, -34.13629150390625, -32.241695404052734, -30.347095489501953, -28.452495574951172, -26.557897567749023, -24.663299560546875, -22.768699645996094, -20.874099731445312, -18.979501724243164, -17.084903717041016, -15.190303802490234, -13.29570484161377, -11.401105880737305, -9.50650691986084, -7.611907958984375, -5.71730899810791, -3.8227100372314453, -1.9281110763549805, -0.033512115478515625, 1.8610868453979492, 3.755685806274414, 5.650284767150879, 7.544883728027344, 9.439482688903809, 11.334081649780273, 13.228680610656738, 15.123279571533203, 17.017879486083984, 18.912477493286133, 20.80707550048828, 22.701675415039062, 24.596275329589844, 26.490873336791992, 28.38547134399414, 30.280071258544922, 32.1746711730957, 34.06926727294922, 35.9638671875, 37.85846710205078, 39.75306701660156, 41.647666931152344, 43.54226303100586, 45.43686294555664, 47.33146286010742, 49.22605895996094, 51.12065887451172, 53.0152587890625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 8.0, 13.0, 15.0, 27.0, 29.0, 55.0, 87.0, 151.0, 308.0, 637.0, 1824.0, 6064.0, 27112.0, 253274.0, 3762829.0, 118261.0, 17117.0, 4207.0, 1281.0, 477.0, 198.0, 89.0, 70.0, 44.0, 34.0, 18.0, 16.0, 15.0, 2.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.109375, -28.045654296875, -26.98193359375, -25.918212890625, -24.8544921875, -23.790771484375, -22.72705078125, -21.663330078125, -20.599609375, -19.535888671875, -18.47216796875, -17.408447265625, -16.3447265625, -15.281005859375, -14.21728515625, -13.153564453125, -12.08984375, -11.026123046875, -9.96240234375, -8.898681640625, -7.8349609375, -6.771240234375, -5.70751953125, -4.643798828125, -3.580078125, -2.516357421875, -1.45263671875, -0.388916015625, 0.6748046875, 1.738525390625, 2.80224609375, 3.865966796875, 4.9296875, 5.993408203125, 7.05712890625, 8.120849609375, 9.1845703125, 10.248291015625, 11.31201171875, 12.375732421875, 13.439453125, 14.503173828125, 15.56689453125, 16.630615234375, 17.6943359375, 18.758056640625, 19.82177734375, 20.885498046875, 21.94921875, 23.012939453125, 24.07666015625, 25.140380859375, 26.2041015625, 27.267822265625, 28.33154296875, 29.395263671875, 30.458984375, 31.522705078125, 32.58642578125, 33.650146484375, 34.7138671875, 35.777587890625, 36.84130859375, 37.905029296875, 38.96875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 14.0, 15.0, 10.0, 24.0, 30.0, 41.0, 50.0, 45.0, 33.0, 56.0, 53.0, 50.0, 62.0, 63.0, 70.0, 60.0, 55.0, 47.0, 47.0, 33.0, 37.0, 23.0, 15.0, 17.0, 9.0, 7.0, 10.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.38671875, -2.3218231201171875, -2.256927490234375, -2.1920318603515625, -2.12713623046875, -2.0622406005859375, -1.997344970703125, -1.9324493408203125, -1.8675537109375, -1.8026580810546875, -1.737762451171875, -1.6728668212890625, -1.60797119140625, -1.5430755615234375, -1.478179931640625, -1.4132843017578125, -1.348388671875, -1.2834930419921875, -1.218597412109375, -1.1537017822265625, -1.08880615234375, -1.0239105224609375, -0.959014892578125, -0.8941192626953125, -0.8292236328125, -0.7643280029296875, -0.699432373046875, -0.6345367431640625, -0.56964111328125, -0.5047454833984375, -0.439849853515625, -0.3749542236328125, -0.31005859375, -0.2451629638671875, -0.180267333984375, -0.1153717041015625, -0.05047607421875, 0.0144195556640625, 0.079315185546875, 0.1442108154296875, 0.2091064453125, 0.2740020751953125, 0.338897705078125, 0.4037933349609375, 0.46868896484375, 0.5335845947265625, 0.598480224609375, 0.6633758544921875, 0.728271484375, 0.7931671142578125, 0.858062744140625, 0.9229583740234375, 0.98785400390625, 1.0527496337890625, 1.117645263671875, 1.1825408935546875, 1.2474365234375, 1.3123321533203125, 1.377227783203125, 1.4421234130859375, 1.50701904296875, 1.5719146728515625, 1.636810302734375, 1.7017059326171875, 1.7666015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 10.0, 10.0, 6.0, 8.0, 19.0, 18.0, 35.0, 53.0, 88.0, 137.0, 249.0, 465.0, 980.0, 2491.0, 6795.0, 23141.0, 104052.0, 1000910.0, 2838159.0, 166190.0, 34065.0, 9949.0, 3483.0, 1458.0, 663.0, 350.0, 176.0, 98.0, 70.0, 45.0, 27.0, 25.0, 17.0, 9.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.515625, -23.85546875, -23.1953125, -22.53515625, -21.875, -21.21484375, -20.5546875, -19.89453125, -19.234375, -18.57421875, -17.9140625, -17.25390625, -16.59375, -15.93359375, -15.2734375, -14.61328125, -13.953125, -13.29296875, -12.6328125, -11.97265625, -11.3125, -10.65234375, -9.9921875, -9.33203125, -8.671875, -8.01171875, -7.3515625, -6.69140625, -6.03125, -5.37109375, -4.7109375, -4.05078125, -3.390625, -2.73046875, -2.0703125, -1.41015625, -0.75, -0.08984375, 0.5703125, 1.23046875, 1.890625, 2.55078125, 3.2109375, 3.87109375, 4.53125, 5.19140625, 5.8515625, 6.51171875, 7.171875, 7.83203125, 8.4921875, 9.15234375, 9.8125, 10.47265625, 11.1328125, 11.79296875, 12.453125, 13.11328125, 13.7734375, 14.43359375, 15.09375, 15.75390625, 16.4140625, 17.07421875, 17.734375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 3.0, 19.0, 23.0, 25.0, 58.0, 79.0, 144.0, 221.0, 427.0, 1384.0, 906.0, 346.0, 161.0, 80.0, 46.0, 49.0, 26.0, 20.0, 12.0, 10.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.46875, -6.29327392578125, -6.1177978515625, -5.94232177734375, -5.766845703125, -5.59136962890625, -5.4158935546875, -5.24041748046875, -5.06494140625, -4.88946533203125, -4.7139892578125, -4.53851318359375, -4.363037109375, -4.18756103515625, -4.0120849609375, -3.83660888671875, -3.6611328125, -3.48565673828125, -3.3101806640625, -3.13470458984375, -2.959228515625, -2.78375244140625, -2.6082763671875, -2.43280029296875, -2.25732421875, -2.08184814453125, -1.9063720703125, -1.73089599609375, -1.555419921875, -1.37994384765625, -1.2044677734375, -1.02899169921875, -0.853515625, -0.67803955078125, -0.5025634765625, -0.32708740234375, -0.151611328125, 0.02386474609375, 0.1993408203125, 0.37481689453125, 0.55029296875, 0.72576904296875, 0.9012451171875, 1.07672119140625, 1.252197265625, 1.42767333984375, 1.6031494140625, 1.77862548828125, 1.9541015625, 2.12957763671875, 2.3050537109375, 2.48052978515625, 2.656005859375, 2.83148193359375, 3.0069580078125, 3.18243408203125, 3.35791015625, 3.53338623046875, 3.7088623046875, 3.88433837890625, 4.059814453125, 4.23529052734375, 4.4107666015625, 4.58624267578125, 4.76171875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 27.0, 53.0, 92.0, 213.0, 205.0, 209.0, 119.0, 46.0, 20.0, 6.0, 6.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.61383056640625, -63.76617431640625, -61.91851806640625, -60.07086181640625, -58.22320556640625, -56.37554931640625, -54.52789306640625, -52.68023681640625, -50.83258056640625, -48.98492431640625, -47.13726806640625, -45.28961181640625, -43.44195556640625, -41.59429931640625, -39.74664306640625, -37.89898681640625, -36.051326751708984, -34.203670501708984, -32.356014251708984, -30.508358001708984, -28.660701751708984, -26.813045501708984, -24.96538734436035, -23.11773109436035, -21.27007484436035, -19.42241859436035, -17.57476234436035, -15.727105140686035, -13.879448890686035, -12.031792640686035, -10.184135437011719, -8.336479187011719, -6.488822937011719, -4.641166687011719, -2.7935099601745605, -0.9458532333374023, 0.9018030166625977, 2.7494592666625977, 4.597116470336914, 6.444772720336914, 8.292428970336914, 10.140085220336914, 11.987741470336914, 13.83539867401123, 15.68305492401123, 17.530712127685547, 19.378368377685547, 21.226024627685547, 23.073680877685547, 24.921337127685547, 26.768993377685547, 28.616649627685547, 30.464305877685547, 32.31196212768555, 34.15962219238281, 36.00727844238281, 37.85493469238281, 39.70259094238281, 41.55024719238281, 43.39790344238281, 45.24555969238281, 47.09321594238281, 48.94087219238281, 50.78852844238281, 52.63618469238281]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 9.0, 4.0, 6.0, 5.0, 7.0, 8.0, 9.0, 13.0, 14.0, 17.0, 20.0, 18.0, 19.0, 27.0, 32.0, 29.0, 28.0, 37.0, 44.0, 47.0, 47.0, 42.0, 49.0, 45.0, 39.0, 34.0, 36.0, 37.0, 36.0, 31.0, 31.0, 20.0, 31.0, 21.0, 20.0, 19.0, 12.0, 12.0, 10.0, 5.0, 10.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0], "bins": [-14.771269798278809, -14.335227012634277, -13.899185180664062, -13.463142395019531, -13.027100563049316, -12.591057777404785, -12.15501594543457, -11.718973159790039, -11.282930374145508, -10.846887588500977, -10.410845756530762, -9.97480297088623, -9.538761138916016, -9.102718353271484, -8.666675567626953, -8.230633735656738, -7.794591426849365, -7.358549118041992, -6.922506809234619, -6.486464500427246, -6.050421714782715, -5.614379405975342, -5.178337097167969, -4.7422943115234375, -4.306252479553223, -3.8702101707458496, -3.4341676235198975, -2.9981253147125244, -2.5620827674865723, -2.126040458679199, -1.6899981498718262, -1.253955602645874, -0.8179130554199219, -0.38187065720558167, 0.054171741008758545, 0.49021410942077637, 0.926256537437439, 1.3622989654541016, 1.7983412742614746, 2.2343838214874268, 2.6704261302948, 3.106468439102173, 3.542510986328125, 3.978553295135498, 4.414595603942871, 4.850638389587402, 5.286680221557617, 5.722723007202148, 6.1587653160095215, 6.5948076248168945, 7.030849933624268, 7.466892242431641, 7.902935028076172, 8.338977813720703, 8.775019645690918, 9.21106243133545, 9.647104263305664, 10.083147048950195, 10.51918888092041, 10.955231666564941, 11.391273498535156, 11.827316284179688, 12.263359069824219, 12.699400901794434, 13.135443687438965]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 4.0, 7.0, 10.0, 12.0, 20.0, 39.0, 59.0, 88.0, 145.0, 274.0, 495.0, 891.0, 1698.0, 3577.0, 7621.0, 17938.0, 46357.0, 118692.0, 261328.0, 312422.0, 165382.0, 66190.0, 25412.0, 10368.0, 4698.0, 2229.0, 1208.0, 579.0, 346.0, 161.0, 118.0, 74.0, 48.0, 16.0, 14.0, 15.0, 8.0, 2.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0546875, -9.7322998046875, -9.409912109375, -9.0875244140625, -8.76513671875, -8.4427490234375, -8.120361328125, -7.7979736328125, -7.4755859375, -7.1531982421875, -6.830810546875, -6.5084228515625, -6.18603515625, -5.8636474609375, -5.541259765625, -5.2188720703125, -4.896484375, -4.5740966796875, -4.251708984375, -3.9293212890625, -3.60693359375, -3.2845458984375, -2.962158203125, -2.6397705078125, -2.3173828125, -1.9949951171875, -1.672607421875, -1.3502197265625, -1.02783203125, -0.7054443359375, -0.383056640625, -0.0606689453125, 0.26171875, 0.5841064453125, 0.906494140625, 1.2288818359375, 1.55126953125, 1.8736572265625, 2.196044921875, 2.5184326171875, 2.8408203125, 3.1632080078125, 3.485595703125, 3.8079833984375, 4.13037109375, 4.4527587890625, 4.775146484375, 5.0975341796875, 5.419921875, 5.7423095703125, 6.064697265625, 6.3870849609375, 6.70947265625, 7.0318603515625, 7.354248046875, 7.6766357421875, 7.9990234375, 8.3214111328125, 8.643798828125, 8.9661865234375, 9.28857421875, 9.6109619140625, 9.933349609375, 10.2557373046875, 10.578125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 9.0, 7.0, 15.0, 9.0, 15.0, 22.0, 22.0, 17.0, 33.0, 35.0, 42.0, 39.0, 55.0, 53.0, 47.0, 55.0, 55.0, 44.0, 61.0, 59.0, 50.0, 36.0, 32.0, 29.0, 35.0, 26.0, 27.0, 12.0, 13.0, 8.0, 9.0, 6.0, 5.0, 11.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.810546875, -1.7529296875, -1.6953125, -1.6376953125, -1.580078125, -1.5224609375, -1.46484375, -1.4072265625, -1.349609375, -1.2919921875, -1.234375, -1.1767578125, -1.119140625, -1.0615234375, -1.00390625, -0.9462890625, -0.888671875, -0.8310546875, -0.7734375, -0.7158203125, -0.658203125, -0.6005859375, -0.54296875, -0.4853515625, -0.427734375, -0.3701171875, -0.3125, -0.2548828125, -0.197265625, -0.1396484375, -0.08203125, -0.0244140625, 0.033203125, 0.0908203125, 0.1484375, 0.2060546875, 0.263671875, 0.3212890625, 0.37890625, 0.4365234375, 0.494140625, 0.5517578125, 0.609375, 0.6669921875, 0.724609375, 0.7822265625, 0.83984375, 0.8974609375, 0.955078125, 1.0126953125, 1.0703125, 1.1279296875, 1.185546875, 1.2431640625, 1.30078125, 1.3583984375, 1.416015625, 1.4736328125, 1.53125, 1.5888671875, 1.646484375, 1.7041015625, 1.76171875, 1.8193359375, 1.876953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 7.0, 9.0, 14.0, 15.0, 19.0, 43.0, 54.0, 76.0, 98.0, 145.0, 169.0, 215.0, 427.0, 667.0, 1181.0, 2577.0, 6331.0, 18961.0, 61972.0, 197811.0, 399272.0, 242117.0, 78520.0, 23409.0, 7904.0, 2976.0, 1409.0, 715.0, 471.0, 279.0, 170.0, 142.0, 116.0, 70.0, 50.0, 46.0, 31.0, 17.0, 12.0, 13.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.7421875, -11.3927001953125, -11.043212890625, -10.6937255859375, -10.34423828125, -9.9947509765625, -9.645263671875, -9.2957763671875, -8.9462890625, -8.5968017578125, -8.247314453125, -7.8978271484375, -7.54833984375, -7.1988525390625, -6.849365234375, -6.4998779296875, -6.150390625, -5.8009033203125, -5.451416015625, -5.1019287109375, -4.75244140625, -4.4029541015625, -4.053466796875, -3.7039794921875, -3.3544921875, -3.0050048828125, -2.655517578125, -2.3060302734375, -1.95654296875, -1.6070556640625, -1.257568359375, -0.9080810546875, -0.55859375, -0.2091064453125, 0.140380859375, 0.4898681640625, 0.83935546875, 1.1888427734375, 1.538330078125, 1.8878173828125, 2.2373046875, 2.5867919921875, 2.936279296875, 3.2857666015625, 3.63525390625, 3.9847412109375, 4.334228515625, 4.6837158203125, 5.033203125, 5.3826904296875, 5.732177734375, 6.0816650390625, 6.43115234375, 6.7806396484375, 7.130126953125, 7.4796142578125, 7.8291015625, 8.1785888671875, 8.528076171875, 8.8775634765625, 9.22705078125, 9.5765380859375, 9.926025390625, 10.2755126953125, 10.625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 6.0, 2.0, 9.0, 14.0, 9.0, 10.0, 23.0, 15.0, 14.0, 27.0, 23.0, 27.0, 26.0, 30.0, 32.0, 30.0, 55.0, 48.0, 39.0, 44.0, 35.0, 36.0, 38.0, 42.0, 33.0, 32.0, 38.0, 27.0, 29.0, 22.0, 29.0, 30.0, 23.0, 18.0, 15.0, 12.0, 10.0, 16.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.73828125, -6.509033203125, -6.27978515625, -6.050537109375, -5.8212890625, -5.592041015625, -5.36279296875, -5.133544921875, -4.904296875, -4.675048828125, -4.44580078125, -4.216552734375, -3.9873046875, -3.758056640625, -3.52880859375, -3.299560546875, -3.0703125, -2.841064453125, -2.61181640625, -2.382568359375, -2.1533203125, -1.924072265625, -1.69482421875, -1.465576171875, -1.236328125, -1.007080078125, -0.77783203125, -0.548583984375, -0.3193359375, -0.090087890625, 0.13916015625, 0.368408203125, 0.59765625, 0.826904296875, 1.05615234375, 1.285400390625, 1.5146484375, 1.743896484375, 1.97314453125, 2.202392578125, 2.431640625, 2.660888671875, 2.89013671875, 3.119384765625, 3.3486328125, 3.577880859375, 3.80712890625, 4.036376953125, 4.265625, 4.494873046875, 4.72412109375, 4.953369140625, 5.1826171875, 5.411865234375, 5.64111328125, 5.870361328125, 6.099609375, 6.328857421875, 6.55810546875, 6.787353515625, 7.0166015625, 7.245849609375, 7.47509765625, 7.704345703125, 7.93359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 6.0, 3.0, 10.0, 15.0, 22.0, 30.0, 37.0, 68.0, 93.0, 139.0, 236.0, 452.0, 839.0, 1591.0, 3411.0, 7620.0, 18394.0, 52057.0, 163761.0, 388181.0, 271563.0, 89143.0, 29841.0, 11297.0, 4812.0, 2282.0, 1135.0, 595.0, 350.0, 199.0, 140.0, 61.0, 48.0, 28.0, 27.0, 12.0, 12.0, 10.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.9453125, -5.75189208984375, -5.5584716796875, -5.36505126953125, -5.171630859375, -4.97821044921875, -4.7847900390625, -4.59136962890625, -4.39794921875, -4.20452880859375, -4.0111083984375, -3.81768798828125, -3.624267578125, -3.43084716796875, -3.2374267578125, -3.04400634765625, -2.8505859375, -2.65716552734375, -2.4637451171875, -2.27032470703125, -2.076904296875, -1.88348388671875, -1.6900634765625, -1.49664306640625, -1.30322265625, -1.10980224609375, -0.9163818359375, -0.72296142578125, -0.529541015625, -0.33612060546875, -0.1427001953125, 0.05072021484375, 0.244140625, 0.43756103515625, 0.6309814453125, 0.82440185546875, 1.017822265625, 1.21124267578125, 1.4046630859375, 1.59808349609375, 1.79150390625, 1.98492431640625, 2.1783447265625, 2.37176513671875, 2.565185546875, 2.75860595703125, 2.9520263671875, 3.14544677734375, 3.3388671875, 3.53228759765625, 3.7257080078125, 3.91912841796875, 4.112548828125, 4.30596923828125, 4.4993896484375, 4.69281005859375, 4.88623046875, 5.07965087890625, 5.2730712890625, 5.46649169921875, 5.659912109375, 5.85333251953125, 6.0467529296875, 6.24017333984375, 6.43359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 8.0, 8.0, 21.0, 33.0, 35.0, 39.0, 51.0, 58.0, 99.0, 140.0, 128.0, 97.0, 60.0, 56.0, 49.0, 31.0, 21.0, 16.0, 9.0, 9.0, 8.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007333755493164062, -0.0007014721632003784, -0.0006695687770843506, -0.0006376653909683228, -0.0006057620048522949, -0.0005738586187362671, -0.0005419552326202393, -0.0005100518465042114, -0.0004781484603881836, -0.00044624507427215576, -0.00041434168815612793, -0.0003824383020401001, -0.00035053491592407227, -0.00031863152980804443, -0.0002867281436920166, -0.00025482475757598877, -0.00022292137145996094, -0.0001910179853439331, -0.00015911459922790527, -0.00012721121311187744, -9.530782699584961e-05, -6.340444087982178e-05, -3.1501054763793945e-05, 4.023313522338867e-07, 3.230571746826172e-05, 6.420910358428955e-05, 9.611248970031738e-05, 0.00012801587581634521, 0.00015991926193237305, 0.00019182264804840088, 0.0002237260341644287, 0.00025562942028045654, 0.0002875328063964844, 0.0003194361925125122, 0.00035133957862854004, 0.00038324296474456787, 0.0004151463508605957, 0.00044704973697662354, 0.00047895312309265137, 0.0005108565092086792, 0.000542759895324707, 0.0005746632814407349, 0.0006065666675567627, 0.0006384700536727905, 0.0006703734397888184, 0.0007022768259048462, 0.000734180212020874, 0.0007660835981369019, 0.0007979869842529297, 0.0008298903703689575, 0.0008617937564849854, 0.0008936971426010132, 0.000925600528717041, 0.0009575039148330688, 0.0009894073009490967, 0.0010213106870651245, 0.0010532140731811523, 0.0010851174592971802, 0.001117020845413208, 0.0011489242315292358, 0.0011808276176452637, 0.0012127310037612915, 0.0012446343898773193, 0.0012765377759933472, 0.001308441162109375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 10.0, 7.0, 7.0, 14.0, 20.0, 35.0, 62.0, 69.0, 153.0, 205.0, 440.0, 887.0, 1980.0, 5328.0, 19398.0, 109608.0, 578463.0, 276354.0, 40649.0, 9212.0, 3009.0, 1232.0, 610.0, 325.0, 188.0, 93.0, 62.0, 44.0, 28.0, 23.0, 13.0, 13.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-10.7890625, -10.43798828125, -10.0869140625, -9.73583984375, -9.384765625, -9.03369140625, -8.6826171875, -8.33154296875, -7.98046875, -7.62939453125, -7.2783203125, -6.92724609375, -6.576171875, -6.22509765625, -5.8740234375, -5.52294921875, -5.171875, -4.82080078125, -4.4697265625, -4.11865234375, -3.767578125, -3.41650390625, -3.0654296875, -2.71435546875, -2.36328125, -2.01220703125, -1.6611328125, -1.31005859375, -0.958984375, -0.60791015625, -0.2568359375, 0.09423828125, 0.4453125, 0.79638671875, 1.1474609375, 1.49853515625, 1.849609375, 2.20068359375, 2.5517578125, 2.90283203125, 3.25390625, 3.60498046875, 3.9560546875, 4.30712890625, 4.658203125, 5.00927734375, 5.3603515625, 5.71142578125, 6.0625, 6.41357421875, 6.7646484375, 7.11572265625, 7.466796875, 7.81787109375, 8.1689453125, 8.52001953125, 8.87109375, 9.22216796875, 9.5732421875, 9.92431640625, 10.275390625, 10.62646484375, 10.9775390625, 11.32861328125, 11.6796875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 13.0, 6.0, 16.0, 7.0, 21.0, 47.0, 40.0, 78.0, 81.0, 93.0, 116.0, 105.0, 94.0, 82.0, 51.0, 33.0, 37.0, 17.0, 16.0, 11.0, 10.0, 8.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.63079833984375, -8.4022216796875, -8.17364501953125, -7.945068359375, -7.71649169921875, -7.4879150390625, -7.25933837890625, -7.03076171875, -6.80218505859375, -6.5736083984375, -6.34503173828125, -6.116455078125, -5.88787841796875, -5.6593017578125, -5.43072509765625, -5.2021484375, -4.97357177734375, -4.7449951171875, -4.51641845703125, -4.287841796875, -4.05926513671875, -3.8306884765625, -3.60211181640625, -3.37353515625, -3.14495849609375, -2.9163818359375, -2.68780517578125, -2.459228515625, -2.23065185546875, -2.0020751953125, -1.77349853515625, -1.544921875, -1.31634521484375, -1.0877685546875, -0.85919189453125, -0.630615234375, -0.40203857421875, -0.1734619140625, 0.05511474609375, 0.28369140625, 0.51226806640625, 0.7408447265625, 0.96942138671875, 1.197998046875, 1.42657470703125, 1.6551513671875, 1.88372802734375, 2.1123046875, 2.34088134765625, 2.5694580078125, 2.79803466796875, 3.026611328125, 3.25518798828125, 3.4837646484375, 3.71234130859375, 3.94091796875, 4.16949462890625, 4.3980712890625, 4.62664794921875, 4.855224609375, 5.08380126953125, 5.3123779296875, 5.54095458984375, 5.76953125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 2.0, 13.0, 11.0, 28.0, 64.0, 154.0, 189.0, 197.0, 162.0, 95.0, 40.0, 27.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.34928512573242, -53.4930305480957, -49.63677215576172, -45.780517578125, -41.924259185791016, -38.0680046081543, -34.21174621582031, -30.355491638183594, -26.499235153198242, -22.64297866821289, -18.78672218322754, -14.930466651916504, -11.074210166931152, -7.217954635620117, -3.3616981506347656, 0.49455833435058594, 4.3508148193359375, 8.207071304321289, 12.06332778930664, 15.919583320617676, 19.775840759277344, 23.632095336914062, 27.488351821899414, 31.344608306884766, 35.20086669921875, 39.05712127685547, 42.91337966918945, 46.76963424682617, 50.625892639160156, 54.482147216796875, 58.338401794433594, 62.19466018676758, 66.05091094970703, 69.90716552734375, 73.76342010498047, 77.61968231201172, 81.47593688964844, 85.33219146728516, 89.18844604492188, 93.04470825195312, 96.90096282958984, 100.75721740722656, 104.61347198486328, 108.46973419189453, 112.32598876953125, 116.18224334716797, 120.03849792480469, 123.89476013183594, 127.75100708007812, 131.60726928710938, 135.46351623535156, 139.3197784423828, 143.176025390625, 147.03228759765625, 150.8885498046875, 154.7447967529297, 158.60105895996094, 162.4573211669922, 166.31356811523438, 170.16983032226562, 174.0260772705078, 177.88233947753906, 181.7386016845703, 185.5948486328125, 189.45111083984375]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 9.0, 19.0, 18.0, 15.0, 17.0, 31.0, 38.0, 46.0, 39.0, 56.0, 48.0, 55.0, 76.0, 73.0, 59.0, 55.0, 52.0, 57.0, 41.0, 38.0, 41.0, 20.0, 27.0, 14.0, 19.0, 6.0, 13.0, 4.0, 4.0, 6.0, 5.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.7430534362793, -56.71745300292969, -54.691856384277344, -52.666259765625, -50.64065933227539, -48.61505889892578, -46.58946228027344, -44.563865661621094, -42.538265228271484, -40.512664794921875, -38.48706817626953, -36.46147155761719, -34.43587112426758, -32.41027069091797, -30.384674072265625, -28.35907554626465, -26.333477020263672, -24.307878494262695, -22.28227996826172, -20.256681442260742, -18.231082916259766, -16.20548439025879, -14.179885864257812, -12.154287338256836, -10.12868881225586, -8.103090286254883, -6.077491760253906, -4.05189323425293, -2.026294708251953, -0.0006961822509765625, 2.02490234375, 4.050500869750977, 6.0760955810546875, 8.101694107055664, 10.12729263305664, 12.152891159057617, 14.178489685058594, 16.20408821105957, 18.229686737060547, 20.255285263061523, 22.2808837890625, 24.306482315063477, 26.332080841064453, 28.35767936706543, 30.383277893066406, 32.40887451171875, 34.43447494506836, 36.46007537841797, 38.48567199707031, 40.511268615722656, 42.536869049072266, 44.562469482421875, 46.58806610107422, 48.61366271972656, 50.63926315307617, 52.66486358642578, 54.690460205078125, 56.71605682373047, 58.74165725708008, 60.76725769042969, 62.79285430908203, 64.81845092773438, 66.84405517578125, 68.8696517944336, 70.89524841308594]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 8.0, 2.0, 9.0, 8.0, 9.0, 19.0, 28.0, 36.0, 54.0, 70.0, 131.0, 175.0, 298.0, 446.0, 707.0, 1127.0, 2190.0, 4158.0, 8377.0, 20382.0, 59040.0, 275136.0, 3428045.0, 294209.0, 61284.0, 20883.0, 8513.0, 3941.0, 2027.0, 1102.0, 672.0, 387.0, 255.0, 183.0, 119.0, 69.0, 58.0, 39.0, 20.0, 19.0, 17.0, 8.0, 3.0, 10.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.23193359375, -11.8310546875, -11.43017578125, -11.029296875, -10.62841796875, -10.2275390625, -9.82666015625, -9.42578125, -9.02490234375, -8.6240234375, -8.22314453125, -7.822265625, -7.42138671875, -7.0205078125, -6.61962890625, -6.21875, -5.81787109375, -5.4169921875, -5.01611328125, -4.615234375, -4.21435546875, -3.8134765625, -3.41259765625, -3.01171875, -2.61083984375, -2.2099609375, -1.80908203125, -1.408203125, -1.00732421875, -0.6064453125, -0.20556640625, 0.1953125, 0.59619140625, 0.9970703125, 1.39794921875, 1.798828125, 2.19970703125, 2.6005859375, 3.00146484375, 3.40234375, 3.80322265625, 4.2041015625, 4.60498046875, 5.005859375, 5.40673828125, 5.8076171875, 6.20849609375, 6.609375, 7.01025390625, 7.4111328125, 7.81201171875, 8.212890625, 8.61376953125, 9.0146484375, 9.41552734375, 9.81640625, 10.21728515625, 10.6181640625, 11.01904296875, 11.419921875, 11.82080078125, 12.2216796875, 12.62255859375, 13.0234375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 6.0, 9.0, 14.0, 19.0, 19.0, 30.0, 18.0, 35.0, 27.0, 46.0, 59.0, 65.0, 65.0, 59.0, 69.0, 56.0, 59.0, 63.0, 57.0, 45.0, 36.0, 38.0, 18.0, 16.0, 15.0, 16.0, 10.0, 6.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.248046875, -2.1822662353515625, -2.116485595703125, -2.0507049560546875, -1.98492431640625, -1.9191436767578125, -1.853363037109375, -1.7875823974609375, -1.7218017578125, -1.6560211181640625, -1.590240478515625, -1.5244598388671875, -1.45867919921875, -1.3928985595703125, -1.327117919921875, -1.2613372802734375, -1.195556640625, -1.1297760009765625, -1.063995361328125, -0.9982147216796875, -0.93243408203125, -0.8666534423828125, -0.800872802734375, -0.7350921630859375, -0.6693115234375, -0.6035308837890625, -0.537750244140625, -0.4719696044921875, -0.40618896484375, -0.3404083251953125, -0.274627685546875, -0.2088470458984375, -0.14306640625, -0.0772857666015625, -0.011505126953125, 0.0542755126953125, 0.12005615234375, 0.1858367919921875, 0.251617431640625, 0.3173980712890625, 0.3831787109375, 0.4489593505859375, 0.514739990234375, 0.5805206298828125, 0.64630126953125, 0.7120819091796875, 0.777862548828125, 0.8436431884765625, 0.909423828125, 0.9752044677734375, 1.040985107421875, 1.1067657470703125, 1.17254638671875, 1.2383270263671875, 1.304107666015625, 1.3698883056640625, 1.4356689453125, 1.5014495849609375, 1.567230224609375, 1.6330108642578125, 1.69879150390625, 1.7645721435546875, 1.830352783203125, 1.8961334228515625, 1.9619140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 13.0, 14.0, 36.0, 27.0, 42.0, 71.0, 117.0, 157.0, 272.0, 492.0, 777.0, 1392.0, 2726.0, 5150.0, 11017.0, 26416.0, 71085.0, 245670.0, 2413950.0, 1133827.0, 183747.0, 56165.0, 21279.0, 9388.0, 4556.0, 2361.0, 1410.0, 820.0, 446.0, 314.0, 183.0, 118.0, 85.0, 54.0, 38.0, 26.0, 12.0, 11.0, 7.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.375, -10.0496826171875, -9.724365234375, -9.3990478515625, -9.07373046875, -8.7484130859375, -8.423095703125, -8.0977783203125, -7.7724609375, -7.4471435546875, -7.121826171875, -6.7965087890625, -6.47119140625, -6.1458740234375, -5.820556640625, -5.4952392578125, -5.169921875, -4.8446044921875, -4.519287109375, -4.1939697265625, -3.86865234375, -3.5433349609375, -3.218017578125, -2.8927001953125, -2.5673828125, -2.2420654296875, -1.916748046875, -1.5914306640625, -1.26611328125, -0.9407958984375, -0.615478515625, -0.2901611328125, 0.03515625, 0.3604736328125, 0.685791015625, 1.0111083984375, 1.33642578125, 1.6617431640625, 1.987060546875, 2.3123779296875, 2.6376953125, 2.9630126953125, 3.288330078125, 3.6136474609375, 3.93896484375, 4.2642822265625, 4.589599609375, 4.9149169921875, 5.240234375, 5.5655517578125, 5.890869140625, 6.2161865234375, 6.54150390625, 6.8668212890625, 7.192138671875, 7.5174560546875, 7.8427734375, 8.1680908203125, 8.493408203125, 8.8187255859375, 9.14404296875, 9.4693603515625, 9.794677734375, 10.1199951171875, 10.4453125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 4.0, 4.0, 15.0, 19.0, 22.0, 31.0, 27.0, 51.0, 58.0, 84.0, 102.0, 188.0, 340.0, 793.0, 1163.0, 431.0, 238.0, 162.0, 95.0, 68.0, 36.0, 28.0, 21.0, 17.0, 11.0, 7.0, 15.0, 7.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.5703125, -3.46246337890625, -3.3546142578125, -3.24676513671875, -3.138916015625, -3.03106689453125, -2.9232177734375, -2.81536865234375, -2.70751953125, -2.59967041015625, -2.4918212890625, -2.38397216796875, -2.276123046875, -2.16827392578125, -2.0604248046875, -1.95257568359375, -1.8447265625, -1.73687744140625, -1.6290283203125, -1.52117919921875, -1.413330078125, -1.30548095703125, -1.1976318359375, -1.08978271484375, -0.98193359375, -0.87408447265625, -0.7662353515625, -0.65838623046875, -0.550537109375, -0.44268798828125, -0.3348388671875, -0.22698974609375, -0.119140625, -0.01129150390625, 0.0965576171875, 0.20440673828125, 0.312255859375, 0.42010498046875, 0.5279541015625, 0.63580322265625, 0.74365234375, 0.85150146484375, 0.9593505859375, 1.06719970703125, 1.175048828125, 1.28289794921875, 1.3907470703125, 1.49859619140625, 1.6064453125, 1.71429443359375, 1.8221435546875, 1.92999267578125, 2.037841796875, 2.14569091796875, 2.2535400390625, 2.36138916015625, 2.46923828125, 2.57708740234375, 2.6849365234375, 2.79278564453125, 2.900634765625, 3.00848388671875, 3.1163330078125, 3.22418212890625, 3.33203125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 9.0, 5.0, 17.0, 25.0, 63.0, 86.0, 123.0, 151.0, 144.0, 130.0, 97.0, 79.0, 35.0, 13.0, 13.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-49.85492706298828, -48.840660095214844, -47.82638931274414, -46.81211853027344, -45.7978515625, -44.78358459472656, -43.76931381225586, -42.755043029785156, -41.74077606201172, -40.72650909423828, -39.71223831176758, -38.697967529296875, -37.68370056152344, -36.66943359375, -35.6551628112793, -34.640892028808594, -33.626625061035156, -32.61235809326172, -31.598087310791016, -30.583818435668945, -29.569549560546875, -28.555280685424805, -27.541011810302734, -26.526742935180664, -25.512474060058594, -24.498205184936523, -23.483936309814453, -22.469667434692383, -21.455398559570312, -20.441129684448242, -19.426860809326172, -18.4125919342041, -17.39832305908203, -16.38405418395996, -15.36978530883789, -14.35551643371582, -13.34124755859375, -12.32697868347168, -11.31270980834961, -10.298440933227539, -9.284172058105469, -8.269903182983398, -7.255634307861328, -6.241365432739258, -5.2270965576171875, -4.212827682495117, -3.198558807373047, -2.1842899322509766, -1.1700210571289062, -0.15575218200683594, 0.8585166931152344, 1.8727855682373047, 2.887054443359375, 3.9013233184814453, 4.915592193603516, 5.929861068725586, 6.944129943847656, 7.958398818969727, 8.972667694091797, 9.986936569213867, 11.001205444335938, 12.015474319458008, 13.029743194580078, 14.044012069702148, 15.058280944824219]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 6.0, 3.0, 11.0, 16.0, 19.0, 34.0, 29.0, 31.0, 35.0, 52.0, 48.0, 59.0, 59.0, 59.0, 66.0, 55.0, 69.0, 55.0, 62.0, 51.0, 34.0, 38.0, 27.0, 19.0, 27.0, 12.0, 6.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.20915985107422, -23.619915008544922, -23.030668258666992, -22.441423416137695, -21.8521785736084, -21.2629337310791, -20.673686981201172, -20.084442138671875, -19.495197296142578, -18.90595245361328, -18.31670570373535, -17.727460861206055, -17.138216018676758, -16.54897117614746, -15.959724426269531, -15.370479583740234, -14.781233787536621, -14.191987991333008, -13.602743148803711, -13.013497352600098, -12.4242525100708, -11.835006713867188, -11.24576187133789, -10.656516075134277, -10.067270278930664, -9.47802448272705, -8.888779640197754, -8.29953384399414, -7.710289001464844, -7.1210432052612305, -6.531797885894775, -5.94255256652832, -5.353307723999023, -4.764062404632568, -4.174817085266113, -3.585571527481079, -2.996326208114624, -2.407080888748169, -1.8178353309631348, -1.2285900115966797, -0.6393446922302246, -0.050099313259124756, 0.5391460657119751, 1.1283915042877197, 1.7176368236541748, 2.30688214302063, 2.896127700805664, 3.485373020172119, 4.074618339538574, 4.663863658905029, 5.253108978271484, 5.842354774475098, 6.4315996170043945, 7.020845413208008, 7.610090732574463, 8.199336051940918, 8.788581848144531, 9.377827644348145, 9.967072486877441, 10.556318283081055, 11.145563125610352, 11.734808921813965, 12.324054718017578, 12.913299560546875, 13.502544403076172]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 6.0, 11.0, 7.0, 11.0, 19.0, 34.0, 40.0, 82.0, 118.0, 178.0, 274.0, 471.0, 816.0, 1451.0, 2513.0, 4575.0, 9051.0, 18303.0, 39898.0, 85764.0, 175518.0, 267942.0, 219913.0, 116496.0, 54529.0, 25034.0, 11878.0, 6078.0, 3153.0, 1804.0, 1017.0, 580.0, 359.0, 237.0, 155.0, 91.0, 45.0, 33.0, 19.0, 12.0, 10.0, 6.0, 4.0, 8.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.09375, -6.8699951171875, -6.646240234375, -6.4224853515625, -6.19873046875, -5.9749755859375, -5.751220703125, -5.5274658203125, -5.3037109375, -5.0799560546875, -4.856201171875, -4.6324462890625, -4.40869140625, -4.1849365234375, -3.961181640625, -3.7374267578125, -3.513671875, -3.2899169921875, -3.066162109375, -2.8424072265625, -2.61865234375, -2.3948974609375, -2.171142578125, -1.9473876953125, -1.7236328125, -1.4998779296875, -1.276123046875, -1.0523681640625, -0.82861328125, -0.6048583984375, -0.381103515625, -0.1573486328125, 0.06640625, 0.2901611328125, 0.513916015625, 0.7376708984375, 0.96142578125, 1.1851806640625, 1.408935546875, 1.6326904296875, 1.8564453125, 2.0802001953125, 2.303955078125, 2.5277099609375, 2.75146484375, 2.9752197265625, 3.198974609375, 3.4227294921875, 3.646484375, 3.8702392578125, 4.093994140625, 4.3177490234375, 4.54150390625, 4.7652587890625, 4.989013671875, 5.2127685546875, 5.4365234375, 5.6602783203125, 5.884033203125, 6.1077880859375, 6.33154296875, 6.5552978515625, 6.779052734375, 7.0028076171875, 7.2265625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 8.0, 6.0, 12.0, 6.0, 13.0, 19.0, 23.0, 22.0, 15.0, 27.0, 40.0, 40.0, 39.0, 47.0, 61.0, 57.0, 48.0, 51.0, 64.0, 56.0, 52.0, 44.0, 34.0, 36.0, 37.0, 31.0, 24.0, 16.0, 19.0, 9.0, 8.0, 12.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0], "bins": [-2.068359375, -2.01104736328125, -1.9537353515625, -1.89642333984375, -1.839111328125, -1.78179931640625, -1.7244873046875, -1.66717529296875, -1.60986328125, -1.55255126953125, -1.4952392578125, -1.43792724609375, -1.380615234375, -1.32330322265625, -1.2659912109375, -1.20867919921875, -1.1513671875, -1.09405517578125, -1.0367431640625, -0.97943115234375, -0.922119140625, -0.86480712890625, -0.8074951171875, -0.75018310546875, -0.69287109375, -0.63555908203125, -0.5782470703125, -0.52093505859375, -0.463623046875, -0.40631103515625, -0.3489990234375, -0.29168701171875, -0.234375, -0.17706298828125, -0.1197509765625, -0.06243896484375, -0.005126953125, 0.05218505859375, 0.1094970703125, 0.16680908203125, 0.22412109375, 0.28143310546875, 0.3387451171875, 0.39605712890625, 0.453369140625, 0.51068115234375, 0.5679931640625, 0.62530517578125, 0.6826171875, 0.73992919921875, 0.7972412109375, 0.85455322265625, 0.911865234375, 0.96917724609375, 1.0264892578125, 1.08380126953125, 1.14111328125, 1.19842529296875, 1.2557373046875, 1.31304931640625, 1.370361328125, 1.42767333984375, 1.4849853515625, 1.54229736328125, 1.599609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 8.0, 9.0, 7.0, 11.0, 8.0, 20.0, 25.0, 24.0, 49.0, 71.0, 99.0, 120.0, 159.0, 209.0, 275.0, 462.0, 711.0, 1291.0, 2642.0, 6015.0, 15805.0, 45176.0, 133180.0, 313255.0, 317818.0, 136205.0, 46561.0, 16087.0, 6129.0, 2567.0, 1312.0, 710.0, 457.0, 301.0, 195.0, 150.0, 119.0, 79.0, 50.0, 45.0, 36.0, 22.0, 23.0, 18.0, 14.0, 5.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-8.453125, -8.1805419921875, -7.907958984375, -7.6353759765625, -7.36279296875, -7.0902099609375, -6.817626953125, -6.5450439453125, -6.2724609375, -5.9998779296875, -5.727294921875, -5.4547119140625, -5.18212890625, -4.9095458984375, -4.636962890625, -4.3643798828125, -4.091796875, -3.8192138671875, -3.546630859375, -3.2740478515625, -3.00146484375, -2.7288818359375, -2.456298828125, -2.1837158203125, -1.9111328125, -1.6385498046875, -1.365966796875, -1.0933837890625, -0.82080078125, -0.5482177734375, -0.275634765625, -0.0030517578125, 0.26953125, 0.5421142578125, 0.814697265625, 1.0872802734375, 1.35986328125, 1.6324462890625, 1.905029296875, 2.1776123046875, 2.4501953125, 2.7227783203125, 2.995361328125, 3.2679443359375, 3.54052734375, 3.8131103515625, 4.085693359375, 4.3582763671875, 4.630859375, 4.9034423828125, 5.176025390625, 5.4486083984375, 5.72119140625, 5.9937744140625, 6.266357421875, 6.5389404296875, 6.8115234375, 7.0841064453125, 7.356689453125, 7.6292724609375, 7.90185546875, 8.1744384765625, 8.447021484375, 8.7196044921875, 8.9921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 6.0, 3.0, 10.0, 8.0, 13.0, 15.0, 20.0, 19.0, 20.0, 20.0, 27.0, 32.0, 43.0, 34.0, 39.0, 39.0, 48.0, 42.0, 46.0, 37.0, 51.0, 37.0, 37.0, 34.0, 37.0, 32.0, 29.0, 29.0, 36.0, 29.0, 13.0, 24.0, 20.0, 10.0, 21.0, 13.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0703125, -6.83978271484375, -6.6092529296875, -6.37872314453125, -6.148193359375, -5.91766357421875, -5.6871337890625, -5.45660400390625, -5.22607421875, -4.99554443359375, -4.7650146484375, -4.53448486328125, -4.303955078125, -4.07342529296875, -3.8428955078125, -3.61236572265625, -3.3818359375, -3.15130615234375, -2.9207763671875, -2.69024658203125, -2.459716796875, -2.22918701171875, -1.9986572265625, -1.76812744140625, -1.53759765625, -1.30706787109375, -1.0765380859375, -0.84600830078125, -0.615478515625, -0.38494873046875, -0.1544189453125, 0.07611083984375, 0.306640625, 0.53717041015625, 0.7677001953125, 0.99822998046875, 1.228759765625, 1.45928955078125, 1.6898193359375, 1.92034912109375, 2.15087890625, 2.38140869140625, 2.6119384765625, 2.84246826171875, 3.072998046875, 3.30352783203125, 3.5340576171875, 3.76458740234375, 3.9951171875, 4.22564697265625, 4.4561767578125, 4.68670654296875, 4.917236328125, 5.14776611328125, 5.3782958984375, 5.60882568359375, 5.83935546875, 6.06988525390625, 6.3004150390625, 6.53094482421875, 6.761474609375, 6.99200439453125, 7.2225341796875, 7.45306396484375, 7.68359375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 8.0, 20.0, 12.0, 16.0, 25.0, 32.0, 46.0, 97.0, 110.0, 230.0, 332.0, 620.0, 1195.0, 2501.0, 6187.0, 16943.0, 57421.0, 226527.0, 461882.0, 198050.0, 50509.0, 15345.0, 5418.0, 2378.0, 1102.0, 592.0, 351.0, 217.0, 110.0, 78.0, 56.0, 37.0, 23.0, 15.0, 15.0, 11.0, 10.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.31640625, -6.133056640625, -5.94970703125, -5.766357421875, -5.5830078125, -5.399658203125, -5.21630859375, -5.032958984375, -4.849609375, -4.666259765625, -4.48291015625, -4.299560546875, -4.1162109375, -3.932861328125, -3.74951171875, -3.566162109375, -3.3828125, -3.199462890625, -3.01611328125, -2.832763671875, -2.6494140625, -2.466064453125, -2.28271484375, -2.099365234375, -1.916015625, -1.732666015625, -1.54931640625, -1.365966796875, -1.1826171875, -0.999267578125, -0.81591796875, -0.632568359375, -0.44921875, -0.265869140625, -0.08251953125, 0.100830078125, 0.2841796875, 0.467529296875, 0.65087890625, 0.834228515625, 1.017578125, 1.200927734375, 1.38427734375, 1.567626953125, 1.7509765625, 1.934326171875, 2.11767578125, 2.301025390625, 2.484375, 2.667724609375, 2.85107421875, 3.034423828125, 3.2177734375, 3.401123046875, 3.58447265625, 3.767822265625, 3.951171875, 4.134521484375, 4.31787109375, 4.501220703125, 4.6845703125, 4.867919921875, 5.05126953125, 5.234619140625, 5.41796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 1.0, 6.0, 9.0, 4.0, 12.0, 15.0, 18.0, 28.0, 45.0, 60.0, 90.0, 100.0, 129.0, 119.0, 89.0, 67.0, 52.0, 36.0, 25.0, 21.0, 17.0, 10.0, 9.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0010824203491210938, -0.0010512322187423706, -0.0010200440883636475, -0.0009888559579849243, -0.0009576678276062012, -0.000926479697227478, -0.0008952915668487549, -0.0008641034364700317, -0.0008329153060913086, -0.0008017271757125854, -0.0007705390453338623, -0.0007393509149551392, -0.000708162784576416, -0.0006769746541976929, -0.0006457865238189697, -0.0006145983934402466, -0.0005834102630615234, -0.0005522221326828003, -0.0005210340023040771, -0.000489845871925354, -0.00045865774154663086, -0.0004274696111679077, -0.00039628148078918457, -0.0003650933504104614, -0.0003339052200317383, -0.00030271708965301514, -0.000271528959274292, -0.00024034082889556885, -0.0002091526985168457, -0.00017796456813812256, -0.00014677643775939941, -0.00011558830738067627, -8.440017700195312e-05, -5.321204662322998e-05, -2.2023916244506836e-05, 9.164214134216309e-06, 4.035234451293945e-05, 7.15404748916626e-05, 0.00010272860527038574, 0.0001339167356491089, 0.00016510486602783203, 0.00019629299640655518, 0.00022748112678527832, 0.00025866925716400146, 0.0002898573875427246, 0.00032104551792144775, 0.0003522336483001709, 0.00038342177867889404, 0.0004146099090576172, 0.00044579803943634033, 0.0004769861698150635, 0.0005081743001937866, 0.0005393624305725098, 0.0005705505609512329, 0.0006017386913299561, 0.0006329268217086792, 0.0006641149520874023, 0.0006953030824661255, 0.0007264912128448486, 0.0007576793432235718, 0.0007888674736022949, 0.0008200556039810181, 0.0008512437343597412, 0.0008824318647384644, 0.0009136199951171875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 14.0, 17.0, 29.0, 69.0, 156.0, 432.0, 1366.0, 6219.0, 62667.0, 798406.0, 164916.0, 11173.0, 2031.0, 633.0, 208.0, 102.0, 42.0, 27.0, 19.0, 8.0, 9.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0078125, -13.5189208984375, -13.030029296875, -12.5411376953125, -12.05224609375, -11.5633544921875, -11.074462890625, -10.5855712890625, -10.0966796875, -9.6077880859375, -9.118896484375, -8.6300048828125, -8.14111328125, -7.6522216796875, -7.163330078125, -6.6744384765625, -6.185546875, -5.6966552734375, -5.207763671875, -4.7188720703125, -4.22998046875, -3.7410888671875, -3.252197265625, -2.7633056640625, -2.2744140625, -1.7855224609375, -1.296630859375, -0.8077392578125, -0.31884765625, 0.1700439453125, 0.658935546875, 1.1478271484375, 1.63671875, 2.1256103515625, 2.614501953125, 3.1033935546875, 3.59228515625, 4.0811767578125, 4.570068359375, 5.0589599609375, 5.5478515625, 6.0367431640625, 6.525634765625, 7.0145263671875, 7.50341796875, 7.9923095703125, 8.481201171875, 8.9700927734375, 9.458984375, 9.9478759765625, 10.436767578125, 10.9256591796875, 11.41455078125, 11.9034423828125, 12.392333984375, 12.8812255859375, 13.3701171875, 13.8590087890625, 14.347900390625, 14.8367919921875, 15.32568359375, 15.8145751953125, 16.303466796875, 16.7923583984375, 17.28125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 9.0, 14.0, 9.0, 8.0, 26.0, 36.0, 43.0, 62.0, 80.0, 80.0, 85.0, 110.0, 91.0, 70.0, 84.0, 45.0, 38.0, 28.0, 21.0, 10.0, 10.0, 11.0, 5.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.67578125, -4.50274658203125, -4.3297119140625, -4.15667724609375, -3.983642578125, -3.81060791015625, -3.6375732421875, -3.46453857421875, -3.29150390625, -3.11846923828125, -2.9454345703125, -2.77239990234375, -2.599365234375, -2.42633056640625, -2.2532958984375, -2.08026123046875, -1.9072265625, -1.73419189453125, -1.5611572265625, -1.38812255859375, -1.215087890625, -1.04205322265625, -0.8690185546875, -0.69598388671875, -0.52294921875, -0.34991455078125, -0.1768798828125, -0.00384521484375, 0.169189453125, 0.34222412109375, 0.5152587890625, 0.68829345703125, 0.861328125, 1.03436279296875, 1.2073974609375, 1.38043212890625, 1.553466796875, 1.72650146484375, 1.8995361328125, 2.07257080078125, 2.24560546875, 2.41864013671875, 2.5916748046875, 2.76470947265625, 2.937744140625, 3.11077880859375, 3.2838134765625, 3.45684814453125, 3.6298828125, 3.80291748046875, 3.9759521484375, 4.14898681640625, 4.322021484375, 4.49505615234375, 4.6680908203125, 4.84112548828125, 5.01416015625, 5.18719482421875, 5.3602294921875, 5.53326416015625, 5.706298828125, 5.87933349609375, 6.0523681640625, 6.22540283203125, 6.3984375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 16.0, 14.0, 19.0, 27.0, 44.0, 64.0, 102.0, 121.0, 120.0, 119.0, 109.0, 86.0, 53.0, 38.0, 21.0, 15.0, 15.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.699615478515625, -58.52817153930664, -56.35673141479492, -54.18528747558594, -52.01384735107422, -49.842403411865234, -47.67095947265625, -45.49951934814453, -43.32807922363281, -41.15663528442383, -38.98519515991211, -36.813751220703125, -34.642311096191406, -32.47086715698242, -30.29942512512207, -28.12798309326172, -25.956539154052734, -23.785097122192383, -21.61365509033203, -19.442211151123047, -17.270771026611328, -15.09932804107666, -12.927885055541992, -10.75644302368164, -8.585000991821289, -6.4135589599609375, -4.242116451263428, -2.070673942565918, 0.1007680892944336, 2.272210121154785, 4.443653106689453, 6.615095138549805, 8.786537170410156, 10.957979202270508, 13.12942123413086, 15.300864219665527, 17.472305297851562, 19.643749237060547, 21.8151912689209, 23.98663330078125, 26.1580753326416, 28.329517364501953, 30.500959396362305, 32.672401428222656, 34.84384536743164, 37.01528549194336, 39.186729431152344, 41.35816955566406, 43.52961349487305, 45.70105743408203, 47.87249755859375, 50.043941497802734, 52.21538162231445, 54.38682556152344, 56.558265686035156, 58.72970962524414, 60.901153564453125, 63.07259750366211, 65.2440414428711, 67.41548156738281, 69.58692169189453, 71.75836181640625, 73.9298095703125, 76.10124969482422, 78.27268981933594]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 7.0, 6.0, 10.0, 17.0, 15.0, 22.0, 16.0, 26.0, 41.0, 46.0, 43.0, 50.0, 47.0, 61.0, 49.0, 61.0, 51.0, 42.0, 54.0, 60.0, 52.0, 34.0, 31.0, 35.0, 35.0, 18.0, 17.0, 10.0, 23.0, 1.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-58.58982467651367, -56.99394989013672, -55.3980712890625, -53.80219650268555, -52.206321716308594, -50.610443115234375, -49.01456832885742, -47.41869354248047, -45.82281494140625, -44.2269401550293, -42.63106155395508, -41.035186767578125, -39.43931198120117, -37.84343719482422, -36.24755859375, -34.65168380737305, -33.055809020996094, -31.459932327270508, -29.864057540893555, -28.26818084716797, -26.672306060791016, -25.07642936706543, -23.480552673339844, -21.88467788696289, -20.288801193237305, -18.69292449951172, -17.097049713134766, -15.50117301940918, -13.90529727935791, -12.30942153930664, -10.713544845581055, -9.117669105529785, -7.521797180175781, -5.925921440124512, -4.330045223236084, -2.7341690063476562, -1.1382932662963867, 0.4575824737548828, 2.0534591674804688, 3.6493349075317383, 5.245210647583008, 6.841086387634277, 8.436962127685547, 10.032838821411133, 11.628714561462402, 13.224590301513672, 14.820466995239258, 16.416343688964844, 18.012218475341797, 19.608095169067383, 21.203969955444336, 22.799846649169922, 24.395721435546875, 25.99159812927246, 27.587474822998047, 29.183349609375, 30.779226303100586, 32.37510299682617, 33.970977783203125, 35.566856384277344, 37.1627311706543, 38.75860595703125, 40.35448455810547, 41.95035934448242, 43.546234130859375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 5.0, 7.0, 20.0, 15.0, 21.0, 34.0, 52.0, 72.0, 111.0, 174.0, 276.0, 498.0, 886.0, 1595.0, 3173.0, 6736.0, 15876.0, 43251.0, 157655.0, 1889351.0, 1845506.0, 157224.0, 42761.0, 15632.0, 6533.0, 3185.0, 1593.0, 784.0, 455.0, 281.0, 193.0, 123.0, 68.0, 42.0, 23.0, 20.0, 17.0, 15.0, 6.0, 5.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.8359375, -12.4793701171875, -12.122802734375, -11.7662353515625, -11.40966796875, -11.0531005859375, -10.696533203125, -10.3399658203125, -9.9833984375, -9.6268310546875, -9.270263671875, -8.9136962890625, -8.55712890625, -8.2005615234375, -7.843994140625, -7.4874267578125, -7.130859375, -6.7742919921875, -6.417724609375, -6.0611572265625, -5.70458984375, -5.3480224609375, -4.991455078125, -4.6348876953125, -4.2783203125, -3.9217529296875, -3.565185546875, -3.2086181640625, -2.85205078125, -2.4954833984375, -2.138916015625, -1.7823486328125, -1.42578125, -1.0692138671875, -0.712646484375, -0.3560791015625, 0.00048828125, 0.3570556640625, 0.713623046875, 1.0701904296875, 1.4267578125, 1.7833251953125, 2.139892578125, 2.4964599609375, 2.85302734375, 3.2095947265625, 3.566162109375, 3.9227294921875, 4.279296875, 4.6358642578125, 4.992431640625, 5.3489990234375, 5.70556640625, 6.0621337890625, 6.418701171875, 6.7752685546875, 7.1318359375, 7.4884033203125, 7.844970703125, 8.2015380859375, 8.55810546875, 8.9146728515625, 9.271240234375, 9.6278076171875, 9.984375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 9.0, 4.0, 13.0, 14.0, 20.0, 12.0, 18.0, 42.0, 37.0, 29.0, 27.0, 35.0, 53.0, 54.0, 62.0, 65.0, 64.0, 56.0, 62.0, 45.0, 40.0, 35.0, 38.0, 44.0, 16.0, 25.0, 12.0, 14.0, 11.0, 14.0, 5.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.013671875, -1.95428466796875, -1.8948974609375, -1.83551025390625, -1.776123046875, -1.71673583984375, -1.6573486328125, -1.59796142578125, -1.53857421875, -1.47918701171875, -1.4197998046875, -1.36041259765625, -1.301025390625, -1.24163818359375, -1.1822509765625, -1.12286376953125, -1.0634765625, -1.00408935546875, -0.9447021484375, -0.88531494140625, -0.825927734375, -0.76654052734375, -0.7071533203125, -0.64776611328125, -0.58837890625, -0.52899169921875, -0.4696044921875, -0.41021728515625, -0.350830078125, -0.29144287109375, -0.2320556640625, -0.17266845703125, -0.11328125, -0.05389404296875, 0.0054931640625, 0.06488037109375, 0.124267578125, 0.18365478515625, 0.2430419921875, 0.30242919921875, 0.36181640625, 0.42120361328125, 0.4805908203125, 0.53997802734375, 0.599365234375, 0.65875244140625, 0.7181396484375, 0.77752685546875, 0.8369140625, 0.89630126953125, 0.9556884765625, 1.01507568359375, 1.074462890625, 1.13385009765625, 1.1932373046875, 1.25262451171875, 1.31201171875, 1.37139892578125, 1.4307861328125, 1.49017333984375, 1.549560546875, 1.60894775390625, 1.6683349609375, 1.72772216796875, 1.787109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 10.0, 6.0, 16.0, 18.0, 12.0, 21.0, 35.0, 60.0, 69.0, 118.0, 215.0, 354.0, 600.0, 1062.0, 2406.0, 6875.0, 25685.0, 132507.0, 1690068.0, 2149963.0, 144573.0, 27174.0, 7183.0, 2493.0, 1081.0, 583.0, 362.0, 230.0, 144.0, 119.0, 58.0, 54.0, 38.0, 23.0, 17.0, 12.0, 8.0, 6.0, 8.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.9140625, -12.4691162109375, -12.024169921875, -11.5792236328125, -11.13427734375, -10.6893310546875, -10.244384765625, -9.7994384765625, -9.3544921875, -8.9095458984375, -8.464599609375, -8.0196533203125, -7.57470703125, -7.1297607421875, -6.684814453125, -6.2398681640625, -5.794921875, -5.3499755859375, -4.905029296875, -4.4600830078125, -4.01513671875, -3.5701904296875, -3.125244140625, -2.6802978515625, -2.2353515625, -1.7904052734375, -1.345458984375, -0.9005126953125, -0.45556640625, -0.0106201171875, 0.434326171875, 0.8792724609375, 1.32421875, 1.7691650390625, 2.214111328125, 2.6590576171875, 3.10400390625, 3.5489501953125, 3.993896484375, 4.4388427734375, 4.8837890625, 5.3287353515625, 5.773681640625, 6.2186279296875, 6.66357421875, 7.1085205078125, 7.553466796875, 7.9984130859375, 8.443359375, 8.8883056640625, 9.333251953125, 9.7781982421875, 10.22314453125, 10.6680908203125, 11.113037109375, 11.5579833984375, 12.0029296875, 12.4478759765625, 12.892822265625, 13.3377685546875, 13.78271484375, 14.2276611328125, 14.672607421875, 15.1175537109375, 15.5625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 11.0, 20.0, 20.0, 46.0, 65.0, 109.0, 186.0, 396.0, 989.0, 1270.0, 459.0, 208.0, 124.0, 68.0, 32.0, 28.0, 20.0, 7.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.234375, -5.0172119140625, -4.800048828125, -4.5828857421875, -4.36572265625, -4.1485595703125, -3.931396484375, -3.7142333984375, -3.4970703125, -3.2799072265625, -3.062744140625, -2.8455810546875, -2.62841796875, -2.4112548828125, -2.194091796875, -1.9769287109375, -1.759765625, -1.5426025390625, -1.325439453125, -1.1082763671875, -0.89111328125, -0.6739501953125, -0.456787109375, -0.2396240234375, -0.0224609375, 0.1947021484375, 0.411865234375, 0.6290283203125, 0.84619140625, 1.0633544921875, 1.280517578125, 1.4976806640625, 1.71484375, 1.9320068359375, 2.149169921875, 2.3663330078125, 2.58349609375, 2.8006591796875, 3.017822265625, 3.2349853515625, 3.4521484375, 3.6693115234375, 3.886474609375, 4.1036376953125, 4.32080078125, 4.5379638671875, 4.755126953125, 4.9722900390625, 5.189453125, 5.4066162109375, 5.623779296875, 5.8409423828125, 6.05810546875, 6.2752685546875, 6.492431640625, 6.7095947265625, 6.9267578125, 7.1439208984375, 7.361083984375, 7.5782470703125, 7.79541015625, 8.0125732421875, 8.229736328125, 8.4468994140625, 8.6640625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 17.0, 20.0, 31.0, 48.0, 72.0, 120.0, 133.0, 156.0, 154.0, 98.0, 63.0, 33.0, 26.0, 9.0, 3.0, 4.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.974544525146484, -38.56621551513672, -37.15789031982422, -35.74956512451172, -34.34123611450195, -32.93290710449219, -31.524581909179688, -30.116254806518555, -28.707927703857422, -27.29960060119629, -25.891273498535156, -24.482946395874023, -23.07461929321289, -21.666292190551758, -20.257965087890625, -18.849637985229492, -17.44131088256836, -16.032983779907227, -14.624656677246094, -13.216329574584961, -11.808002471923828, -10.399675369262695, -8.991348266601562, -7.58302116394043, -6.174694061279297, -4.766366958618164, -3.3580398559570312, -1.9497127532958984, -0.5413856506347656, 0.8669414520263672, 2.2752685546875, 3.683595657348633, 5.091926574707031, 6.500253677368164, 7.908580780029297, 9.31690788269043, 10.725234985351562, 12.133562088012695, 13.541889190673828, 14.950216293334961, 16.358543395996094, 17.766870498657227, 19.17519760131836, 20.583524703979492, 21.991851806640625, 23.400178909301758, 24.80850601196289, 26.216833114624023, 27.625160217285156, 29.03348731994629, 30.441814422607422, 31.850141525268555, 33.25846862792969, 34.66679382324219, 36.07512283325195, 37.48345184326172, 38.89177703857422, 40.30010223388672, 41.708431243896484, 43.11676025390625, 44.52508544921875, 45.93341064453125, 47.341739654541016, 48.75006866455078, 50.15839385986328]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 2.0, 7.0, 8.0, 5.0, 13.0, 14.0, 15.0, 18.0, 14.0, 17.0, 32.0, 28.0, 34.0, 42.0, 35.0, 53.0, 31.0, 43.0, 32.0, 55.0, 42.0, 60.0, 55.0, 40.0, 39.0, 30.0, 33.0, 30.0, 28.0, 20.0, 19.0, 23.0, 13.0, 16.0, 12.0, 8.0, 8.0, 10.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.589323043823242, -16.017658233642578, -15.44599437713623, -14.874330520629883, -14.302665710449219, -13.731000900268555, -13.159337043762207, -12.58767318725586, -12.016008377075195, -11.444343566894531, -10.872679710388184, -10.301015853881836, -9.729351043701172, -9.157686233520508, -8.58602237701416, -8.014358520507812, -7.442693710327148, -6.871029376983643, -6.299365043640137, -5.727700710296631, -5.156036376953125, -4.584372043609619, -4.012707710266113, -3.4410433769226074, -2.8693790435791016, -2.2977147102355957, -1.7260503768920898, -1.154386043548584, -0.5827217102050781, -0.011057376861572266, 0.5606069564819336, 1.1322712898254395, 1.7039375305175781, 2.275601863861084, 2.84726619720459, 3.4189305305480957, 3.9905948638916016, 4.562259197235107, 5.133923530578613, 5.705587863922119, 6.277252197265625, 6.848916530609131, 7.420580863952637, 7.992245197296143, 8.563909530639648, 9.135574340820312, 9.70723819732666, 10.278902053833008, 10.850566864013672, 11.422231674194336, 11.993895530700684, 12.565559387207031, 13.137224197387695, 13.70888900756836, 14.280552864074707, 14.852216720581055, 15.423881530761719, 15.995546340942383, 16.567211151123047, 17.138874053955078, 17.710538864135742, 18.282203674316406, 18.853866577148438, 19.4255313873291, 19.997196197509766]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 8.0, 12.0, 25.0, 36.0, 69.0, 97.0, 180.0, 325.0, 644.0, 1231.0, 2746.0, 6725.0, 17982.0, 51486.0, 150126.0, 388346.0, 278851.0, 96531.0, 32949.0, 11659.0, 4592.0, 1908.0, 904.0, 502.0, 260.0, 138.0, 78.0, 48.0, 31.0, 28.0, 13.0, 5.0, 10.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.1640625, -13.80810546875, -13.4521484375, -13.09619140625, -12.740234375, -12.38427734375, -12.0283203125, -11.67236328125, -11.31640625, -10.96044921875, -10.6044921875, -10.24853515625, -9.892578125, -9.53662109375, -9.1806640625, -8.82470703125, -8.46875, -8.11279296875, -7.7568359375, -7.40087890625, -7.044921875, -6.68896484375, -6.3330078125, -5.97705078125, -5.62109375, -5.26513671875, -4.9091796875, -4.55322265625, -4.197265625, -3.84130859375, -3.4853515625, -3.12939453125, -2.7734375, -2.41748046875, -2.0615234375, -1.70556640625, -1.349609375, -0.99365234375, -0.6376953125, -0.28173828125, 0.07421875, 0.43017578125, 0.7861328125, 1.14208984375, 1.498046875, 1.85400390625, 2.2099609375, 2.56591796875, 2.921875, 3.27783203125, 3.6337890625, 3.98974609375, 4.345703125, 4.70166015625, 5.0576171875, 5.41357421875, 5.76953125, 6.12548828125, 6.4814453125, 6.83740234375, 7.193359375, 7.54931640625, 7.9052734375, 8.26123046875, 8.6171875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 8.0, 9.0, 7.0, 11.0, 14.0, 14.0, 17.0, 22.0, 24.0, 35.0, 34.0, 45.0, 38.0, 54.0, 56.0, 47.0, 48.0, 53.0, 58.0, 43.0, 53.0, 52.0, 41.0, 41.0, 22.0, 26.0, 23.0, 19.0, 22.0, 15.0, 10.0, 8.0, 4.0, 5.0, 1.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6806640625, -1.6247711181640625, -1.568878173828125, -1.5129852294921875, -1.45709228515625, -1.4011993408203125, -1.345306396484375, -1.2894134521484375, -1.2335205078125, -1.1776275634765625, -1.121734619140625, -1.0658416748046875, -1.00994873046875, -0.9540557861328125, -0.898162841796875, -0.8422698974609375, -0.786376953125, -0.7304840087890625, -0.674591064453125, -0.6186981201171875, -0.56280517578125, -0.5069122314453125, -0.451019287109375, -0.3951263427734375, -0.3392333984375, -0.2833404541015625, -0.227447509765625, -0.1715545654296875, -0.11566162109375, -0.0597686767578125, -0.003875732421875, 0.0520172119140625, 0.10791015625, 0.1638031005859375, 0.219696044921875, 0.2755889892578125, 0.33148193359375, 0.3873748779296875, 0.443267822265625, 0.4991607666015625, 0.5550537109375, 0.6109466552734375, 0.666839599609375, 0.7227325439453125, 0.77862548828125, 0.8345184326171875, 0.890411376953125, 0.9463043212890625, 1.002197265625, 1.0580902099609375, 1.113983154296875, 1.1698760986328125, 1.22576904296875, 1.2816619873046875, 1.337554931640625, 1.3934478759765625, 1.4493408203125, 1.5052337646484375, 1.561126708984375, 1.6170196533203125, 1.67291259765625, 1.7288055419921875, 1.784698486328125, 1.8405914306640625, 1.896484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 8.0, 7.0, 8.0, 16.0, 20.0, 23.0, 41.0, 40.0, 65.0, 79.0, 120.0, 156.0, 265.0, 407.0, 639.0, 1025.0, 1996.0, 4000.0, 8615.0, 20133.0, 49137.0, 117932.0, 273958.0, 317045.0, 146545.0, 60440.0, 25108.0, 10564.0, 4616.0, 2287.0, 1186.0, 754.0, 426.0, 265.0, 194.0, 122.0, 94.0, 49.0, 42.0, 37.0, 34.0, 17.0, 12.0, 11.0, 10.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.24609375, -7.0205078125, -6.794921875, -6.5693359375, -6.34375, -6.1181640625, -5.892578125, -5.6669921875, -5.44140625, -5.2158203125, -4.990234375, -4.7646484375, -4.5390625, -4.3134765625, -4.087890625, -3.8623046875, -3.63671875, -3.4111328125, -3.185546875, -2.9599609375, -2.734375, -2.5087890625, -2.283203125, -2.0576171875, -1.83203125, -1.6064453125, -1.380859375, -1.1552734375, -0.9296875, -0.7041015625, -0.478515625, -0.2529296875, -0.02734375, 0.1982421875, 0.423828125, 0.6494140625, 0.875, 1.1005859375, 1.326171875, 1.5517578125, 1.77734375, 2.0029296875, 2.228515625, 2.4541015625, 2.6796875, 2.9052734375, 3.130859375, 3.3564453125, 3.58203125, 3.8076171875, 4.033203125, 4.2587890625, 4.484375, 4.7099609375, 4.935546875, 5.1611328125, 5.38671875, 5.6123046875, 5.837890625, 6.0634765625, 6.2890625, 6.5146484375, 6.740234375, 6.9658203125, 7.19140625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 3.0, 3.0, 8.0, 8.0, 10.0, 15.0, 19.0, 17.0, 29.0, 25.0, 30.0, 35.0, 44.0, 30.0, 39.0, 50.0, 46.0, 44.0, 46.0, 45.0, 46.0, 45.0, 46.0, 44.0, 37.0, 41.0, 34.0, 33.0, 23.0, 24.0, 16.0, 14.0, 12.0, 5.0, 12.0, 6.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0], "bins": [-8.4453125, -8.20184326171875, -7.9583740234375, -7.71490478515625, -7.471435546875, -7.22796630859375, -6.9844970703125, -6.74102783203125, -6.49755859375, -6.25408935546875, -6.0106201171875, -5.76715087890625, -5.523681640625, -5.28021240234375, -5.0367431640625, -4.79327392578125, -4.5498046875, -4.30633544921875, -4.0628662109375, -3.81939697265625, -3.575927734375, -3.33245849609375, -3.0889892578125, -2.84552001953125, -2.60205078125, -2.35858154296875, -2.1151123046875, -1.87164306640625, -1.628173828125, -1.38470458984375, -1.1412353515625, -0.89776611328125, -0.654296875, -0.41082763671875, -0.1673583984375, 0.07611083984375, 0.319580078125, 0.56304931640625, 0.8065185546875, 1.04998779296875, 1.29345703125, 1.53692626953125, 1.7803955078125, 2.02386474609375, 2.267333984375, 2.51080322265625, 2.7542724609375, 2.99774169921875, 3.2412109375, 3.48468017578125, 3.7281494140625, 3.97161865234375, 4.215087890625, 4.45855712890625, 4.7020263671875, 4.94549560546875, 5.18896484375, 5.43243408203125, 5.6759033203125, 5.91937255859375, 6.162841796875, 6.40631103515625, 6.6497802734375, 6.89324951171875, 7.13671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 6.0, 16.0, 11.0, 15.0, 28.0, 31.0, 51.0, 61.0, 90.0, 131.0, 189.0, 335.0, 513.0, 883.0, 1681.0, 3164.0, 6885.0, 15546.0, 39867.0, 108398.0, 286047.0, 347353.0, 146058.0, 53318.0, 20671.0, 8580.0, 3901.0, 1991.0, 1003.0, 604.0, 371.0, 253.0, 160.0, 111.0, 60.0, 60.0, 31.0, 20.0, 23.0, 9.0, 6.0, 9.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.982421875, -3.862274169921875, -3.74212646484375, -3.621978759765625, -3.5018310546875, -3.381683349609375, -3.26153564453125, -3.141387939453125, -3.021240234375, -2.901092529296875, -2.78094482421875, -2.660797119140625, -2.5406494140625, -2.420501708984375, -2.30035400390625, -2.180206298828125, -2.06005859375, -1.939910888671875, -1.81976318359375, -1.699615478515625, -1.5794677734375, -1.459320068359375, -1.33917236328125, -1.219024658203125, -1.098876953125, -0.978729248046875, -0.85858154296875, -0.738433837890625, -0.6182861328125, -0.498138427734375, -0.37799072265625, -0.257843017578125, -0.1376953125, -0.017547607421875, 0.10260009765625, 0.222747802734375, 0.3428955078125, 0.463043212890625, 0.58319091796875, 0.703338623046875, 0.823486328125, 0.943634033203125, 1.06378173828125, 1.183929443359375, 1.3040771484375, 1.424224853515625, 1.54437255859375, 1.664520263671875, 1.78466796875, 1.904815673828125, 2.02496337890625, 2.145111083984375, 2.2652587890625, 2.385406494140625, 2.50555419921875, 2.625701904296875, 2.745849609375, 2.865997314453125, 2.98614501953125, 3.106292724609375, 3.2264404296875, 3.346588134765625, 3.46673583984375, 3.586883544921875, 3.70703125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 7.0, 16.0, 12.0, 27.0, 22.0, 33.0, 45.0, 59.0, 102.0, 130.0, 148.0, 103.0, 75.0, 34.0, 34.0, 28.0, 29.0, 16.0, 11.0, 13.0, 8.0, 8.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00084686279296875, -0.0008221343159675598, -0.0007974058389663696, -0.0007726773619651794, -0.0007479488849639893, -0.0007232204079627991, -0.0006984919309616089, -0.0006737634539604187, -0.0006490349769592285, -0.0006243064999580383, -0.0005995780229568481, -0.000574849545955658, -0.0005501210689544678, -0.0005253925919532776, -0.0005006641149520874, -0.0004759356379508972, -0.00045120716094970703, -0.00042647868394851685, -0.00040175020694732666, -0.0003770217299461365, -0.0003522932529449463, -0.0003275647759437561, -0.0003028362989425659, -0.00027810782194137573, -0.00025337934494018555, -0.00022865086793899536, -0.00020392239093780518, -0.000179193913936615, -0.0001544654369354248, -0.00012973695993423462, -0.00010500848293304443, -8.028000593185425e-05, -5.555152893066406e-05, -3.082305192947388e-05, -6.094574928283691e-06, 1.8633902072906494e-05, 4.336237907409668e-05, 6.809085607528687e-05, 9.281933307647705e-05, 0.00011754781007766724, 0.00014227628707885742, 0.0001670047640800476, 0.0001917332410812378, 0.00021646171808242798, 0.00024119019508361816, 0.00026591867208480835, 0.00029064714908599854, 0.0003153756260871887, 0.0003401041030883789, 0.0003648325800895691, 0.0003895610570907593, 0.00041428953409194946, 0.00043901801109313965, 0.00046374648809432983, 0.00048847496509552, 0.0005132034420967102, 0.0005379319190979004, 0.0005626603960990906, 0.0005873888731002808, 0.000612117350101471, 0.0006368458271026611, 0.0006615743041038513, 0.0006863027811050415, 0.0007110312581062317, 0.0007357597351074219]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 7.0, 7.0, 16.0, 11.0, 26.0, 25.0, 44.0, 54.0, 89.0, 135.0, 240.0, 361.0, 592.0, 1066.0, 1820.0, 3710.0, 8037.0, 20179.0, 58492.0, 188818.0, 416795.0, 231820.0, 72578.0, 24580.0, 9592.0, 4209.0, 2230.0, 1215.0, 678.0, 373.0, 237.0, 156.0, 96.0, 79.0, 48.0, 39.0, 25.0, 21.0, 17.0, 10.0, 7.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.53125, -4.3878173828125, -4.244384765625, -4.1009521484375, -3.95751953125, -3.8140869140625, -3.670654296875, -3.5272216796875, -3.3837890625, -3.2403564453125, -3.096923828125, -2.9534912109375, -2.81005859375, -2.6666259765625, -2.523193359375, -2.3797607421875, -2.236328125, -2.0928955078125, -1.949462890625, -1.8060302734375, -1.66259765625, -1.5191650390625, -1.375732421875, -1.2322998046875, -1.0888671875, -0.9454345703125, -0.802001953125, -0.6585693359375, -0.51513671875, -0.3717041015625, -0.228271484375, -0.0848388671875, 0.05859375, 0.2020263671875, 0.345458984375, 0.4888916015625, 0.63232421875, 0.7757568359375, 0.919189453125, 1.0626220703125, 1.2060546875, 1.3494873046875, 1.492919921875, 1.6363525390625, 1.77978515625, 1.9232177734375, 2.066650390625, 2.2100830078125, 2.353515625, 2.4969482421875, 2.640380859375, 2.7838134765625, 2.92724609375, 3.0706787109375, 3.214111328125, 3.3575439453125, 3.5009765625, 3.6444091796875, 3.787841796875, 3.9312744140625, 4.07470703125, 4.2181396484375, 4.361572265625, 4.5050048828125, 4.6484375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 10.0, 12.0, 14.0, 23.0, 24.0, 20.0, 20.0, 36.0, 55.0, 53.0, 77.0, 89.0, 79.0, 90.0, 84.0, 62.0, 60.0, 48.0, 33.0, 26.0, 24.0, 16.0, 12.0, 8.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.07421875, -4.940765380859375, -4.80731201171875, -4.673858642578125, -4.5404052734375, -4.406951904296875, -4.27349853515625, -4.140045166015625, -4.006591796875, -3.873138427734375, -3.73968505859375, -3.606231689453125, -3.4727783203125, -3.339324951171875, -3.20587158203125, -3.072418212890625, -2.93896484375, -2.805511474609375, -2.67205810546875, -2.538604736328125, -2.4051513671875, -2.271697998046875, -2.13824462890625, -2.004791259765625, -1.871337890625, -1.737884521484375, -1.60443115234375, -1.470977783203125, -1.3375244140625, -1.204071044921875, -1.07061767578125, -0.937164306640625, -0.8037109375, -0.670257568359375, -0.53680419921875, -0.403350830078125, -0.2698974609375, -0.136444091796875, -0.00299072265625, 0.130462646484375, 0.263916015625, 0.397369384765625, 0.53082275390625, 0.664276123046875, 0.7977294921875, 0.931182861328125, 1.06463623046875, 1.198089599609375, 1.33154296875, 1.464996337890625, 1.59844970703125, 1.731903076171875, 1.8653564453125, 1.998809814453125, 2.13226318359375, 2.265716552734375, 2.399169921875, 2.532623291015625, 2.66607666015625, 2.799530029296875, 2.9329833984375, 3.066436767578125, 3.19989013671875, 3.333343505859375, 3.466796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 9.0, 10.0, 15.0, 31.0, 38.0, 46.0, 80.0, 82.0, 105.0, 109.0, 106.0, 108.0, 66.0, 67.0, 37.0, 37.0, 16.0, 11.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.15516662597656, -63.38795471191406, -61.62074661254883, -59.85353469848633, -58.086326599121094, -56.319114685058594, -54.551902770996094, -52.78469467163086, -51.01748275756836, -49.25027084350586, -47.483062744140625, -45.715850830078125, -43.94864273071289, -42.18143081665039, -40.414222717285156, -38.647010803222656, -36.879798889160156, -35.112586975097656, -33.34537887573242, -31.578166961669922, -29.810956954956055, -28.043746948242188, -26.27653694152832, -24.509326934814453, -22.74211883544922, -20.97490882873535, -19.207698822021484, -17.440486907958984, -15.673276901245117, -13.90606689453125, -12.138856887817383, -10.3716459274292, -8.604434967041016, -6.83722448348999, -5.070013999938965, -3.3028039932250977, -1.5355935096740723, 0.23161697387695312, 1.9988269805908203, 3.766037940979004, 5.533247947692871, 7.3004584312438965, 9.067668914794922, 10.834878921508789, 12.602088928222656, 14.36929988861084, 16.13650894165039, 17.90372085571289, 19.670930862426758, 21.438140869140625, 23.205350875854492, 24.97256088256836, 26.73977279663086, 28.506982803344727, 30.274192810058594, 32.041404724121094, 33.80861282348633, 35.57582473754883, 37.34303283691406, 39.11024475097656, 40.8774528503418, 42.6446647644043, 44.41187286376953, 46.17908477783203, 47.94629669189453]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 2.0, 4.0, 9.0, 8.0, 6.0, 9.0, 11.0, 17.0, 20.0, 15.0, 24.0, 29.0, 34.0, 27.0, 34.0, 33.0, 39.0, 35.0, 44.0, 35.0, 46.0, 39.0, 36.0, 42.0, 33.0, 38.0, 32.0, 30.0, 34.0, 28.0, 34.0, 17.0, 20.0, 20.0, 21.0, 17.0, 14.0, 14.0, 10.0, 6.0, 11.0, 7.0, 5.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.24681854248047, -32.092681884765625, -30.938547134399414, -29.784412384033203, -28.63027572631836, -27.476139068603516, -26.322004318237305, -25.167869567871094, -24.01373291015625, -22.859596252441406, -21.705461502075195, -20.551326751708984, -19.39719009399414, -18.243053436279297, -17.088918685913086, -15.934782981872559, -14.780647277832031, -13.626511573791504, -12.472375869750977, -11.31824016571045, -10.164104461669922, -9.009968757629395, -7.855833053588867, -6.70169734954834, -5.5475616455078125, -4.393425941467285, -3.239290237426758, -2.0851545333862305, -0.9310188293457031, 0.22311687469482422, 1.3772525787353516, 2.531388282775879, 3.685527801513672, 4.839663505554199, 5.993799209594727, 7.147934913635254, 8.302070617675781, 9.456206321716309, 10.610342025756836, 11.764477729797363, 12.91861343383789, 14.072749137878418, 15.226884841918945, 16.381019592285156, 17.53515625, 18.689292907714844, 19.843427658081055, 20.997562408447266, 22.15169906616211, 23.305835723876953, 24.459970474243164, 25.614105224609375, 26.76824188232422, 27.922378540039062, 29.076513290405273, 30.230648040771484, 31.384784698486328, 32.53892135620117, 33.69305419921875, 34.847190856933594, 36.00132751464844, 37.15546417236328, 38.309600830078125, 39.4637336730957, 40.61787033081055]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 3.0, 7.0, 11.0, 14.0, 17.0, 22.0, 46.0, 58.0, 63.0, 105.0, 140.0, 248.0, 335.0, 558.0, 901.0, 1477.0, 2442.0, 4428.0, 8619.0, 18928.0, 50633.0, 196520.0, 3246779.0, 520062.0, 86979.0, 28487.0, 12065.0, 5995.0, 3132.0, 1889.0, 1202.0, 669.0, 439.0, 315.0, 196.0, 136.0, 99.0, 64.0, 46.0, 35.0, 24.0, 21.0, 15.0, 15.0, 13.0, 5.0, 4.0, 0.0, 1.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-8.640625, -8.3499755859375, -8.059326171875, -7.7686767578125, -7.47802734375, -7.1873779296875, -6.896728515625, -6.6060791015625, -6.3154296875, -6.0247802734375, -5.734130859375, -5.4434814453125, -5.15283203125, -4.8621826171875, -4.571533203125, -4.2808837890625, -3.990234375, -3.6995849609375, -3.408935546875, -3.1182861328125, -2.82763671875, -2.5369873046875, -2.246337890625, -1.9556884765625, -1.6650390625, -1.3743896484375, -1.083740234375, -0.7930908203125, -0.50244140625, -0.2117919921875, 0.078857421875, 0.3695068359375, 0.66015625, 0.9508056640625, 1.241455078125, 1.5321044921875, 1.82275390625, 2.1134033203125, 2.404052734375, 2.6947021484375, 2.9853515625, 3.2760009765625, 3.566650390625, 3.8572998046875, 4.14794921875, 4.4385986328125, 4.729248046875, 5.0198974609375, 5.310546875, 5.6011962890625, 5.891845703125, 6.1824951171875, 6.47314453125, 6.7637939453125, 7.054443359375, 7.3450927734375, 7.6357421875, 7.9263916015625, 8.217041015625, 8.5076904296875, 8.79833984375, 9.0889892578125, 9.379638671875, 9.6702880859375, 9.9609375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 1.0, 3.0, 5.0, 8.0, 6.0, 8.0, 13.0, 15.0, 15.0, 22.0, 26.0, 31.0, 30.0, 30.0, 32.0, 53.0, 50.0, 50.0, 56.0, 46.0, 49.0, 57.0, 52.0, 49.0, 40.0, 30.0, 40.0, 37.0, 22.0, 21.0, 19.0, 16.0, 13.0, 16.0, 12.0, 7.0, 4.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.67578125, -1.6198272705078125, -1.563873291015625, -1.5079193115234375, -1.45196533203125, -1.3960113525390625, -1.340057373046875, -1.2841033935546875, -1.2281494140625, -1.1721954345703125, -1.116241455078125, -1.0602874755859375, -1.00433349609375, -0.9483795166015625, -0.892425537109375, -0.8364715576171875, -0.780517578125, -0.7245635986328125, -0.668609619140625, -0.6126556396484375, -0.55670166015625, -0.5007476806640625, -0.444793701171875, -0.3888397216796875, -0.3328857421875, -0.2769317626953125, -0.220977783203125, -0.1650238037109375, -0.10906982421875, -0.0531158447265625, 0.002838134765625, 0.0587921142578125, 0.11474609375, 0.1707000732421875, 0.226654052734375, 0.2826080322265625, 0.33856201171875, 0.3945159912109375, 0.450469970703125, 0.5064239501953125, 0.5623779296875, 0.6183319091796875, 0.674285888671875, 0.7302398681640625, 0.78619384765625, 0.8421478271484375, 0.898101806640625, 0.9540557861328125, 1.010009765625, 1.0659637451171875, 1.121917724609375, 1.1778717041015625, 1.23382568359375, 1.2897796630859375, 1.345733642578125, 1.4016876220703125, 1.4576416015625, 1.5135955810546875, 1.569549560546875, 1.6255035400390625, 1.68145751953125, 1.7374114990234375, 1.793365478515625, 1.8493194580078125, 1.9052734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 5.0, 8.0, 5.0, 7.0, 10.0, 16.0, 15.0, 27.0, 24.0, 36.0, 48.0, 54.0, 80.0, 115.0, 261.0, 635.0, 1764.0, 5655.0, 22868.0, 131629.0, 3098176.0, 841639.0, 71412.0, 13894.0, 3571.0, 1200.0, 485.0, 239.0, 114.0, 73.0, 63.0, 41.0, 21.0, 24.0, 20.0, 14.0, 3.0, 8.0, 5.0, 1.0, 5.0, 5.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.3359375, -11.8929443359375, -11.449951171875, -11.0069580078125, -10.56396484375, -10.1209716796875, -9.677978515625, -9.2349853515625, -8.7919921875, -8.3489990234375, -7.906005859375, -7.4630126953125, -7.02001953125, -6.5770263671875, -6.134033203125, -5.6910400390625, -5.248046875, -4.8050537109375, -4.362060546875, -3.9190673828125, -3.47607421875, -3.0330810546875, -2.590087890625, -2.1470947265625, -1.7041015625, -1.2611083984375, -0.818115234375, -0.3751220703125, 0.06787109375, 0.5108642578125, 0.953857421875, 1.3968505859375, 1.83984375, 2.2828369140625, 2.725830078125, 3.1688232421875, 3.61181640625, 4.0548095703125, 4.497802734375, 4.9407958984375, 5.3837890625, 5.8267822265625, 6.269775390625, 6.7127685546875, 7.15576171875, 7.5987548828125, 8.041748046875, 8.4847412109375, 8.927734375, 9.3707275390625, 9.813720703125, 10.2567138671875, 10.69970703125, 11.1427001953125, 11.585693359375, 12.0286865234375, 12.4716796875, 12.9146728515625, 13.357666015625, 13.8006591796875, 14.24365234375, 14.6866455078125, 15.129638671875, 15.5726318359375, 16.015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 11.0, 7.0, 10.0, 16.0, 28.0, 52.0, 90.0, 152.0, 303.0, 1026.0, 1641.0, 398.0, 148.0, 92.0, 44.0, 25.0, 17.0, 10.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.58984375, -7.39569091796875, -7.2015380859375, -7.00738525390625, -6.813232421875, -6.61907958984375, -6.4249267578125, -6.23077392578125, -6.03662109375, -5.84246826171875, -5.6483154296875, -5.45416259765625, -5.260009765625, -5.06585693359375, -4.8717041015625, -4.67755126953125, -4.4833984375, -4.28924560546875, -4.0950927734375, -3.90093994140625, -3.706787109375, -3.51263427734375, -3.3184814453125, -3.12432861328125, -2.93017578125, -2.73602294921875, -2.5418701171875, -2.34771728515625, -2.153564453125, -1.95941162109375, -1.7652587890625, -1.57110595703125, -1.376953125, -1.18280029296875, -0.9886474609375, -0.79449462890625, -0.600341796875, -0.40618896484375, -0.2120361328125, -0.01788330078125, 0.17626953125, 0.37042236328125, 0.5645751953125, 0.75872802734375, 0.952880859375, 1.14703369140625, 1.3411865234375, 1.53533935546875, 1.7294921875, 1.92364501953125, 2.1177978515625, 2.31195068359375, 2.506103515625, 2.70025634765625, 2.8944091796875, 3.08856201171875, 3.28271484375, 3.47686767578125, 3.6710205078125, 3.86517333984375, 4.059326171875, 4.25347900390625, 4.4476318359375, 4.64178466796875, 4.8359375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 15.0, 30.0, 46.0, 76.0, 104.0, 141.0, 141.0, 136.0, 110.0, 74.0, 53.0, 34.0, 8.0, 13.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.1578369140625, -34.22833251953125, -33.298828125, -32.369327545166016, -31.439823150634766, -30.510318756103516, -29.580814361572266, -28.651309967041016, -27.7218074798584, -26.79230308532715, -25.86280059814453, -24.93329620361328, -24.00379180908203, -23.074289321899414, -22.144784927368164, -21.215282440185547, -20.285778045654297, -19.356273651123047, -18.42677116394043, -17.49726676940918, -16.567764282226562, -15.638259887695312, -14.708755493164062, -13.779252052307129, -12.849748611450195, -11.920245170593262, -10.990741729736328, -10.061237335205078, -9.131733894348145, -8.202230453491211, -7.272726535797119, -6.343222618103027, -5.413719177246094, -4.48421573638916, -3.5547118186950684, -2.6252081394195557, -1.695704460144043, -0.7662010192871094, 0.16330289840698242, 1.0928068161010742, 2.022310256958008, 2.9518139362335205, 3.881317615509033, 4.810821533203125, 5.740324974060059, 6.669828414916992, 7.599332332611084, 8.528836250305176, 9.45833969116211, 10.387843132019043, 11.317346572875977, 12.246850967407227, 13.17635440826416, 14.105857849121094, 15.035362243652344, 15.964865684509277, 16.89436912536621, 17.82387351989746, 18.753376007080078, 19.682880401611328, 20.612384796142578, 21.541887283325195, 22.471391677856445, 23.400894165039062, 24.330398559570312]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 9.0, 9.0, 9.0, 18.0, 23.0, 31.0, 39.0, 34.0, 46.0, 38.0, 45.0, 40.0, 55.0, 53.0, 54.0, 40.0, 65.0, 52.0, 54.0, 42.0, 47.0, 33.0, 35.0, 32.0, 23.0, 18.0, 10.0, 14.0, 11.0, 7.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.483598709106445, -18.97551155090332, -18.467424392700195, -17.95933723449707, -17.451250076293945, -16.94316291809082, -16.435075759887695, -15.92698860168457, -15.418901443481445, -14.91081428527832, -14.402727127075195, -13.89463996887207, -13.386552810668945, -12.87846565246582, -12.370378494262695, -11.86229133605957, -11.354205131530762, -10.846117973327637, -10.338030815124512, -9.829943656921387, -9.321856498718262, -8.813769340515137, -8.305683135986328, -7.797595500946045, -7.28950834274292, -6.781421184539795, -6.27333402633667, -5.765247344970703, -5.257160186767578, -4.749073028564453, -4.240985870361328, -3.732898712158203, -3.2248125076293945, -2.7167253494262695, -2.2086381912231445, -1.7005512714385986, -1.1924641132354736, -0.6843769550323486, -0.17629003524780273, 0.33179712295532227, 0.8398842811584473, 1.3479714393615723, 1.8560584783554077, 2.364145517349243, 2.872232675552368, 3.380319833755493, 3.888406753540039, 4.396493911743164, 4.904581069946289, 5.412668228149414, 5.920755386352539, 6.428842544555664, 6.936929702758789, 7.445016860961914, 7.953103542327881, 8.461191177368164, 8.969278335571289, 9.477365493774414, 9.985452651977539, 10.493539810180664, 11.001626968383789, 11.509714126586914, 12.017801284790039, 12.525888442993164, 13.033974647521973]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 8.0, 6.0, 32.0, 44.0, 59.0, 118.0, 211.0, 417.0, 724.0, 1474.0, 3367.0, 9005.0, 25506.0, 80244.0, 255167.0, 423416.0, 167964.0, 52592.0, 17155.0, 6146.0, 2503.0, 1110.0, 576.0, 281.0, 156.0, 100.0, 65.0, 38.0, 29.0, 17.0, 10.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1640625, -11.775634765625, -11.38720703125, -10.998779296875, -10.6103515625, -10.221923828125, -9.83349609375, -9.445068359375, -9.056640625, -8.668212890625, -8.27978515625, -7.891357421875, -7.5029296875, -7.114501953125, -6.72607421875, -6.337646484375, -5.94921875, -5.560791015625, -5.17236328125, -4.783935546875, -4.3955078125, -4.007080078125, -3.61865234375, -3.230224609375, -2.841796875, -2.453369140625, -2.06494140625, -1.676513671875, -1.2880859375, -0.899658203125, -0.51123046875, -0.122802734375, 0.265625, 0.654052734375, 1.04248046875, 1.430908203125, 1.8193359375, 2.207763671875, 2.59619140625, 2.984619140625, 3.373046875, 3.761474609375, 4.14990234375, 4.538330078125, 4.9267578125, 5.315185546875, 5.70361328125, 6.092041015625, 6.48046875, 6.868896484375, 7.25732421875, 7.645751953125, 8.0341796875, 8.422607421875, 8.81103515625, 9.199462890625, 9.587890625, 9.976318359375, 10.36474609375, 10.753173828125, 11.1416015625, 11.530029296875, 11.91845703125, 12.306884765625, 12.6953125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 5.0, 8.0, 13.0, 17.0, 16.0, 27.0, 20.0, 22.0, 30.0, 40.0, 43.0, 38.0, 50.0, 52.0, 47.0, 54.0, 57.0, 58.0, 38.0, 59.0, 53.0, 26.0, 28.0, 33.0, 16.0, 26.0, 24.0, 12.0, 13.0, 12.0, 14.0, 10.0, 5.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.662109375, -1.6068115234375, -1.551513671875, -1.4962158203125, -1.44091796875, -1.3856201171875, -1.330322265625, -1.2750244140625, -1.2197265625, -1.1644287109375, -1.109130859375, -1.0538330078125, -0.99853515625, -0.9432373046875, -0.887939453125, -0.8326416015625, -0.77734375, -0.7220458984375, -0.666748046875, -0.6114501953125, -0.55615234375, -0.5008544921875, -0.445556640625, -0.3902587890625, -0.3349609375, -0.2796630859375, -0.224365234375, -0.1690673828125, -0.11376953125, -0.0584716796875, -0.003173828125, 0.0521240234375, 0.107421875, 0.1627197265625, 0.218017578125, 0.2733154296875, 0.32861328125, 0.3839111328125, 0.439208984375, 0.4945068359375, 0.5498046875, 0.6051025390625, 0.660400390625, 0.7156982421875, 0.77099609375, 0.8262939453125, 0.881591796875, 0.9368896484375, 0.9921875, 1.0474853515625, 1.102783203125, 1.1580810546875, 1.21337890625, 1.2686767578125, 1.323974609375, 1.3792724609375, 1.4345703125, 1.4898681640625, 1.545166015625, 1.6004638671875, 1.65576171875, 1.7110595703125, 1.766357421875, 1.8216552734375, 1.876953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 11.0, 15.0, 13.0, 14.0, 35.0, 45.0, 51.0, 77.0, 93.0, 126.0, 179.0, 224.0, 335.0, 557.0, 1054.0, 2069.0, 5115.0, 14131.0, 45575.0, 152977.0, 404537.0, 287158.0, 90903.0, 27261.0, 8877.0, 3373.0, 1496.0, 752.0, 438.0, 297.0, 196.0, 154.0, 118.0, 78.0, 53.0, 37.0, 38.0, 27.0, 28.0, 9.0, 15.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.58984375, -7.30645751953125, -7.0230712890625, -6.73968505859375, -6.456298828125, -6.17291259765625, -5.8895263671875, -5.60614013671875, -5.32275390625, -5.03936767578125, -4.7559814453125, -4.47259521484375, -4.189208984375, -3.90582275390625, -3.6224365234375, -3.33905029296875, -3.0556640625, -2.77227783203125, -2.4888916015625, -2.20550537109375, -1.922119140625, -1.63873291015625, -1.3553466796875, -1.07196044921875, -0.78857421875, -0.50518798828125, -0.2218017578125, 0.06158447265625, 0.344970703125, 0.62835693359375, 0.9117431640625, 1.19512939453125, 1.478515625, 1.76190185546875, 2.0452880859375, 2.32867431640625, 2.612060546875, 2.89544677734375, 3.1788330078125, 3.46221923828125, 3.74560546875, 4.02899169921875, 4.3123779296875, 4.59576416015625, 4.879150390625, 5.16253662109375, 5.4459228515625, 5.72930908203125, 6.0126953125, 6.29608154296875, 6.5794677734375, 6.86285400390625, 7.146240234375, 7.42962646484375, 7.7130126953125, 7.99639892578125, 8.27978515625, 8.56317138671875, 8.8465576171875, 9.12994384765625, 9.413330078125, 9.69671630859375, 9.9801025390625, 10.26348876953125, 10.546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 6.0, 5.0, 10.0, 9.0, 6.0, 6.0, 10.0, 9.0, 11.0, 12.0, 15.0, 16.0, 26.0, 29.0, 34.0, 30.0, 21.0, 26.0, 34.0, 36.0, 39.0, 51.0, 43.0, 41.0, 37.0, 42.0, 40.0, 30.0, 39.0, 29.0, 30.0, 20.0, 25.0, 27.0, 15.0, 20.0, 7.0, 25.0, 15.0, 16.0, 12.0, 4.0, 3.0, 11.0, 8.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-6.23828125, -6.0538330078125, -5.869384765625, -5.6849365234375, -5.50048828125, -5.3160400390625, -5.131591796875, -4.9471435546875, -4.7626953125, -4.5782470703125, -4.393798828125, -4.2093505859375, -4.02490234375, -3.8404541015625, -3.656005859375, -3.4715576171875, -3.287109375, -3.1026611328125, -2.918212890625, -2.7337646484375, -2.54931640625, -2.3648681640625, -2.180419921875, -1.9959716796875, -1.8115234375, -1.6270751953125, -1.442626953125, -1.2581787109375, -1.07373046875, -0.8892822265625, -0.704833984375, -0.5203857421875, -0.3359375, -0.1514892578125, 0.032958984375, 0.2174072265625, 0.40185546875, 0.5863037109375, 0.770751953125, 0.9552001953125, 1.1396484375, 1.3240966796875, 1.508544921875, 1.6929931640625, 1.87744140625, 2.0618896484375, 2.246337890625, 2.4307861328125, 2.615234375, 2.7996826171875, 2.984130859375, 3.1685791015625, 3.35302734375, 3.5374755859375, 3.721923828125, 3.9063720703125, 4.0908203125, 4.2752685546875, 4.459716796875, 4.6441650390625, 4.82861328125, 5.0130615234375, 5.197509765625, 5.3819580078125, 5.56640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 3.0, 7.0, 11.0, 14.0, 26.0, 34.0, 47.0, 60.0, 142.0, 251.0, 479.0, 920.0, 1964.0, 4926.0, 14872.0, 60206.0, 348255.0, 496320.0, 88784.0, 20093.0, 6408.0, 2335.0, 1124.0, 561.0, 302.0, 146.0, 82.0, 63.0, 37.0, 18.0, 14.0, 10.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.65234375, -7.4344482421875, -7.216552734375, -6.9986572265625, -6.78076171875, -6.5628662109375, -6.344970703125, -6.1270751953125, -5.9091796875, -5.6912841796875, -5.473388671875, -5.2554931640625, -5.03759765625, -4.8197021484375, -4.601806640625, -4.3839111328125, -4.166015625, -3.9481201171875, -3.730224609375, -3.5123291015625, -3.29443359375, -3.0765380859375, -2.858642578125, -2.6407470703125, -2.4228515625, -2.2049560546875, -1.987060546875, -1.7691650390625, -1.55126953125, -1.3333740234375, -1.115478515625, -0.8975830078125, -0.6796875, -0.4617919921875, -0.243896484375, -0.0260009765625, 0.19189453125, 0.4097900390625, 0.627685546875, 0.8455810546875, 1.0634765625, 1.2813720703125, 1.499267578125, 1.7171630859375, 1.93505859375, 2.1529541015625, 2.370849609375, 2.5887451171875, 2.806640625, 3.0245361328125, 3.242431640625, 3.4603271484375, 3.67822265625, 3.8961181640625, 4.114013671875, 4.3319091796875, 4.5498046875, 4.7677001953125, 4.985595703125, 5.2034912109375, 5.42138671875, 5.6392822265625, 5.857177734375, 6.0750732421875, 6.29296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 4.0, 2.0, 4.0, 6.0, 4.0, 5.0, 15.0, 14.0, 16.0, 21.0, 23.0, 19.0, 46.0, 48.0, 63.0, 99.0, 115.0, 118.0, 77.0, 65.0, 47.0, 25.0, 36.0, 22.0, 20.0, 13.0, 14.0, 9.0, 9.0, 6.0, 12.0, 3.0, 2.0, 2.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007076263427734375, -0.0006838887929916382, -0.0006601512432098389, -0.0006364136934280396, -0.0006126761436462402, -0.0005889385938644409, -0.0005652010440826416, -0.0005414634943008423, -0.000517725944519043, -0.0004939883947372437, -0.00047025084495544434, -0.000446513295173645, -0.0004227757453918457, -0.0003990381956100464, -0.00037530064582824707, -0.00035156309604644775, -0.00032782554626464844, -0.0003040879964828491, -0.0002803504467010498, -0.0002566128969192505, -0.00023287534713745117, -0.00020913779735565186, -0.00018540024757385254, -0.00016166269779205322, -0.0001379251480102539, -0.00011418759822845459, -9.045004844665527e-05, -6.671249866485596e-05, -4.297494888305664e-05, -1.9237399101257324e-05, 4.500150680541992e-06, 2.823770046234131e-05, 5.1975250244140625e-05, 7.571280002593994e-05, 9.945034980773926e-05, 0.00012318789958953857, 0.0001469254493713379, 0.0001706629991531372, 0.00019440054893493652, 0.00021813809871673584, 0.00024187564849853516, 0.00026561319828033447, 0.0002893507480621338, 0.0003130882978439331, 0.0003368258476257324, 0.00036056339740753174, 0.00038430094718933105, 0.00040803849697113037, 0.0004317760467529297, 0.000455513596534729, 0.0004792511463165283, 0.0005029886960983276, 0.000526726245880127, 0.0005504637956619263, 0.0005742013454437256, 0.0005979388952255249, 0.0006216764450073242, 0.0006454139947891235, 0.0006691515445709229, 0.0006928890943527222, 0.0007166266441345215, 0.0007403641939163208, 0.0007641017436981201, 0.0007878392934799194, 0.0008115768432617188]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 0.0, 6.0, 9.0, 7.0, 11.0, 15.0, 17.0, 26.0, 39.0, 73.0, 133.0, 178.0, 369.0, 687.0, 1380.0, 3723.0, 12357.0, 66040.0, 614306.0, 302259.0, 34307.0, 7503.0, 2653.0, 1146.0, 591.0, 302.0, 145.0, 107.0, 44.0, 37.0, 23.0, 11.0, 9.0, 7.0, 8.0, 3.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.515625, -8.2095947265625, -7.903564453125, -7.5975341796875, -7.29150390625, -6.9854736328125, -6.679443359375, -6.3734130859375, -6.0673828125, -5.7613525390625, -5.455322265625, -5.1492919921875, -4.84326171875, -4.5372314453125, -4.231201171875, -3.9251708984375, -3.619140625, -3.3131103515625, -3.007080078125, -2.7010498046875, -2.39501953125, -2.0889892578125, -1.782958984375, -1.4769287109375, -1.1708984375, -0.8648681640625, -0.558837890625, -0.2528076171875, 0.05322265625, 0.3592529296875, 0.665283203125, 0.9713134765625, 1.27734375, 1.5833740234375, 1.889404296875, 2.1954345703125, 2.50146484375, 2.8074951171875, 3.113525390625, 3.4195556640625, 3.7255859375, 4.0316162109375, 4.337646484375, 4.6436767578125, 4.94970703125, 5.2557373046875, 5.561767578125, 5.8677978515625, 6.173828125, 6.4798583984375, 6.785888671875, 7.0919189453125, 7.39794921875, 7.7039794921875, 8.010009765625, 8.3160400390625, 8.6220703125, 8.9281005859375, 9.234130859375, 9.5401611328125, 9.84619140625, 10.1522216796875, 10.458251953125, 10.7642822265625, 11.0703125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 8.0, 8.0, 11.0, 23.0, 33.0, 37.0, 57.0, 82.0, 125.0, 148.0, 117.0, 114.0, 80.0, 35.0, 31.0, 27.0, 14.0, 13.0, 11.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.14453125, -6.9388427734375, -6.733154296875, -6.5274658203125, -6.32177734375, -6.1160888671875, -5.910400390625, -5.7047119140625, -5.4990234375, -5.2933349609375, -5.087646484375, -4.8819580078125, -4.67626953125, -4.4705810546875, -4.264892578125, -4.0592041015625, -3.853515625, -3.6478271484375, -3.442138671875, -3.2364501953125, -3.03076171875, -2.8250732421875, -2.619384765625, -2.4136962890625, -2.2080078125, -2.0023193359375, -1.796630859375, -1.5909423828125, -1.38525390625, -1.1795654296875, -0.973876953125, -0.7681884765625, -0.5625, -0.3568115234375, -0.151123046875, 0.0545654296875, 0.26025390625, 0.4659423828125, 0.671630859375, 0.8773193359375, 1.0830078125, 1.2886962890625, 1.494384765625, 1.7000732421875, 1.90576171875, 2.1114501953125, 2.317138671875, 2.5228271484375, 2.728515625, 2.9342041015625, 3.139892578125, 3.3455810546875, 3.55126953125, 3.7569580078125, 3.962646484375, 4.1683349609375, 4.3740234375, 4.5797119140625, 4.785400390625, 4.9910888671875, 5.19677734375, 5.4024658203125, 5.608154296875, 5.8138427734375, 6.01953125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 19.0, 54.0, 127.0, 215.0, 218.0, 191.0, 89.0, 38.0, 22.0, 11.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.28690338134766, -106.39412689208984, -102.5013427734375, -98.60856628417969, -94.71578216552734, -90.82300567626953, -86.93022155761719, -83.03744506835938, -79.14466857910156, -75.25189208984375, -71.3591079711914, -67.4663314819336, -63.57354736328125, -59.68077087402344, -55.78799057006836, -51.89521026611328, -48.00242614746094, -44.10964584350586, -40.21686553955078, -36.32408905029297, -32.431304931640625, -28.53852653503418, -24.645748138427734, -20.752967834472656, -16.860187530517578, -12.9674072265625, -9.074627876281738, -5.181848526000977, -1.2890682220458984, 2.6037120819091797, 6.496490478515625, 10.389270782470703, 14.282058715820312, 18.17483901977539, 22.06761932373047, 25.960397720336914, 29.853178024291992, 33.74595642089844, 37.638736724853516, 41.531517028808594, 45.42429733276367, 49.31707763671875, 53.20985794067383, 57.102638244628906, 60.99541473388672, 64.88819885253906, 68.78097534179688, 72.67375183105469, 76.56653594970703, 80.45931243896484, 84.35209655761719, 88.244873046875, 92.13765716552734, 96.03043365478516, 99.9232177734375, 103.81599426269531, 107.70877075195312, 111.60154724121094, 115.49433135986328, 119.3871078491211, 123.27989196777344, 127.17266845703125, 131.06544494628906, 134.95822143554688, 138.85101318359375]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 2.0, 8.0, 9.0, 13.0, 14.0, 14.0, 20.0, 30.0, 18.0, 22.0, 27.0, 29.0, 26.0, 41.0, 36.0, 34.0, 47.0, 30.0, 36.0, 36.0, 54.0, 38.0, 36.0, 29.0, 34.0, 32.0, 28.0, 25.0, 26.0, 25.0, 24.0, 19.0, 28.0, 18.0, 13.0, 10.0, 10.0, 5.0, 9.0, 5.0, 10.0, 2.0, 5.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0], "bins": [-32.232086181640625, -31.216745376586914, -30.20140266418457, -29.18606185913086, -28.17072105407715, -27.155380249023438, -26.140037536621094, -25.124696731567383, -24.109355926513672, -23.09401512145996, -22.078672409057617, -21.063331604003906, -20.047990798950195, -19.032649993896484, -18.01730728149414, -17.00196647644043, -15.986623764038086, -14.971282005310059, -13.955941200256348, -12.94059944152832, -11.92525863647461, -10.909916877746582, -9.894575119018555, -8.879234313964844, -7.863892555236816, -6.848551273345947, -5.833209991455078, -4.817868232727051, -3.8025269508361816, -2.7871856689453125, -1.7718439102172852, -0.756502628326416, 0.2588386535644531, 1.2741800546646118, 2.2895214557647705, 3.3048629760742188, 4.320204257965088, 5.335545539855957, 6.350887298583984, 7.3662285804748535, 8.381569862365723, 9.39691162109375, 10.412252426147461, 11.427594184875488, 12.442935943603516, 13.458276748657227, 14.473618507385254, 15.488960266113281, 16.504301071166992, 17.519641876220703, 18.534984588623047, 19.550325393676758, 20.56566619873047, 21.581008911132812, 22.596349716186523, 23.611690521240234, 24.627033233642578, 25.64237403869629, 26.657716751098633, 27.673057556152344, 28.688398361206055, 29.703739166259766, 30.71908187866211, 31.73442268371582, 32.74976348876953]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 8.0, 7.0, 13.0, 16.0, 30.0, 33.0, 40.0, 66.0, 109.0, 152.0, 213.0, 290.0, 512.0, 705.0, 1219.0, 1996.0, 3675.0, 7423.0, 15352.0, 39644.0, 138888.0, 1448404.0, 2307405.0, 152852.0, 41890.0, 16195.0, 7458.0, 3819.0, 2158.0, 1287.0, 816.0, 532.0, 341.0, 216.0, 148.0, 104.0, 74.0, 52.0, 40.0, 27.0, 16.0, 13.0, 11.0, 8.0, 14.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.5078125, -9.201416015625, -8.89501953125, -8.588623046875, -8.2822265625, -7.975830078125, -7.66943359375, -7.363037109375, -7.056640625, -6.750244140625, -6.44384765625, -6.137451171875, -5.8310546875, -5.524658203125, -5.21826171875, -4.911865234375, -4.60546875, -4.299072265625, -3.99267578125, -3.686279296875, -3.3798828125, -3.073486328125, -2.76708984375, -2.460693359375, -2.154296875, -1.847900390625, -1.54150390625, -1.235107421875, -0.9287109375, -0.622314453125, -0.31591796875, -0.009521484375, 0.296875, 0.603271484375, 0.90966796875, 1.216064453125, 1.5224609375, 1.828857421875, 2.13525390625, 2.441650390625, 2.748046875, 3.054443359375, 3.36083984375, 3.667236328125, 3.9736328125, 4.280029296875, 4.58642578125, 4.892822265625, 5.19921875, 5.505615234375, 5.81201171875, 6.118408203125, 6.4248046875, 6.731201171875, 7.03759765625, 7.343994140625, 7.650390625, 7.956787109375, 8.26318359375, 8.569580078125, 8.8759765625, 9.182373046875, 9.48876953125, 9.795166015625, 10.1015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 3.0, 10.0, 4.0, 4.0, 11.0, 15.0, 11.0, 18.0, 18.0, 30.0, 36.0, 39.0, 44.0, 48.0, 51.0, 46.0, 68.0, 41.0, 61.0, 53.0, 49.0, 55.0, 32.0, 37.0, 41.0, 35.0, 20.0, 25.0, 17.0, 14.0, 17.0, 10.0, 10.0, 4.0, 3.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8251953125, -1.766265869140625, -1.70733642578125, -1.648406982421875, -1.5894775390625, -1.530548095703125, -1.47161865234375, -1.412689208984375, -1.353759765625, -1.294830322265625, -1.23590087890625, -1.176971435546875, -1.1180419921875, -1.059112548828125, -1.00018310546875, -0.941253662109375, -0.88232421875, -0.823394775390625, -0.76446533203125, -0.705535888671875, -0.6466064453125, -0.587677001953125, -0.52874755859375, -0.469818115234375, -0.410888671875, -0.351959228515625, -0.29302978515625, -0.234100341796875, -0.1751708984375, -0.116241455078125, -0.05731201171875, 0.001617431640625, 0.060546875, 0.119476318359375, 0.17840576171875, 0.237335205078125, 0.2962646484375, 0.355194091796875, 0.41412353515625, 0.473052978515625, 0.531982421875, 0.590911865234375, 0.64984130859375, 0.708770751953125, 0.7677001953125, 0.826629638671875, 0.88555908203125, 0.944488525390625, 1.00341796875, 1.062347412109375, 1.12127685546875, 1.180206298828125, 1.2391357421875, 1.298065185546875, 1.35699462890625, 1.415924072265625, 1.474853515625, 1.533782958984375, 1.59271240234375, 1.651641845703125, 1.7105712890625, 1.769500732421875, 1.82843017578125, 1.887359619140625, 1.9462890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 8.0, 9.0, 3.0, 19.0, 16.0, 41.0, 51.0, 88.0, 109.0, 206.0, 307.0, 569.0, 1137.0, 2476.0, 5722.0, 16424.0, 55370.0, 260046.0, 2930399.0, 762927.0, 111972.0, 29282.0, 9588.0, 3884.0, 1668.0, 794.0, 419.0, 253.0, 166.0, 94.0, 73.0, 40.0, 44.0, 22.0, 19.0, 11.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.7734375, -9.465576171875, -9.15771484375, -8.849853515625, -8.5419921875, -8.234130859375, -7.92626953125, -7.618408203125, -7.310546875, -7.002685546875, -6.69482421875, -6.386962890625, -6.0791015625, -5.771240234375, -5.46337890625, -5.155517578125, -4.84765625, -4.539794921875, -4.23193359375, -3.924072265625, -3.6162109375, -3.308349609375, -3.00048828125, -2.692626953125, -2.384765625, -2.076904296875, -1.76904296875, -1.461181640625, -1.1533203125, -0.845458984375, -0.53759765625, -0.229736328125, 0.078125, 0.385986328125, 0.69384765625, 1.001708984375, 1.3095703125, 1.617431640625, 1.92529296875, 2.233154296875, 2.541015625, 2.848876953125, 3.15673828125, 3.464599609375, 3.7724609375, 4.080322265625, 4.38818359375, 4.696044921875, 5.00390625, 5.311767578125, 5.61962890625, 5.927490234375, 6.2353515625, 6.543212890625, 6.85107421875, 7.158935546875, 7.466796875, 7.774658203125, 8.08251953125, 8.390380859375, 8.6982421875, 9.006103515625, 9.31396484375, 9.621826171875, 9.9296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 4.0, 13.0, 9.0, 10.0, 27.0, 37.0, 62.0, 95.0, 185.0, 382.0, 1125.0, 1231.0, 413.0, 193.0, 98.0, 57.0, 49.0, 27.0, 22.0, 8.0, 12.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2265625, -5.04010009765625, -4.8536376953125, -4.66717529296875, -4.480712890625, -4.29425048828125, -4.1077880859375, -3.92132568359375, -3.73486328125, -3.54840087890625, -3.3619384765625, -3.17547607421875, -2.989013671875, -2.80255126953125, -2.6160888671875, -2.42962646484375, -2.2431640625, -2.05670166015625, -1.8702392578125, -1.68377685546875, -1.497314453125, -1.31085205078125, -1.1243896484375, -0.93792724609375, -0.75146484375, -0.56500244140625, -0.3785400390625, -0.19207763671875, -0.005615234375, 0.18084716796875, 0.3673095703125, 0.55377197265625, 0.740234375, 0.92669677734375, 1.1131591796875, 1.29962158203125, 1.486083984375, 1.67254638671875, 1.8590087890625, 2.04547119140625, 2.23193359375, 2.41839599609375, 2.6048583984375, 2.79132080078125, 2.977783203125, 3.16424560546875, 3.3507080078125, 3.53717041015625, 3.7236328125, 3.91009521484375, 4.0965576171875, 4.28302001953125, 4.469482421875, 4.65594482421875, 4.8424072265625, 5.02886962890625, 5.21533203125, 5.40179443359375, 5.5882568359375, 5.77471923828125, 5.961181640625, 6.14764404296875, 6.3341064453125, 6.52056884765625, 6.70703125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 11.0, 8.0, 19.0, 46.0, 73.0, 120.0, 170.0, 184.0, 137.0, 93.0, 64.0, 37.0, 20.0, 9.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.404075622558594, -60.989295959472656, -59.57451248168945, -58.15972900390625, -56.74494934082031, -55.330169677734375, -53.91538619995117, -52.50060272216797, -51.08582305908203, -49.671043395996094, -48.25625991821289, -46.84147644042969, -45.42669677734375, -44.01191711425781, -42.59713363647461, -41.182350158691406, -39.76757049560547, -38.35279083251953, -36.93800735473633, -35.523223876953125, -34.10844421386719, -32.69366455078125, -31.278881072998047, -29.864099502563477, -28.449317932128906, -27.034536361694336, -25.619754791259766, -24.204973220825195, -22.790191650390625, -21.375410079956055, -19.960628509521484, -18.545846939086914, -17.131061553955078, -15.716279983520508, -14.301498413085938, -12.886716842651367, -11.471935272216797, -10.057153701782227, -8.642372131347656, -7.227590560913086, -5.812808990478516, -4.398027420043945, -2.983245849609375, -1.5684642791748047, -0.15368270874023438, 1.261098861694336, 2.6758804321289062, 4.090662002563477, 5.505443572998047, 6.920225143432617, 8.335006713867188, 9.749788284301758, 11.164569854736328, 12.579351425170898, 13.994132995605469, 15.408914566040039, 16.82369613647461, 18.23847770690918, 19.65325927734375, 21.06804084777832, 22.48282241821289, 23.89760398864746, 25.31238555908203, 26.7271671295166, 28.141948699951172]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 10.0, 19.0, 17.0, 11.0, 18.0, 27.0, 25.0, 39.0, 35.0, 42.0, 60.0, 56.0, 50.0, 61.0, 59.0, 53.0, 43.0, 47.0, 41.0, 44.0, 39.0, 43.0, 30.0, 23.0, 24.0, 12.0, 12.0, 16.0, 11.0, 6.0, 11.0, 1.0, 3.0, 7.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.431673049926758, -22.79859161376953, -22.165510177612305, -21.532428741455078, -20.899349212646484, -20.266267776489258, -19.63318634033203, -19.000104904174805, -18.367023468017578, -17.73394203186035, -17.100860595703125, -16.4677791595459, -15.834698677062988, -15.201617240905762, -14.568536758422852, -13.935455322265625, -13.302373886108398, -12.669292449951172, -12.036211013793945, -11.403130531311035, -10.770049095153809, -10.136967658996582, -9.503887176513672, -8.870805740356445, -8.237724304199219, -7.604642868041992, -6.971561908721924, -6.3384809494018555, -5.705399513244629, -5.072318077087402, -4.439237117767334, -3.8061561584472656, -3.173074722290039, -2.5399935245513916, -1.9069123268127441, -1.2738311290740967, -0.6407499313354492, -0.007668733596801758, 0.6254124641418457, 1.258493423461914, 1.8915748596191406, 2.524656057357788, 3.1577372550964355, 3.790818452835083, 4.4238996505737305, 5.056981086730957, 5.690062046051025, 6.323143005371094, 6.95622444152832, 7.589305877685547, 8.222387313842773, 8.855467796325684, 9.48854923248291, 10.121630668640137, 10.754711151123047, 11.387792587280273, 12.0208740234375, 12.653955459594727, 13.287036895751953, 13.920117378234863, 14.55319881439209, 15.186280250549316, 15.819360733032227, 16.452442169189453, 17.08552360534668]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 6.0, 11.0, 15.0, 20.0, 28.0, 42.0, 65.0, 93.0, 174.0, 257.0, 430.0, 831.0, 1576.0, 3087.0, 6709.0, 16127.0, 40776.0, 121133.0, 504450.0, 241195.0, 67518.0, 24984.0, 10014.0, 4350.0, 2057.0, 1107.0, 601.0, 366.0, 203.0, 113.0, 74.0, 49.0, 19.0, 20.0, 17.0, 19.0, 8.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.578125, -8.244873046875, -7.91162109375, -7.578369140625, -7.2451171875, -6.911865234375, -6.57861328125, -6.245361328125, -5.912109375, -5.578857421875, -5.24560546875, -4.912353515625, -4.5791015625, -4.245849609375, -3.91259765625, -3.579345703125, -3.24609375, -2.912841796875, -2.57958984375, -2.246337890625, -1.9130859375, -1.579833984375, -1.24658203125, -0.913330078125, -0.580078125, -0.246826171875, 0.08642578125, 0.419677734375, 0.7529296875, 1.086181640625, 1.41943359375, 1.752685546875, 2.0859375, 2.419189453125, 2.75244140625, 3.085693359375, 3.4189453125, 3.752197265625, 4.08544921875, 4.418701171875, 4.751953125, 5.085205078125, 5.41845703125, 5.751708984375, 6.0849609375, 6.418212890625, 6.75146484375, 7.084716796875, 7.41796875, 7.751220703125, 8.08447265625, 8.417724609375, 8.7509765625, 9.084228515625, 9.41748046875, 9.750732421875, 10.083984375, 10.417236328125, 10.75048828125, 11.083740234375, 11.4169921875, 11.750244140625, 12.08349609375, 12.416748046875, 12.75]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 9.0, 10.0, 13.0, 24.0, 21.0, 35.0, 30.0, 34.0, 61.0, 55.0, 56.0, 61.0, 63.0, 57.0, 58.0, 57.0, 62.0, 36.0, 39.0, 38.0, 41.0, 20.0, 24.0, 19.0, 17.0, 14.0, 6.0, 6.0, 7.0, 3.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.888519287109375, -1.82196044921875, -1.755401611328125, -1.6888427734375, -1.622283935546875, -1.55572509765625, -1.489166259765625, -1.422607421875, -1.356048583984375, -1.28948974609375, -1.222930908203125, -1.1563720703125, -1.089813232421875, -1.02325439453125, -0.956695556640625, -0.89013671875, -0.823577880859375, -0.75701904296875, -0.690460205078125, -0.6239013671875, -0.557342529296875, -0.49078369140625, -0.424224853515625, -0.357666015625, -0.291107177734375, -0.22454833984375, -0.157989501953125, -0.0914306640625, -0.024871826171875, 0.04168701171875, 0.108245849609375, 0.1748046875, 0.241363525390625, 0.30792236328125, 0.374481201171875, 0.4410400390625, 0.507598876953125, 0.57415771484375, 0.640716552734375, 0.707275390625, 0.773834228515625, 0.84039306640625, 0.906951904296875, 0.9735107421875, 1.040069580078125, 1.10662841796875, 1.173187255859375, 1.23974609375, 1.306304931640625, 1.37286376953125, 1.439422607421875, 1.5059814453125, 1.572540283203125, 1.63909912109375, 1.705657958984375, 1.772216796875, 1.838775634765625, 1.90533447265625, 1.971893310546875, 2.0384521484375, 2.105010986328125, 2.17156982421875, 2.238128662109375, 2.3046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 9.0, 9.0, 13.0, 22.0, 25.0, 25.0, 44.0, 73.0, 96.0, 107.0, 175.0, 280.0, 425.0, 811.0, 1691.0, 4735.0, 16285.0, 66500.0, 354950.0, 487204.0, 84732.0, 20413.0, 5745.0, 1967.0, 865.0, 459.0, 257.0, 207.0, 125.0, 91.0, 59.0, 42.0, 29.0, 22.0, 17.0, 10.0, 7.0, 9.0, 1.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-12.125, -11.7794189453125, -11.433837890625, -11.0882568359375, -10.74267578125, -10.3970947265625, -10.051513671875, -9.7059326171875, -9.3603515625, -9.0147705078125, -8.669189453125, -8.3236083984375, -7.97802734375, -7.6324462890625, -7.286865234375, -6.9412841796875, -6.595703125, -6.2501220703125, -5.904541015625, -5.5589599609375, -5.21337890625, -4.8677978515625, -4.522216796875, -4.1766357421875, -3.8310546875, -3.4854736328125, -3.139892578125, -2.7943115234375, -2.44873046875, -2.1031494140625, -1.757568359375, -1.4119873046875, -1.06640625, -0.7208251953125, -0.375244140625, -0.0296630859375, 0.31591796875, 0.6614990234375, 1.007080078125, 1.3526611328125, 1.6982421875, 2.0438232421875, 2.389404296875, 2.7349853515625, 3.08056640625, 3.4261474609375, 3.771728515625, 4.1173095703125, 4.462890625, 4.8084716796875, 5.154052734375, 5.4996337890625, 5.84521484375, 6.1907958984375, 6.536376953125, 6.8819580078125, 7.2275390625, 7.5731201171875, 7.918701171875, 8.2642822265625, 8.60986328125, 8.9554443359375, 9.301025390625, 9.6466064453125, 9.9921875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 6.0, 10.0, 10.0, 12.0, 19.0, 22.0, 23.0, 18.0, 31.0, 34.0, 49.0, 31.0, 47.0, 39.0, 48.0, 51.0, 45.0, 44.0, 52.0, 48.0, 31.0, 49.0, 50.0, 47.0, 39.0, 24.0, 23.0, 16.0, 16.0, 13.0, 17.0, 7.0, 13.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.11865234375, -7.8701171875, -7.62158203125, -7.373046875, -7.12451171875, -6.8759765625, -6.62744140625, -6.37890625, -6.13037109375, -5.8818359375, -5.63330078125, -5.384765625, -5.13623046875, -4.8876953125, -4.63916015625, -4.390625, -4.14208984375, -3.8935546875, -3.64501953125, -3.396484375, -3.14794921875, -2.8994140625, -2.65087890625, -2.40234375, -2.15380859375, -1.9052734375, -1.65673828125, -1.408203125, -1.15966796875, -0.9111328125, -0.66259765625, -0.4140625, -0.16552734375, 0.0830078125, 0.33154296875, 0.580078125, 0.82861328125, 1.0771484375, 1.32568359375, 1.57421875, 1.82275390625, 2.0712890625, 2.31982421875, 2.568359375, 2.81689453125, 3.0654296875, 3.31396484375, 3.5625, 3.81103515625, 4.0595703125, 4.30810546875, 4.556640625, 4.80517578125, 5.0537109375, 5.30224609375, 5.55078125, 5.79931640625, 6.0478515625, 6.29638671875, 6.544921875, 6.79345703125, 7.0419921875, 7.29052734375, 7.5390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 9.0, 13.0, 7.0, 27.0, 40.0, 47.0, 115.0, 199.0, 445.0, 1179.0, 4266.0, 23192.0, 191657.0, 741442.0, 71036.0, 10980.0, 2487.0, 750.0, 300.0, 157.0, 80.0, 43.0, 21.0, 22.0, 14.0, 12.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.015625, -9.7396240234375, -9.463623046875, -9.1876220703125, -8.91162109375, -8.6356201171875, -8.359619140625, -8.0836181640625, -7.8076171875, -7.5316162109375, -7.255615234375, -6.9796142578125, -6.70361328125, -6.4276123046875, -6.151611328125, -5.8756103515625, -5.599609375, -5.3236083984375, -5.047607421875, -4.7716064453125, -4.49560546875, -4.2196044921875, -3.943603515625, -3.6676025390625, -3.3916015625, -3.1156005859375, -2.839599609375, -2.5635986328125, -2.28759765625, -2.0115966796875, -1.735595703125, -1.4595947265625, -1.18359375, -0.9075927734375, -0.631591796875, -0.3555908203125, -0.07958984375, 0.1964111328125, 0.472412109375, 0.7484130859375, 1.0244140625, 1.3004150390625, 1.576416015625, 1.8524169921875, 2.12841796875, 2.4044189453125, 2.680419921875, 2.9564208984375, 3.232421875, 3.5084228515625, 3.784423828125, 4.0604248046875, 4.33642578125, 4.6124267578125, 4.888427734375, 5.1644287109375, 5.4404296875, 5.7164306640625, 5.992431640625, 6.2684326171875, 6.54443359375, 6.8204345703125, 7.096435546875, 7.3724365234375, 7.6484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 9.0, 6.0, 16.0, 6.0, 10.0, 9.0, 20.0, 15.0, 19.0, 23.0, 29.0, 66.0, 168.0, 221.0, 118.0, 51.0, 34.0, 25.0, 24.0, 19.0, 14.0, 16.0, 17.0, 18.0, 10.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007333755493164062, -0.0007106810808181763, -0.0006879866123199463, -0.0006652921438217163, -0.0006425976753234863, -0.0006199032068252563, -0.0005972087383270264, -0.0005745142698287964, -0.0005518198013305664, -0.0005291253328323364, -0.0005064308643341064, -0.00048373639583587646, -0.0004610419273376465, -0.0004383474588394165, -0.0004156529903411865, -0.00039295852184295654, -0.00037026405334472656, -0.0003475695848464966, -0.0003248751163482666, -0.0003021806478500366, -0.00027948617935180664, -0.00025679171085357666, -0.00023409724235534668, -0.0002114027738571167, -0.00018870830535888672, -0.00016601383686065674, -0.00014331936836242676, -0.00012062489986419678, -9.79304313659668e-05, -7.523596286773682e-05, -5.2541494369506836e-05, -2.9847025871276855e-05, -7.152557373046875e-06, 1.5541911125183105e-05, 3.8236379623413086e-05, 6.0930848121643066e-05, 8.362531661987305e-05, 0.00010631978511810303, 0.000129014253616333, 0.000151708722114563, 0.00017440319061279297, 0.00019709765911102295, 0.00021979212760925293, 0.0002424865961074829, 0.0002651810646057129, 0.00028787553310394287, 0.00031057000160217285, 0.00033326447010040283, 0.0003559589385986328, 0.0003786534070968628, 0.0004013478755950928, 0.00042404234409332275, 0.00044673681259155273, 0.0004694312810897827, 0.0004921257495880127, 0.0005148202180862427, 0.0005375146865844727, 0.0005602091550827026, 0.0005829036235809326, 0.0006055980920791626, 0.0006282925605773926, 0.0006509870290756226, 0.0006736814975738525, 0.0006963759660720825, 0.0007190704345703125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 14.0, 11.0, 16.0, 30.0, 32.0, 70.0, 86.0, 164.0, 285.0, 483.0, 992.0, 2500.0, 8375.0, 43579.0, 427824.0, 501678.0, 48472.0, 9051.0, 2540.0, 1075.0, 536.0, 290.0, 168.0, 71.0, 70.0, 37.0, 25.0, 17.0, 12.0, 8.0, 7.0, 4.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-10.4140625, -10.1328125, -9.8515625, -9.5703125, -9.2890625, -9.0078125, -8.7265625, -8.4453125, -8.1640625, -7.8828125, -7.6015625, -7.3203125, -7.0390625, -6.7578125, -6.4765625, -6.1953125, -5.9140625, -5.6328125, -5.3515625, -5.0703125, -4.7890625, -4.5078125, -4.2265625, -3.9453125, -3.6640625, -3.3828125, -3.1015625, -2.8203125, -2.5390625, -2.2578125, -1.9765625, -1.6953125, -1.4140625, -1.1328125, -0.8515625, -0.5703125, -0.2890625, -0.0078125, 0.2734375, 0.5546875, 0.8359375, 1.1171875, 1.3984375, 1.6796875, 1.9609375, 2.2421875, 2.5234375, 2.8046875, 3.0859375, 3.3671875, 3.6484375, 3.9296875, 4.2109375, 4.4921875, 4.7734375, 5.0546875, 5.3359375, 5.6171875, 5.8984375, 6.1796875, 6.4609375, 6.7421875, 7.0234375, 7.3046875, 7.5859375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 6.0, 6.0, 3.0, 7.0, 9.0, 11.0, 10.0, 19.0, 23.0, 33.0, 36.0, 58.0, 80.0, 95.0, 106.0, 127.0, 100.0, 63.0, 49.0, 33.0, 28.0, 21.0, 14.0, 21.0, 12.0, 8.0, 10.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33203125, -5.18798828125, -5.0439453125, -4.89990234375, -4.755859375, -4.61181640625, -4.4677734375, -4.32373046875, -4.1796875, -4.03564453125, -3.8916015625, -3.74755859375, -3.603515625, -3.45947265625, -3.3154296875, -3.17138671875, -3.02734375, -2.88330078125, -2.7392578125, -2.59521484375, -2.451171875, -2.30712890625, -2.1630859375, -2.01904296875, -1.875, -1.73095703125, -1.5869140625, -1.44287109375, -1.298828125, -1.15478515625, -1.0107421875, -0.86669921875, -0.72265625, -0.57861328125, -0.4345703125, -0.29052734375, -0.146484375, -0.00244140625, 0.1416015625, 0.28564453125, 0.4296875, 0.57373046875, 0.7177734375, 0.86181640625, 1.005859375, 1.14990234375, 1.2939453125, 1.43798828125, 1.58203125, 1.72607421875, 1.8701171875, 2.01416015625, 2.158203125, 2.30224609375, 2.4462890625, 2.59033203125, 2.734375, 2.87841796875, 3.0224609375, 3.16650390625, 3.310546875, 3.45458984375, 3.5986328125, 3.74267578125, 3.88671875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 31.0, 145.0, 360.0, 303.0, 118.0, 28.0, 6.0, 2.0, 1.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.74913024902344, -107.72673034667969, -101.70433044433594, -95.68193054199219, -89.65953063964844, -83.63713073730469, -77.61473846435547, -71.59233856201172, -65.56993865966797, -59.54753875732422, -53.52513885498047, -47.502742767333984, -41.480342864990234, -35.457942962646484, -29.435546875, -23.41314697265625, -17.3907470703125, -11.368348121643066, -5.345949172973633, 0.6764488220214844, 6.698848724365234, 12.721248626708984, 18.74364471435547, 24.76604461669922, 30.78844451904297, 36.81084442138672, 42.83324432373047, 48.85564041137695, 54.8780403137207, 60.90044021606445, 66.92283630371094, 72.94523620605469, 78.96762084960938, 84.99002075195312, 91.01242065429688, 97.03482055664062, 103.05722045898438, 109.07962036132812, 115.10201263427734, 121.1244125366211, 127.14681243896484, 133.16920471191406, 139.1916046142578, 145.21400451660156, 151.2364044189453, 157.25880432128906, 163.2812042236328, 169.30360412597656, 175.3260040283203, 181.34840393066406, 187.3708038330078, 193.39320373535156, 199.4156036376953, 205.43800354003906, 211.46038818359375, 217.4827880859375, 223.50518798828125, 229.527587890625, 235.54998779296875, 241.5723876953125, 247.59478759765625, 253.6171875, 259.63958740234375, 265.6619873046875, 271.68438720703125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 9.0, 3.0, 8.0, 12.0, 19.0, 16.0, 14.0, 21.0, 24.0, 29.0, 27.0, 24.0, 34.0, 34.0, 34.0, 31.0, 37.0, 40.0, 34.0, 40.0, 36.0, 37.0, 32.0, 30.0, 31.0, 34.0, 38.0, 31.0, 40.0, 23.0, 21.0, 27.0, 18.0, 22.0, 12.0, 11.0, 14.0, 8.0, 5.0, 4.0, 10.0, 2.0, 6.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0], "bins": [-35.04864501953125, -34.04417037963867, -33.03969192504883, -32.03521728515625, -31.03074073791504, -30.026264190673828, -29.02178955078125, -28.01731300354004, -27.012836456298828, -26.008359909057617, -25.003883361816406, -23.999408721923828, -22.994932174682617, -21.990455627441406, -20.985980987548828, -19.981504440307617, -18.977027893066406, -17.972551345825195, -16.968074798583984, -15.963600158691406, -14.959123611450195, -13.954647064208984, -12.95017147064209, -11.945695877075195, -10.941219329833984, -9.936742782592773, -8.932267189025879, -7.927791118621826, -6.923315048217773, -5.918838977813721, -4.914362907409668, -3.9098868370056152, -2.905406951904297, -1.9009308815002441, -0.8964548110961914, 0.10802125930786133, 1.112497329711914, 2.116973400115967, 3.1214494705200195, 4.125925540924072, 5.130401611328125, 6.134877681732178, 7.1393537521362305, 8.143829345703125, 9.148305892944336, 10.152782440185547, 11.157258033752441, 12.161733627319336, 13.166210174560547, 14.170686721801758, 15.175162315368652, 16.179637908935547, 17.184114456176758, 18.18859100341797, 19.193065643310547, 20.197542190551758, 21.20201873779297, 22.20649528503418, 23.21097183227539, 24.21544647216797, 25.21992301940918, 26.22439956665039, 27.22887420654297, 28.23335075378418, 29.23782730102539]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 7.0, 7.0, 5.0, 14.0, 20.0, 15.0, 23.0, 38.0, 51.0, 120.0, 168.0, 319.0, 720.0, 1606.0, 4665.0, 17145.0, 102341.0, 3710296.0, 313140.0, 31516.0, 7464.0, 2490.0, 1033.0, 445.0, 220.0, 142.0, 81.0, 54.0, 41.0, 20.0, 18.0, 14.0, 7.0, 8.0, 9.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.703125, -22.0087890625, -21.314453125, -20.6201171875, -19.92578125, -19.2314453125, -18.537109375, -17.8427734375, -17.1484375, -16.4541015625, -15.759765625, -15.0654296875, -14.37109375, -13.6767578125, -12.982421875, -12.2880859375, -11.59375, -10.8994140625, -10.205078125, -9.5107421875, -8.81640625, -8.1220703125, -7.427734375, -6.7333984375, -6.0390625, -5.3447265625, -4.650390625, -3.9560546875, -3.26171875, -2.5673828125, -1.873046875, -1.1787109375, -0.484375, 0.2099609375, 0.904296875, 1.5986328125, 2.29296875, 2.9873046875, 3.681640625, 4.3759765625, 5.0703125, 5.7646484375, 6.458984375, 7.1533203125, 7.84765625, 8.5419921875, 9.236328125, 9.9306640625, 10.625, 11.3193359375, 12.013671875, 12.7080078125, 13.40234375, 14.0966796875, 14.791015625, 15.4853515625, 16.1796875, 16.8740234375, 17.568359375, 18.2626953125, 18.95703125, 19.6513671875, 20.345703125, 21.0400390625, 21.734375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 11.0, 15.0, 14.0, 14.0, 18.0, 23.0, 29.0, 23.0, 39.0, 52.0, 51.0, 50.0, 49.0, 46.0, 72.0, 68.0, 54.0, 33.0, 40.0, 51.0, 51.0, 30.0, 25.0, 22.0, 17.0, 24.0, 16.0, 9.0, 8.0, 6.0, 6.0, 7.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9873046875, -1.9262237548828125, -1.865142822265625, -1.8040618896484375, -1.74298095703125, -1.6819000244140625, -1.620819091796875, -1.5597381591796875, -1.4986572265625, -1.4375762939453125, -1.376495361328125, -1.3154144287109375, -1.25433349609375, -1.1932525634765625, -1.132171630859375, -1.0710906982421875, -1.010009765625, -0.9489288330078125, -0.887847900390625, -0.8267669677734375, -0.76568603515625, -0.7046051025390625, -0.643524169921875, -0.5824432373046875, -0.5213623046875, -0.4602813720703125, -0.399200439453125, -0.3381195068359375, -0.27703857421875, -0.2159576416015625, -0.154876708984375, -0.0937957763671875, -0.03271484375, 0.0283660888671875, 0.089447021484375, 0.1505279541015625, 0.21160888671875, 0.2726898193359375, 0.333770751953125, 0.3948516845703125, 0.4559326171875, 0.5170135498046875, 0.578094482421875, 0.6391754150390625, 0.70025634765625, 0.7613372802734375, 0.822418212890625, 0.8834991455078125, 0.944580078125, 1.0056610107421875, 1.066741943359375, 1.1278228759765625, 1.18890380859375, 1.2499847412109375, 1.311065673828125, 1.3721466064453125, 1.4332275390625, 1.4943084716796875, 1.555389404296875, 1.6164703369140625, 1.67755126953125, 1.7386322021484375, 1.799713134765625, 1.8607940673828125, 1.921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 11.0, 12.0, 15.0, 22.0, 41.0, 52.0, 80.0, 133.0, 203.0, 407.0, 853.0, 2087.0, 6042.0, 19968.0, 87870.0, 1059606.0, 2844683.0, 132911.0, 26641.0, 7781.0, 2673.0, 1043.0, 500.0, 255.0, 150.0, 77.0, 51.0, 38.0, 20.0, 25.0, 15.0, 7.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6484375, -11.248291015625, -10.84814453125, -10.447998046875, -10.0478515625, -9.647705078125, -9.24755859375, -8.847412109375, -8.447265625, -8.047119140625, -7.64697265625, -7.246826171875, -6.8466796875, -6.446533203125, -6.04638671875, -5.646240234375, -5.24609375, -4.845947265625, -4.44580078125, -4.045654296875, -3.6455078125, -3.245361328125, -2.84521484375, -2.445068359375, -2.044921875, -1.644775390625, -1.24462890625, -0.844482421875, -0.4443359375, -0.044189453125, 0.35595703125, 0.756103515625, 1.15625, 1.556396484375, 1.95654296875, 2.356689453125, 2.7568359375, 3.156982421875, 3.55712890625, 3.957275390625, 4.357421875, 4.757568359375, 5.15771484375, 5.557861328125, 5.9580078125, 6.358154296875, 6.75830078125, 7.158447265625, 7.55859375, 7.958740234375, 8.35888671875, 8.759033203125, 9.1591796875, 9.559326171875, 9.95947265625, 10.359619140625, 10.759765625, 11.159912109375, 11.56005859375, 11.960205078125, 12.3603515625, 12.760498046875, 13.16064453125, 13.560791015625, 13.9609375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 0.0, 2.0, 5.0, 7.0, 11.0, 7.0, 12.0, 22.0, 19.0, 12.0, 33.0, 36.0, 64.0, 102.0, 161.0, 285.0, 535.0, 1313.0, 634.0, 292.0, 170.0, 98.0, 66.0, 48.0, 33.0, 30.0, 15.0, 10.0, 15.0, 10.0, 7.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.892608642578125, -2.77935791015625, -2.666107177734375, -2.5528564453125, -2.439605712890625, -2.32635498046875, -2.213104248046875, -2.099853515625, -1.986602783203125, -1.87335205078125, -1.760101318359375, -1.6468505859375, -1.533599853515625, -1.42034912109375, -1.307098388671875, -1.19384765625, -1.080596923828125, -0.96734619140625, -0.854095458984375, -0.7408447265625, -0.627593994140625, -0.51434326171875, -0.401092529296875, -0.287841796875, -0.174591064453125, -0.06134033203125, 0.051910400390625, 0.1651611328125, 0.278411865234375, 0.39166259765625, 0.504913330078125, 0.6181640625, 0.731414794921875, 0.84466552734375, 0.957916259765625, 1.0711669921875, 1.184417724609375, 1.29766845703125, 1.410919189453125, 1.524169921875, 1.637420654296875, 1.75067138671875, 1.863922119140625, 1.9771728515625, 2.090423583984375, 2.20367431640625, 2.316925048828125, 2.43017578125, 2.543426513671875, 2.65667724609375, 2.769927978515625, 2.8831787109375, 2.996429443359375, 3.10968017578125, 3.222930908203125, 3.336181640625, 3.449432373046875, 3.56268310546875, 3.675933837890625, 3.7891845703125, 3.902435302734375, 4.01568603515625, 4.128936767578125, 4.2421875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 13.0, 18.0, 36.0, 52.0, 69.0, 85.0, 102.0, 112.0, 110.0, 97.0, 84.0, 70.0, 46.0, 23.0, 28.0, 14.0, 14.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.307350158691406, -26.50409698486328, -25.70084571838379, -24.897592544555664, -24.09433937072754, -23.291088104248047, -22.487834930419922, -21.684581756591797, -20.881328582763672, -20.078075408935547, -19.274824142456055, -18.47157096862793, -17.668317794799805, -16.865066528320312, -16.061813354492188, -15.258560180664062, -14.45530891418457, -13.652056694030762, -12.848803520202637, -12.045551300048828, -11.242298126220703, -10.439045906066895, -9.635793685913086, -8.832540512084961, -8.029288291931152, -7.2260355949401855, -6.422782897949219, -5.61953067779541, -4.816277980804443, -4.013025283813477, -3.209773063659668, -2.406520366668701, -1.6032676696777344, -0.8000150918960571, 0.003237485885620117, 0.8064899444580078, 1.6097426414489746, 2.4129953384399414, 3.21624755859375, 4.019500255584717, 4.822752952575684, 5.62600564956665, 6.429258346557617, 7.232510566711426, 8.035762786865234, 8.83901596069336, 9.642268180847168, 10.445520401000977, 11.248773574829102, 12.05202579498291, 12.855278968811035, 13.658531188964844, 14.461784362792969, 15.265036582946777, 16.068288803100586, 16.87154197692871, 17.674793243408203, 18.478046417236328, 19.28129768371582, 20.084550857543945, 20.88780403137207, 21.691055297851562, 22.494308471679688, 23.297561645507812, 24.100814819335938]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 10.0, 9.0, 19.0, 15.0, 19.0, 16.0, 33.0, 28.0, 27.0, 56.0, 45.0, 33.0, 41.0, 48.0, 47.0, 46.0, 64.0, 53.0, 44.0, 47.0, 57.0, 37.0, 41.0, 38.0, 35.0, 22.0, 18.0, 11.0, 12.0, 12.0, 8.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.987573623657227, -14.501357078552246, -14.01513957977295, -13.528923034667969, -13.042705535888672, -12.556488990783691, -12.070271492004395, -11.584054946899414, -11.097837448120117, -10.611620903015137, -10.12540340423584, -9.63918685913086, -9.152969360351562, -8.666752815246582, -8.180535316467285, -7.694318771362305, -7.208101749420166, -6.721884727478027, -6.235667705535889, -5.74945068359375, -5.263233661651611, -4.777016639709473, -4.290800094604492, -3.8045828342437744, -3.3183658123016357, -2.832148790359497, -2.3459317684173584, -1.8597148656845093, -1.3734978437423706, -0.8872809410095215, -0.4010639190673828, 0.08515310287475586, 0.5713701248168945, 1.0575871467590332, 1.5438041687011719, 2.0300211906433105, 2.516238212585449, 3.002454996109009, 3.4886720180511475, 3.974889039993286, 4.461106300354004, 4.947323322296143, 5.433540344238281, 5.91975736618042, 6.405974388122559, 6.892190933227539, 7.378408432006836, 7.864624977111816, 8.350841522216797, 8.837058067321777, 9.323275566101074, 9.809492111206055, 10.295709609985352, 10.781926155090332, 11.268143653869629, 11.75436019897461, 12.240577697753906, 12.726794242858887, 13.213011741638184, 13.699228286743164, 14.185445785522461, 14.671662330627441, 15.157879829406738, 15.644096374511719, 16.130313873291016]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 6.0, 5.0, 11.0, 17.0, 23.0, 37.0, 55.0, 102.0, 196.0, 328.0, 718.0, 1545.0, 3911.0, 12302.0, 44446.0, 199308.0, 629482.0, 113290.0, 29141.0, 8392.0, 2872.0, 1109.0, 576.0, 296.0, 155.0, 88.0, 44.0, 34.0, 16.0, 14.0, 14.0, 8.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.6571044921875, -11.197021484375, -10.7369384765625, -10.27685546875, -9.8167724609375, -9.356689453125, -8.8966064453125, -8.4365234375, -7.9764404296875, -7.516357421875, -7.0562744140625, -6.59619140625, -6.1361083984375, -5.676025390625, -5.2159423828125, -4.755859375, -4.2957763671875, -3.835693359375, -3.3756103515625, -2.91552734375, -2.4554443359375, -1.995361328125, -1.5352783203125, -1.0751953125, -0.6151123046875, -0.155029296875, 0.3050537109375, 0.76513671875, 1.2252197265625, 1.685302734375, 2.1453857421875, 2.60546875, 3.0655517578125, 3.525634765625, 3.9857177734375, 4.44580078125, 4.9058837890625, 5.365966796875, 5.8260498046875, 6.2861328125, 6.7462158203125, 7.206298828125, 7.6663818359375, 8.12646484375, 8.5865478515625, 9.046630859375, 9.5067138671875, 9.966796875, 10.4268798828125, 10.886962890625, 11.3470458984375, 11.80712890625, 12.2672119140625, 12.727294921875, 13.1873779296875, 13.6474609375, 14.1075439453125, 14.567626953125, 15.0277099609375, 15.48779296875, 15.9478759765625, 16.407958984375, 16.8680419921875, 17.328125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 1.0, 5.0, 8.0, 6.0, 15.0, 7.0, 13.0, 23.0, 20.0, 28.0, 30.0, 35.0, 41.0, 57.0, 42.0, 64.0, 55.0, 48.0, 60.0, 61.0, 50.0, 44.0, 34.0, 50.0, 42.0, 25.0, 24.0, 20.0, 18.0, 17.0, 11.0, 9.0, 5.0, 11.0, 2.0, 3.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9794921875, -1.9173736572265625, -1.855255126953125, -1.7931365966796875, -1.73101806640625, -1.6688995361328125, -1.606781005859375, -1.5446624755859375, -1.4825439453125, -1.4204254150390625, -1.358306884765625, -1.2961883544921875, -1.23406982421875, -1.1719512939453125, -1.109832763671875, -1.0477142333984375, -0.985595703125, -0.9234771728515625, -0.861358642578125, -0.7992401123046875, -0.73712158203125, -0.6750030517578125, -0.612884521484375, -0.5507659912109375, -0.4886474609375, -0.4265289306640625, -0.364410400390625, -0.3022918701171875, -0.24017333984375, -0.1780548095703125, -0.115936279296875, -0.0538177490234375, 0.00830078125, 0.0704193115234375, 0.132537841796875, 0.1946563720703125, 0.25677490234375, 0.3188934326171875, 0.381011962890625, 0.4431304931640625, 0.5052490234375, 0.5673675537109375, 0.629486083984375, 0.6916046142578125, 0.75372314453125, 0.8158416748046875, 0.877960205078125, 0.9400787353515625, 1.002197265625, 1.0643157958984375, 1.126434326171875, 1.1885528564453125, 1.25067138671875, 1.3127899169921875, 1.374908447265625, 1.4370269775390625, 1.4991455078125, 1.5612640380859375, 1.623382568359375, 1.6855010986328125, 1.74761962890625, 1.8097381591796875, 1.871856689453125, 1.9339752197265625, 1.99609375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 10.0, 6.0, 10.0, 13.0, 20.0, 16.0, 38.0, 43.0, 63.0, 100.0, 143.0, 228.0, 391.0, 790.0, 1610.0, 3395.0, 7831.0, 18768.0, 45849.0, 124923.0, 456732.0, 257153.0, 77229.0, 30222.0, 12639.0, 5399.0, 2361.0, 1113.0, 623.0, 288.0, 176.0, 132.0, 60.0, 56.0, 33.0, 29.0, 25.0, 15.0, 5.0, 7.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.21875, -7.9952392578125, -7.771728515625, -7.5482177734375, -7.32470703125, -7.1011962890625, -6.877685546875, -6.6541748046875, -6.4306640625, -6.2071533203125, -5.983642578125, -5.7601318359375, -5.53662109375, -5.3131103515625, -5.089599609375, -4.8660888671875, -4.642578125, -4.4190673828125, -4.195556640625, -3.9720458984375, -3.74853515625, -3.5250244140625, -3.301513671875, -3.0780029296875, -2.8544921875, -2.6309814453125, -2.407470703125, -2.1839599609375, -1.96044921875, -1.7369384765625, -1.513427734375, -1.2899169921875, -1.06640625, -0.8428955078125, -0.619384765625, -0.3958740234375, -0.17236328125, 0.0511474609375, 0.274658203125, 0.4981689453125, 0.7216796875, 0.9451904296875, 1.168701171875, 1.3922119140625, 1.61572265625, 1.8392333984375, 2.062744140625, 2.2862548828125, 2.509765625, 2.7332763671875, 2.956787109375, 3.1802978515625, 3.40380859375, 3.6273193359375, 3.850830078125, 4.0743408203125, 4.2978515625, 4.5213623046875, 4.744873046875, 4.9683837890625, 5.19189453125, 5.4154052734375, 5.638916015625, 5.8624267578125, 6.0859375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 10.0, 7.0, 11.0, 12.0, 13.0, 14.0, 17.0, 14.0, 19.0, 23.0, 23.0, 34.0, 29.0, 44.0, 38.0, 39.0, 37.0, 37.0, 47.0, 47.0, 38.0, 40.0, 31.0, 51.0, 25.0, 34.0, 24.0, 36.0, 26.0, 29.0, 23.0, 16.0, 21.0, 23.0, 17.0, 7.0, 9.0, 6.0, 9.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30859375, -6.1004638671875, -5.892333984375, -5.6842041015625, -5.47607421875, -5.2679443359375, -5.059814453125, -4.8516845703125, -4.6435546875, -4.4354248046875, -4.227294921875, -4.0191650390625, -3.81103515625, -3.6029052734375, -3.394775390625, -3.1866455078125, -2.978515625, -2.7703857421875, -2.562255859375, -2.3541259765625, -2.14599609375, -1.9378662109375, -1.729736328125, -1.5216064453125, -1.3134765625, -1.1053466796875, -0.897216796875, -0.6890869140625, -0.48095703125, -0.2728271484375, -0.064697265625, 0.1434326171875, 0.3515625, 0.5596923828125, 0.767822265625, 0.9759521484375, 1.18408203125, 1.3922119140625, 1.600341796875, 1.8084716796875, 2.0166015625, 2.2247314453125, 2.432861328125, 2.6409912109375, 2.84912109375, 3.0572509765625, 3.265380859375, 3.4735107421875, 3.681640625, 3.8897705078125, 4.097900390625, 4.3060302734375, 4.51416015625, 4.7222900390625, 4.930419921875, 5.1385498046875, 5.3466796875, 5.5548095703125, 5.762939453125, 5.9710693359375, 6.17919921875, 6.3873291015625, 6.595458984375, 6.8035888671875, 7.01171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 7.0, 15.0, 12.0, 38.0, 53.0, 92.0, 154.0, 352.0, 723.0, 2168.0, 7270.0, 31433.0, 189267.0, 676538.0, 111457.0, 20957.0, 5127.0, 1635.0, 596.0, 287.0, 172.0, 81.0, 44.0, 28.0, 18.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.234375, -5.0775146484375, -4.920654296875, -4.7637939453125, -4.60693359375, -4.4500732421875, -4.293212890625, -4.1363525390625, -3.9794921875, -3.8226318359375, -3.665771484375, -3.5089111328125, -3.35205078125, -3.1951904296875, -3.038330078125, -2.8814697265625, -2.724609375, -2.5677490234375, -2.410888671875, -2.2540283203125, -2.09716796875, -1.9403076171875, -1.783447265625, -1.6265869140625, -1.4697265625, -1.3128662109375, -1.156005859375, -0.9991455078125, -0.84228515625, -0.6854248046875, -0.528564453125, -0.3717041015625, -0.21484375, -0.0579833984375, 0.098876953125, 0.2557373046875, 0.41259765625, 0.5694580078125, 0.726318359375, 0.8831787109375, 1.0400390625, 1.1968994140625, 1.353759765625, 1.5106201171875, 1.66748046875, 1.8243408203125, 1.981201171875, 2.1380615234375, 2.294921875, 2.4517822265625, 2.608642578125, 2.7655029296875, 2.92236328125, 3.0792236328125, 3.236083984375, 3.3929443359375, 3.5498046875, 3.7066650390625, 3.863525390625, 4.0203857421875, 4.17724609375, 4.3341064453125, 4.490966796875, 4.6478271484375, 4.8046875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 5.0, 3.0, 5.0, 5.0, 9.0, 8.0, 16.0, 15.0, 12.0, 19.0, 38.0, 65.0, 126.0, 259.0, 172.0, 95.0, 43.0, 20.0, 11.0, 17.0, 17.0, 9.0, 9.0, 3.0, 2.0, 10.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005159378051757812, -0.0004931986331939697, -0.0004704594612121582, -0.0004477202892303467, -0.00042498111724853516, -0.00040224194526672363, -0.0003795027732849121, -0.0003567636013031006, -0.00033402442932128906, -0.00031128525733947754, -0.000288546085357666, -0.0002658069133758545, -0.00024306774139404297, -0.00022032856941223145, -0.00019758939743041992, -0.0001748502254486084, -0.00015211105346679688, -0.00012937188148498535, -0.00010663270950317383, -8.38935375213623e-05, -6.115436553955078e-05, -3.841519355773926e-05, -1.5676021575927734e-05, 7.063150405883789e-06, 2.9802322387695312e-05, 5.2541494369506836e-05, 7.528066635131836e-05, 9.801983833312988e-05, 0.0001207590103149414, 0.00014349818229675293, 0.00016623735427856445, 0.00018897652626037598, 0.0002117156982421875, 0.00023445487022399902, 0.00025719404220581055, 0.00027993321418762207, 0.0003026723861694336, 0.0003254115581512451, 0.00034815073013305664, 0.00037088990211486816, 0.0003936290740966797, 0.0004163682460784912, 0.00043910741806030273, 0.00046184659004211426, 0.0004845857620239258, 0.0005073249340057373, 0.0005300641059875488, 0.0005528032779693604, 0.0005755424499511719, 0.0005982816219329834, 0.0006210207939147949, 0.0006437599658966064, 0.000666499137878418, 0.0006892383098602295, 0.000711977481842041, 0.0007347166538238525, 0.0007574558258056641, 0.0007801949977874756, 0.0008029341697692871, 0.0008256733417510986, 0.0008484125137329102, 0.0008711516857147217, 0.0008938908576965332, 0.0009166300296783447, 0.0009393692016601562]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 5.0, 3.0, 5.0, 8.0, 14.0, 22.0, 21.0, 36.0, 62.0, 83.0, 167.0, 295.0, 567.0, 1028.0, 2192.0, 4719.0, 10633.0, 28625.0, 89029.0, 359700.0, 400845.0, 98501.0, 30683.0, 11530.0, 4972.0, 2326.0, 1090.0, 603.0, 300.0, 161.0, 104.0, 75.0, 45.0, 23.0, 19.0, 12.0, 16.0, 13.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.380859375, -3.268310546875, -3.15576171875, -3.043212890625, -2.9306640625, -2.818115234375, -2.70556640625, -2.593017578125, -2.48046875, -2.367919921875, -2.25537109375, -2.142822265625, -2.0302734375, -1.917724609375, -1.80517578125, -1.692626953125, -1.580078125, -1.467529296875, -1.35498046875, -1.242431640625, -1.1298828125, -1.017333984375, -0.90478515625, -0.792236328125, -0.6796875, -0.567138671875, -0.45458984375, -0.342041015625, -0.2294921875, -0.116943359375, -0.00439453125, 0.108154296875, 0.220703125, 0.333251953125, 0.44580078125, 0.558349609375, 0.6708984375, 0.783447265625, 0.89599609375, 1.008544921875, 1.12109375, 1.233642578125, 1.34619140625, 1.458740234375, 1.5712890625, 1.683837890625, 1.79638671875, 1.908935546875, 2.021484375, 2.134033203125, 2.24658203125, 2.359130859375, 2.4716796875, 2.584228515625, 2.69677734375, 2.809326171875, 2.921875, 3.034423828125, 3.14697265625, 3.259521484375, 3.3720703125, 3.484619140625, 3.59716796875, 3.709716796875, 3.822265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 8.0, 12.0, 5.0, 11.0, 11.0, 28.0, 25.0, 41.0, 42.0, 54.0, 41.0, 65.0, 80.0, 91.0, 80.0, 65.0, 52.0, 48.0, 43.0, 25.0, 27.0, 17.0, 15.0, 6.0, 8.0, 9.0, 10.0, 13.0, 5.0, 4.0, 3.0, 7.0, 6.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.140625, -3.0496826171875, -2.958740234375, -2.8677978515625, -2.77685546875, -2.6859130859375, -2.594970703125, -2.5040283203125, -2.4130859375, -2.3221435546875, -2.231201171875, -2.1402587890625, -2.04931640625, -1.9583740234375, -1.867431640625, -1.7764892578125, -1.685546875, -1.5946044921875, -1.503662109375, -1.4127197265625, -1.32177734375, -1.2308349609375, -1.139892578125, -1.0489501953125, -0.9580078125, -0.8670654296875, -0.776123046875, -0.6851806640625, -0.59423828125, -0.5032958984375, -0.412353515625, -0.3214111328125, -0.23046875, -0.1395263671875, -0.048583984375, 0.0423583984375, 0.13330078125, 0.2242431640625, 0.315185546875, 0.4061279296875, 0.4970703125, 0.5880126953125, 0.678955078125, 0.7698974609375, 0.86083984375, 0.9517822265625, 1.042724609375, 1.1336669921875, 1.224609375, 1.3155517578125, 1.406494140625, 1.4974365234375, 1.58837890625, 1.6793212890625, 1.770263671875, 1.8612060546875, 1.9521484375, 2.0430908203125, 2.134033203125, 2.2249755859375, 2.31591796875, 2.4068603515625, 2.497802734375, 2.5887451171875, 2.6796875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 8.0, 23.0, 44.0, 90.0, 170.0, 198.0, 219.0, 120.0, 71.0, 44.0, 10.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.873268127441406, -57.943050384521484, -55.0128288269043, -52.082611083984375, -49.15238952636719, -46.222171783447266, -43.291954040527344, -40.361732482910156, -37.431514739990234, -34.50129699707031, -31.571075439453125, -28.640857696533203, -25.71063804626465, -22.780418395996094, -19.850200653076172, -16.919981002807617, -13.989761352539062, -11.059541702270508, -8.12932300567627, -5.199104309082031, -2.2688846588134766, 0.6613349914550781, 3.591552734375, 6.521772384643555, 9.45199203491211, 12.382211685180664, 15.312430381774902, 18.24264907836914, 21.172868728637695, 24.10308837890625, 27.033306121826172, 29.963525772094727, 32.89374542236328, 35.8239631652832, 38.75418472290039, 41.68440246582031, 44.6146240234375, 47.54484176635742, 50.475059509277344, 53.40528106689453, 56.33549880981445, 59.265716552734375, 62.19593811035156, 65.12615966796875, 68.0563735961914, 70.9865951538086, 73.91680908203125, 76.84703063964844, 79.77725219726562, 82.70747375488281, 85.63768768310547, 88.56790924072266, 91.49813079833984, 94.4283447265625, 97.35856628417969, 100.28878784179688, 103.21900939941406, 106.14923095703125, 109.0794448852539, 112.0096664428711, 114.93988800048828, 117.87010192871094, 120.80032348632812, 123.73054504394531, 126.66075897216797]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 11.0, 7.0, 12.0, 9.0, 12.0, 11.0, 12.0, 11.0, 13.0, 17.0, 18.0, 38.0, 18.0, 23.0, 28.0, 33.0, 36.0, 35.0, 37.0, 27.0, 44.0, 47.0, 36.0, 36.0, 37.0, 37.0, 38.0, 42.0, 46.0, 33.0, 24.0, 29.0, 11.0, 17.0, 17.0, 17.0, 13.0, 15.0, 12.0, 12.0, 2.0, 3.0, 3.0, 7.0, 1.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-28.655441284179688, -27.728147506713867, -26.80085563659668, -25.87356185913086, -24.94626808166504, -24.01897430419922, -23.09168243408203, -22.16438865661621, -21.23709487915039, -20.30980110168457, -19.382509231567383, -18.455215454101562, -17.527921676635742, -16.600627899169922, -15.673336029052734, -14.746042251586914, -13.818750381469727, -12.891457557678223, -11.964163780212402, -11.036870956420898, -10.109577178955078, -9.182284355163574, -8.25499153137207, -7.327698230743408, -6.400404930114746, -5.473111629486084, -4.545818328857422, -3.618525505065918, -2.691232204437256, -1.7639389038085938, -0.8366460800170898, 0.09064722061157227, 1.0179405212402344, 1.945233702659607, 2.8725268840789795, 3.7998199462890625, 4.727113246917725, 5.654406547546387, 6.581699371337891, 7.508992671966553, 8.436285972595215, 9.363578796386719, 10.290872573852539, 11.218165397644043, 12.145458221435547, 13.072751998901367, 14.000044822692871, 14.927337646484375, 15.854631423950195, 16.781925201416016, 17.709217071533203, 18.636510848999023, 19.563804626464844, 20.49109649658203, 21.41839027404785, 22.345684051513672, 23.27297592163086, 24.20026969909668, 25.127561569213867, 26.054855346679688, 26.982149124145508, 27.909442901611328, 28.836734771728516, 29.764028549194336, 30.691322326660156]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 12.0, 18.0, 23.0, 25.0, 45.0, 70.0, 123.0, 220.0, 350.0, 676.0, 1365.0, 2986.0, 6890.0, 18902.0, 73868.0, 794071.0, 3144522.0, 109212.0, 25052.0, 8468.0, 3681.0, 1678.0, 850.0, 455.0, 263.0, 150.0, 99.0, 67.0, 42.0, 27.0, 18.0, 12.0, 13.0, 8.0, 4.0, 10.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.078125, -13.5390625, -13.0, -12.4609375, -11.921875, -11.3828125, -10.84375, -10.3046875, -9.765625, -9.2265625, -8.6875, -8.1484375, -7.609375, -7.0703125, -6.53125, -5.9921875, -5.453125, -4.9140625, -4.375, -3.8359375, -3.296875, -2.7578125, -2.21875, -1.6796875, -1.140625, -0.6015625, -0.0625, 0.4765625, 1.015625, 1.5546875, 2.09375, 2.6328125, 3.171875, 3.7109375, 4.25, 4.7890625, 5.328125, 5.8671875, 6.40625, 6.9453125, 7.484375, 8.0234375, 8.5625, 9.1015625, 9.640625, 10.1796875, 10.71875, 11.2578125, 11.796875, 12.3359375, 12.875, 13.4140625, 13.953125, 14.4921875, 15.03125, 15.5703125, 16.109375, 16.6484375, 17.1875, 17.7265625, 18.265625, 18.8046875, 19.34375, 19.8828125, 20.421875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 13.0, 5.0, 13.0, 18.0, 24.0, 15.0, 23.0, 41.0, 27.0, 49.0, 55.0, 47.0, 55.0, 50.0, 63.0, 49.0, 64.0, 50.0, 36.0, 40.0, 33.0, 34.0, 37.0, 29.0, 14.0, 15.0, 19.0, 14.0, 12.0, 6.0, 7.0, 6.0, 4.0, 4.0, 5.0, 0.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.90625, -1.8463134765625, -1.786376953125, -1.7264404296875, -1.66650390625, -1.6065673828125, -1.546630859375, -1.4866943359375, -1.4267578125, -1.3668212890625, -1.306884765625, -1.2469482421875, -1.18701171875, -1.1270751953125, -1.067138671875, -1.0072021484375, -0.947265625, -0.8873291015625, -0.827392578125, -0.7674560546875, -0.70751953125, -0.6475830078125, -0.587646484375, -0.5277099609375, -0.4677734375, -0.4078369140625, -0.347900390625, -0.2879638671875, -0.22802734375, -0.1680908203125, -0.108154296875, -0.0482177734375, 0.01171875, 0.0716552734375, 0.131591796875, 0.1915283203125, 0.25146484375, 0.3114013671875, 0.371337890625, 0.4312744140625, 0.4912109375, 0.5511474609375, 0.611083984375, 0.6710205078125, 0.73095703125, 0.7908935546875, 0.850830078125, 0.9107666015625, 0.970703125, 1.0306396484375, 1.090576171875, 1.1505126953125, 1.21044921875, 1.2703857421875, 1.330322265625, 1.3902587890625, 1.4501953125, 1.5101318359375, 1.570068359375, 1.6300048828125, 1.68994140625, 1.7498779296875, 1.809814453125, 1.8697509765625, 1.9296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 7.0, 9.0, 15.0, 21.0, 27.0, 38.0, 62.0, 80.0, 115.0, 179.0, 310.0, 485.0, 732.0, 1283.0, 2245.0, 4075.0, 8057.0, 16474.0, 37682.0, 98521.0, 339314.0, 2824601.0, 621842.0, 143635.0, 51216.0, 21585.0, 10193.0, 5022.0, 2679.0, 1510.0, 852.0, 501.0, 317.0, 198.0, 140.0, 88.0, 46.0, 40.0, 21.0, 20.0, 17.0, 14.0, 4.0, 6.0, 6.0, 5.0, 1.0], "bins": [-8.546875, -8.32586669921875, -8.1048583984375, -7.88385009765625, -7.662841796875, -7.44183349609375, -7.2208251953125, -6.99981689453125, -6.77880859375, -6.55780029296875, -6.3367919921875, -6.11578369140625, -5.894775390625, -5.67376708984375, -5.4527587890625, -5.23175048828125, -5.0107421875, -4.78973388671875, -4.5687255859375, -4.34771728515625, -4.126708984375, -3.90570068359375, -3.6846923828125, -3.46368408203125, -3.24267578125, -3.02166748046875, -2.8006591796875, -2.57965087890625, -2.358642578125, -2.13763427734375, -1.9166259765625, -1.69561767578125, -1.474609375, -1.25360107421875, -1.0325927734375, -0.81158447265625, -0.590576171875, -0.36956787109375, -0.1485595703125, 0.07244873046875, 0.29345703125, 0.51446533203125, 0.7354736328125, 0.95648193359375, 1.177490234375, 1.39849853515625, 1.6195068359375, 1.84051513671875, 2.0615234375, 2.28253173828125, 2.5035400390625, 2.72454833984375, 2.945556640625, 3.16656494140625, 3.3875732421875, 3.60858154296875, 3.82958984375, 4.05059814453125, 4.2716064453125, 4.49261474609375, 4.713623046875, 4.93463134765625, 5.1556396484375, 5.37664794921875, 5.59765625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 0.0, 4.0, 3.0, 10.0, 7.0, 14.0, 18.0, 23.0, 16.0, 44.0, 65.0, 75.0, 94.0, 160.0, 326.0, 616.0, 1503.0, 410.0, 229.0, 154.0, 89.0, 60.0, 37.0, 26.0, 20.0, 26.0, 10.0, 10.0, 7.0, 3.0, 1.0, 6.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.21875, -4.10260009765625, -3.9864501953125, -3.87030029296875, -3.754150390625, -3.63800048828125, -3.5218505859375, -3.40570068359375, -3.28955078125, -3.17340087890625, -3.0572509765625, -2.94110107421875, -2.824951171875, -2.70880126953125, -2.5926513671875, -2.47650146484375, -2.3603515625, -2.24420166015625, -2.1280517578125, -2.01190185546875, -1.895751953125, -1.77960205078125, -1.6634521484375, -1.54730224609375, -1.43115234375, -1.31500244140625, -1.1988525390625, -1.08270263671875, -0.966552734375, -0.85040283203125, -0.7342529296875, -0.61810302734375, -0.501953125, -0.38580322265625, -0.2696533203125, -0.15350341796875, -0.037353515625, 0.07879638671875, 0.1949462890625, 0.31109619140625, 0.42724609375, 0.54339599609375, 0.6595458984375, 0.77569580078125, 0.891845703125, 1.00799560546875, 1.1241455078125, 1.24029541015625, 1.3564453125, 1.47259521484375, 1.5887451171875, 1.70489501953125, 1.821044921875, 1.93719482421875, 2.0533447265625, 2.16949462890625, 2.28564453125, 2.40179443359375, 2.5179443359375, 2.63409423828125, 2.750244140625, 2.86639404296875, 2.9825439453125, 3.09869384765625, 3.21484375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 8.0, 7.0, 10.0, 22.0, 40.0, 68.0, 129.0, 151.0, 161.0, 163.0, 115.0, 60.0, 43.0, 15.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.11037063598633, -40.98886489868164, -39.86736297607422, -38.74585723876953, -37.624351501464844, -36.50284957885742, -35.381343841552734, -34.25984191894531, -33.138336181640625, -32.01683044433594, -30.895328521728516, -29.773822784423828, -28.652318954467773, -27.53081512451172, -26.40930938720703, -25.287805557250977, -24.166301727294922, -23.044797897338867, -21.923294067382812, -20.801788330078125, -19.68028450012207, -18.558780670166016, -17.437274932861328, -16.315771102905273, -15.194267272949219, -14.072763442993164, -12.951258659362793, -11.829753875732422, -10.708250045776367, -9.586746215820312, -8.465241432189941, -7.3437371253967285, -6.222236633300781, -5.100732326507568, -3.9792280197143555, -2.8577237129211426, -1.7362194061279297, -0.6147150993347168, 0.5067892074584961, 1.628293514251709, 2.749797821044922, 3.8713021278381348, 4.992806434631348, 6.1143107414245605, 7.235815048217773, 8.357318878173828, 9.4788236618042, 10.60032844543457, 11.721832275390625, 12.84333610534668, 13.96484088897705, 15.086345672607422, 16.207849502563477, 17.32935333251953, 18.45085906982422, 19.572362899780273, 20.693866729736328, 21.815370559692383, 22.936874389648438, 24.058380126953125, 25.17988395690918, 26.301387786865234, 27.422893524169922, 28.544397354125977, 29.66590118408203]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 6.0, 9.0, 11.0, 11.0, 10.0, 21.0, 25.0, 16.0, 25.0, 27.0, 24.0, 43.0, 33.0, 37.0, 39.0, 38.0, 42.0, 41.0, 43.0, 33.0, 45.0, 32.0, 25.0, 41.0, 34.0, 27.0, 37.0, 32.0, 19.0, 16.0, 22.0, 21.0, 15.0, 19.0, 14.0, 6.0, 11.0, 7.0, 9.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.666410446166992, -9.317983627319336, -8.96955680847168, -8.621129989624023, -8.272703170776367, -7.924276351928711, -7.575850009918213, -7.227423191070557, -6.8789963722229, -6.530569553375244, -6.182142734527588, -5.83371639251709, -5.485289573669434, -5.136862754821777, -4.788435935974121, -4.440009117126465, -4.091582298278809, -3.7431554794311523, -3.394728660583496, -3.046302080154419, -2.6978752613067627, -2.3494484424591064, -2.0010218620300293, -1.652595043182373, -1.3041682243347168, -0.9557414650917053, -0.6073147058486938, -0.25888800621032715, 0.0895388126373291, 0.43796563148498535, 0.7863922119140625, 1.1348190307617188, 1.483245849609375, 1.8316726684570312, 2.1800994873046875, 2.5285260677337646, 2.876952886581421, 3.225379705429077, 3.5738062858581543, 3.9222331047058105, 4.270659923553467, 4.619086742401123, 4.967513561248779, 5.315939903259277, 5.664366722106934, 6.01279354095459, 6.361220359802246, 6.709647178649902, 7.058073997497559, 7.406500816345215, 7.754927635192871, 8.103354454040527, 8.451781272888184, 8.80020809173584, 9.14863395690918, 9.497060775756836, 9.845487594604492, 10.193914413452148, 10.542341232299805, 10.890768051147461, 11.239194869995117, 11.587621688842773, 11.93604850769043, 12.284475326538086, 12.632902145385742]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 7.0, 13.0, 20.0, 21.0, 31.0, 52.0, 56.0, 111.0, 209.0, 348.0, 544.0, 1129.0, 2076.0, 4519.0, 10475.0, 28450.0, 77314.0, 202670.0, 387776.0, 205715.0, 78002.0, 28929.0, 10947.0, 4569.0, 2081.0, 1038.0, 575.0, 361.0, 193.0, 130.0, 67.0, 35.0, 27.0, 23.0, 6.0, 5.0, 2.0, 9.0, 5.0, 8.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.421875, -10.11083984375, -9.7998046875, -9.48876953125, -9.177734375, -8.86669921875, -8.5556640625, -8.24462890625, -7.93359375, -7.62255859375, -7.3115234375, -7.00048828125, -6.689453125, -6.37841796875, -6.0673828125, -5.75634765625, -5.4453125, -5.13427734375, -4.8232421875, -4.51220703125, -4.201171875, -3.89013671875, -3.5791015625, -3.26806640625, -2.95703125, -2.64599609375, -2.3349609375, -2.02392578125, -1.712890625, -1.40185546875, -1.0908203125, -0.77978515625, -0.46875, -0.15771484375, 0.1533203125, 0.46435546875, 0.775390625, 1.08642578125, 1.3974609375, 1.70849609375, 2.01953125, 2.33056640625, 2.6416015625, 2.95263671875, 3.263671875, 3.57470703125, 3.8857421875, 4.19677734375, 4.5078125, 4.81884765625, 5.1298828125, 5.44091796875, 5.751953125, 6.06298828125, 6.3740234375, 6.68505859375, 6.99609375, 7.30712890625, 7.6181640625, 7.92919921875, 8.240234375, 8.55126953125, 8.8623046875, 9.17333984375, 9.484375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 8.0, 7.0, 9.0, 17.0, 17.0, 26.0, 30.0, 38.0, 41.0, 37.0, 44.0, 48.0, 55.0, 52.0, 42.0, 43.0, 57.0, 52.0, 50.0, 48.0, 42.0, 36.0, 32.0, 25.0, 23.0, 15.0, 23.0, 14.0, 10.0, 11.0, 9.0, 10.0, 2.0, 0.0, 4.0, 5.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.119140625, -2.05718994140625, -1.9952392578125, -1.93328857421875, -1.871337890625, -1.80938720703125, -1.7474365234375, -1.68548583984375, -1.62353515625, -1.56158447265625, -1.4996337890625, -1.43768310546875, -1.375732421875, -1.31378173828125, -1.2518310546875, -1.18988037109375, -1.1279296875, -1.06597900390625, -1.0040283203125, -0.94207763671875, -0.880126953125, -0.81817626953125, -0.7562255859375, -0.69427490234375, -0.63232421875, -0.57037353515625, -0.5084228515625, -0.44647216796875, -0.384521484375, -0.32257080078125, -0.2606201171875, -0.19866943359375, -0.13671875, -0.07476806640625, -0.0128173828125, 0.04913330078125, 0.111083984375, 0.17303466796875, 0.2349853515625, 0.29693603515625, 0.35888671875, 0.42083740234375, 0.4827880859375, 0.54473876953125, 0.606689453125, 0.66864013671875, 0.7305908203125, 0.79254150390625, 0.8544921875, 0.91644287109375, 0.9783935546875, 1.04034423828125, 1.102294921875, 1.16424560546875, 1.2261962890625, 1.28814697265625, 1.35009765625, 1.41204833984375, 1.4739990234375, 1.53594970703125, 1.597900390625, 1.65985107421875, 1.7218017578125, 1.78375244140625, 1.845703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 5.0, 3.0, 6.0, 10.0, 6.0, 21.0, 27.0, 30.0, 52.0, 50.0, 94.0, 128.0, 192.0, 242.0, 334.0, 556.0, 1075.0, 2511.0, 10934.0, 70083.0, 448922.0, 431655.0, 66259.0, 10225.0, 2338.0, 991.0, 563.0, 352.0, 240.0, 168.0, 122.0, 101.0, 79.0, 54.0, 43.0, 19.0, 18.0, 19.0, 10.0, 8.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.390625, -12.95849609375, -12.5263671875, -12.09423828125, -11.662109375, -11.22998046875, -10.7978515625, -10.36572265625, -9.93359375, -9.50146484375, -9.0693359375, -8.63720703125, -8.205078125, -7.77294921875, -7.3408203125, -6.90869140625, -6.4765625, -6.04443359375, -5.6123046875, -5.18017578125, -4.748046875, -4.31591796875, -3.8837890625, -3.45166015625, -3.01953125, -2.58740234375, -2.1552734375, -1.72314453125, -1.291015625, -0.85888671875, -0.4267578125, 0.00537109375, 0.4375, 0.86962890625, 1.3017578125, 1.73388671875, 2.166015625, 2.59814453125, 3.0302734375, 3.46240234375, 3.89453125, 4.32666015625, 4.7587890625, 5.19091796875, 5.623046875, 6.05517578125, 6.4873046875, 6.91943359375, 7.3515625, 7.78369140625, 8.2158203125, 8.64794921875, 9.080078125, 9.51220703125, 9.9443359375, 10.37646484375, 10.80859375, 11.24072265625, 11.6728515625, 12.10498046875, 12.537109375, 12.96923828125, 13.4013671875, 13.83349609375, 14.265625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 4.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 8.0, 10.0, 8.0, 10.0, 8.0, 17.0, 14.0, 14.0, 22.0, 28.0, 21.0, 25.0, 34.0, 37.0, 31.0, 40.0, 45.0, 51.0, 50.0, 41.0, 37.0, 46.0, 37.0, 27.0, 28.0, 33.0, 35.0, 29.0, 37.0, 27.0, 26.0, 18.0, 17.0, 18.0, 16.0, 11.0, 5.0, 9.0, 6.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.9453125, -6.71484375, -6.484375, -6.25390625, -6.0234375, -5.79296875, -5.5625, -5.33203125, -5.1015625, -4.87109375, -4.640625, -4.41015625, -4.1796875, -3.94921875, -3.71875, -3.48828125, -3.2578125, -3.02734375, -2.796875, -2.56640625, -2.3359375, -2.10546875, -1.875, -1.64453125, -1.4140625, -1.18359375, -0.953125, -0.72265625, -0.4921875, -0.26171875, -0.03125, 0.19921875, 0.4296875, 0.66015625, 0.890625, 1.12109375, 1.3515625, 1.58203125, 1.8125, 2.04296875, 2.2734375, 2.50390625, 2.734375, 2.96484375, 3.1953125, 3.42578125, 3.65625, 3.88671875, 4.1171875, 4.34765625, 4.578125, 4.80859375, 5.0390625, 5.26953125, 5.5, 5.73046875, 5.9609375, 6.19140625, 6.421875, 6.65234375, 6.8828125, 7.11328125, 7.34375, 7.57421875, 7.8046875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 8.0, 8.0, 13.0, 25.0, 37.0, 88.0, 206.0, 776.0, 17348.0, 1005975.0, 22775.0, 887.0, 217.0, 93.0, 42.0, 11.0, 15.0, 10.0, 11.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.25, -16.40966796875, -15.5693359375, -14.72900390625, -13.888671875, -13.04833984375, -12.2080078125, -11.36767578125, -10.52734375, -9.68701171875, -8.8466796875, -8.00634765625, -7.166015625, -6.32568359375, -5.4853515625, -4.64501953125, -3.8046875, -2.96435546875, -2.1240234375, -1.28369140625, -0.443359375, 0.39697265625, 1.2373046875, 2.07763671875, 2.91796875, 3.75830078125, 4.5986328125, 5.43896484375, 6.279296875, 7.11962890625, 7.9599609375, 8.80029296875, 9.640625, 10.48095703125, 11.3212890625, 12.16162109375, 13.001953125, 13.84228515625, 14.6826171875, 15.52294921875, 16.36328125, 17.20361328125, 18.0439453125, 18.88427734375, 19.724609375, 20.56494140625, 21.4052734375, 22.24560546875, 23.0859375, 23.92626953125, 24.7666015625, 25.60693359375, 26.447265625, 27.28759765625, 28.1279296875, 28.96826171875, 29.80859375, 30.64892578125, 31.4892578125, 32.32958984375, 33.169921875, 34.01025390625, 34.8505859375, 35.69091796875, 36.53125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 6.0, 4.0, 8.0, 14.0, 11.0, 22.0, 22.0, 31.0, 43.0, 43.0, 62.0, 92.0, 163.0, 129.0, 82.0, 58.0, 51.0, 32.0, 36.0, 20.0, 22.0, 11.0, 6.0, 7.0, 4.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0010175704956054688, -0.0009913444519042969, -0.000965118408203125, -0.0009388923645019531, -0.0009126663208007812, -0.0008864402770996094, -0.0008602142333984375, -0.0008339881896972656, -0.0008077621459960938, -0.0007815361022949219, -0.00075531005859375, -0.0007290840148925781, -0.0007028579711914062, -0.0006766319274902344, -0.0006504058837890625, -0.0006241798400878906, -0.0005979537963867188, -0.0005717277526855469, -0.000545501708984375, -0.0005192756652832031, -0.0004930496215820312, -0.0004668235778808594, -0.0004405975341796875, -0.0004143714904785156, -0.00038814544677734375, -0.0003619194030761719, -0.000335693359375, -0.0003094673156738281, -0.00028324127197265625, -0.0002570152282714844, -0.0002307891845703125, -0.00020456314086914062, -0.00017833709716796875, -0.00015211105346679688, -0.000125885009765625, -9.965896606445312e-05, -7.343292236328125e-05, -4.7206878662109375e-05, -2.09808349609375e-05, 5.245208740234375e-06, 3.147125244140625e-05, 5.7697296142578125e-05, 8.392333984375e-05, 0.00011014938354492188, 0.00013637542724609375, 0.00016260147094726562, 0.0001888275146484375, 0.00021505355834960938, 0.00024127960205078125, 0.0002675056457519531, 0.000293731689453125, 0.0003199577331542969, 0.00034618377685546875, 0.0003724098205566406, 0.0003986358642578125, 0.0004248619079589844, 0.00045108795166015625, 0.0004773139953613281, 0.0005035400390625, 0.0005297660827636719, 0.0005559921264648438, 0.0005822181701660156, 0.0006084442138671875, 0.0006346702575683594, 0.0006608963012695312]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 10.0, 17.0, 36.0, 73.0, 102.0, 277.0, 1274.0, 35294.0, 1003835.0, 6586.0, 609.0, 207.0, 100.0, 46.0, 34.0, 28.0, 18.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.0, -38.92822265625, -37.8564453125, -36.78466796875, -35.712890625, -34.64111328125, -33.5693359375, -32.49755859375, -31.42578125, -30.35400390625, -29.2822265625, -28.21044921875, -27.138671875, -26.06689453125, -24.9951171875, -23.92333984375, -22.8515625, -21.77978515625, -20.7080078125, -19.63623046875, -18.564453125, -17.49267578125, -16.4208984375, -15.34912109375, -14.27734375, -13.20556640625, -12.1337890625, -11.06201171875, -9.990234375, -8.91845703125, -7.8466796875, -6.77490234375, -5.703125, -4.63134765625, -3.5595703125, -2.48779296875, -1.416015625, -0.34423828125, 0.7275390625, 1.79931640625, 2.87109375, 3.94287109375, 5.0146484375, 6.08642578125, 7.158203125, 8.22998046875, 9.3017578125, 10.37353515625, 11.4453125, 12.51708984375, 13.5888671875, 14.66064453125, 15.732421875, 16.80419921875, 17.8759765625, 18.94775390625, 20.01953125, 21.09130859375, 22.1630859375, 23.23486328125, 24.306640625, 25.37841796875, 26.4501953125, 27.52197265625, 28.59375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 17.0, 30.0, 80.0, 188.0, 299.0, 214.0, 96.0, 42.0, 18.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.546875, -9.003173828125, -8.45947265625, -7.915771484375, -7.3720703125, -6.828369140625, -6.28466796875, -5.740966796875, -5.197265625, -4.653564453125, -4.10986328125, -3.566162109375, -3.0224609375, -2.478759765625, -1.93505859375, -1.391357421875, -0.84765625, -0.303955078125, 0.23974609375, 0.783447265625, 1.3271484375, 1.870849609375, 2.41455078125, 2.958251953125, 3.501953125, 4.045654296875, 4.58935546875, 5.133056640625, 5.6767578125, 6.220458984375, 6.76416015625, 7.307861328125, 7.8515625, 8.395263671875, 8.93896484375, 9.482666015625, 10.0263671875, 10.570068359375, 11.11376953125, 11.657470703125, 12.201171875, 12.744873046875, 13.28857421875, 13.832275390625, 14.3759765625, 14.919677734375, 15.46337890625, 16.007080078125, 16.55078125, 17.094482421875, 17.63818359375, 18.181884765625, 18.7255859375, 19.269287109375, 19.81298828125, 20.356689453125, 20.900390625, 21.444091796875, 21.98779296875, 22.531494140625, 23.0751953125, 23.618896484375, 24.16259765625, 24.706298828125, 25.25]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 90.0, 504.0, 368.0, 34.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-264.66839599609375, -253.05661010742188, -241.44482421875, -229.83303833007812, -218.22125244140625, -206.60946655273438, -194.9976806640625, -183.38589477539062, -171.77410888671875, -160.16232299804688, -148.550537109375, -136.93875122070312, -125.32696533203125, -113.71517944335938, -102.1033935546875, -90.49160766601562, -78.87982177734375, -67.26803588867188, -55.65625, -44.044464111328125, -32.43267822265625, -20.820892333984375, -9.2091064453125, 2.402679443359375, 14.01446533203125, 25.626251220703125, 37.238037109375, 48.849822998046875, 60.46160888671875, 72.07339477539062, 83.6851806640625, 95.29696655273438, 106.90875244140625, 118.52053833007812, 130.13232421875, 141.74411010742188, 153.35589599609375, 164.96768188476562, 176.5794677734375, 188.19125366210938, 199.80303955078125, 211.41482543945312, 223.026611328125, 234.63839721679688, 246.25018310546875, 257.8619689941406, 269.4737548828125, 281.0855407714844, 292.69732666015625, 304.3091125488281, 315.9208984375, 327.5326843261719, 339.14447021484375, 350.7562561035156, 362.3680419921875, 373.9798278808594, 385.59161376953125, 397.2033996582031, 408.815185546875, 420.4269714355469, 432.03875732421875, 443.6505432128906, 455.2623291015625, 466.8741149902344, 478.48590087890625]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 5.0, 7.0, 6.0, 2.0, 8.0, 16.0, 6.0, 15.0, 20.0, 17.0, 36.0, 23.0, 27.0, 28.0, 37.0, 29.0, 39.0, 30.0, 29.0, 53.0, 34.0, 36.0, 42.0, 30.0, 45.0, 42.0, 41.0, 25.0, 32.0, 27.0, 21.0, 36.0, 24.0, 22.0, 14.0, 15.0, 20.0, 10.0, 9.0, 6.0, 13.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.45487976074219, -34.274147033691406, -33.09341049194336, -31.912677764892578, -30.731945037841797, -29.551210403442383, -28.37047576904297, -27.189743041992188, -26.009010314941406, -24.828275680541992, -23.64754295349121, -22.466808319091797, -21.286075592041016, -20.1053409576416, -18.924606323242188, -17.743873596191406, -16.563138961791992, -15.382405281066895, -14.201671600341797, -13.020936965942383, -11.840204238891602, -10.659469604492188, -9.47873592376709, -8.298002243041992, -7.1172685623168945, -5.936534881591797, -4.755801200866699, -3.5750670433044434, -2.3943333625793457, -1.213599681854248, -0.03286552429199219, 1.1478681564331055, 2.328601837158203, 3.509335517883301, 4.690069198608398, 5.870803356170654, 7.051537036895752, 8.232271194458008, 9.413004875183105, 10.593738555908203, 11.7744722366333, 12.955205917358398, 14.135939598083496, 15.316673278808594, 16.497407913208008, 17.67814064025879, 18.858875274658203, 20.039608001708984, 21.2203426361084, 22.401077270507812, 23.581809997558594, 24.762544631958008, 25.94327735900879, 27.124011993408203, 28.304744720458984, 29.4854793548584, 30.666213989257812, 31.846948623657227, 33.02768325805664, 34.20841598510742, 35.3891487121582, 36.569881439208984, 37.75061798095703, 38.93135070800781, 40.112083435058594]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 9.0, 11.0, 11.0, 27.0, 33.0, 71.0, 94.0, 162.0, 314.0, 580.0, 1201.0, 2641.0, 6613.0, 19846.0, 79733.0, 633219.0, 3194755.0, 196299.0, 38902.0, 11431.0, 4367.0, 1854.0, 931.0, 446.0, 258.0, 164.0, 98.0, 60.0, 42.0, 21.0, 23.0, 20.0, 12.0, 8.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.0234375, -10.6190185546875, -10.214599609375, -9.8101806640625, -9.40576171875, -9.0013427734375, -8.596923828125, -8.1925048828125, -7.7880859375, -7.3836669921875, -6.979248046875, -6.5748291015625, -6.17041015625, -5.7659912109375, -5.361572265625, -4.9571533203125, -4.552734375, -4.1483154296875, -3.743896484375, -3.3394775390625, -2.93505859375, -2.5306396484375, -2.126220703125, -1.7218017578125, -1.3173828125, -0.9129638671875, -0.508544921875, -0.1041259765625, 0.30029296875, 0.7047119140625, 1.109130859375, 1.5135498046875, 1.91796875, 2.3223876953125, 2.726806640625, 3.1312255859375, 3.53564453125, 3.9400634765625, 4.344482421875, 4.7489013671875, 5.1533203125, 5.5577392578125, 5.962158203125, 6.3665771484375, 6.77099609375, 7.1754150390625, 7.579833984375, 7.9842529296875, 8.388671875, 8.7930908203125, 9.197509765625, 9.6019287109375, 10.00634765625, 10.4107666015625, 10.815185546875, 11.2196044921875, 11.6240234375, 12.0284423828125, 12.432861328125, 12.8372802734375, 13.24169921875, 13.6461181640625, 14.050537109375, 14.4549560546875, 14.859375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 7.0, 4.0, 4.0, 5.0, 3.0, 10.0, 15.0, 16.0, 29.0, 14.0, 35.0, 43.0, 36.0, 44.0, 53.0, 52.0, 52.0, 65.0, 57.0, 49.0, 45.0, 49.0, 53.0, 35.0, 44.0, 35.0, 26.0, 25.0, 13.0, 16.0, 15.0, 11.0, 10.0, 8.0, 7.0, 3.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.36328125, -2.2966461181640625, -2.230010986328125, -2.1633758544921875, -2.09674072265625, -2.0301055908203125, -1.963470458984375, -1.8968353271484375, -1.8302001953125, -1.7635650634765625, -1.696929931640625, -1.6302947998046875, -1.56365966796875, -1.4970245361328125, -1.430389404296875, -1.3637542724609375, -1.297119140625, -1.2304840087890625, -1.163848876953125, -1.0972137451171875, -1.03057861328125, -0.9639434814453125, -0.897308349609375, -0.8306732177734375, -0.7640380859375, -0.6974029541015625, -0.630767822265625, -0.5641326904296875, -0.49749755859375, -0.4308624267578125, -0.364227294921875, -0.2975921630859375, -0.23095703125, -0.1643218994140625, -0.097686767578125, -0.0310516357421875, 0.03558349609375, 0.1022186279296875, 0.168853759765625, 0.2354888916015625, 0.3021240234375, 0.3687591552734375, 0.435394287109375, 0.5020294189453125, 0.56866455078125, 0.6352996826171875, 0.701934814453125, 0.7685699462890625, 0.835205078125, 0.9018402099609375, 0.968475341796875, 1.0351104736328125, 1.10174560546875, 1.1683807373046875, 1.235015869140625, 1.3016510009765625, 1.3682861328125, 1.4349212646484375, 1.501556396484375, 1.5681915283203125, 1.63482666015625, 1.7014617919921875, 1.768096923828125, 1.8347320556640625, 1.9013671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 5.0, 13.0, 11.0, 26.0, 33.0, 42.0, 63.0, 78.0, 154.0, 226.0, 335.0, 548.0, 921.0, 1628.0, 3058.0, 6295.0, 14281.0, 36835.0, 112637.0, 476376.0, 2752271.0, 585670.0, 131035.0, 41635.0, 15707.0, 6723.0, 3252.0, 1766.0, 947.0, 597.0, 374.0, 257.0, 152.0, 91.0, 67.0, 50.0, 33.0, 22.0, 16.0, 8.0, 11.0, 7.0, 9.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.87890625, -6.64617919921875, -6.4134521484375, -6.18072509765625, -5.947998046875, -5.71527099609375, -5.4825439453125, -5.24981689453125, -5.01708984375, -4.78436279296875, -4.5516357421875, -4.31890869140625, -4.086181640625, -3.85345458984375, -3.6207275390625, -3.38800048828125, -3.1552734375, -2.92254638671875, -2.6898193359375, -2.45709228515625, -2.224365234375, -1.99163818359375, -1.7589111328125, -1.52618408203125, -1.29345703125, -1.06072998046875, -0.8280029296875, -0.59527587890625, -0.362548828125, -0.12982177734375, 0.1029052734375, 0.33563232421875, 0.568359375, 0.80108642578125, 1.0338134765625, 1.26654052734375, 1.499267578125, 1.73199462890625, 1.9647216796875, 2.19744873046875, 2.43017578125, 2.66290283203125, 2.8956298828125, 3.12835693359375, 3.361083984375, 3.59381103515625, 3.8265380859375, 4.05926513671875, 4.2919921875, 4.52471923828125, 4.7574462890625, 4.99017333984375, 5.222900390625, 5.45562744140625, 5.6883544921875, 5.92108154296875, 6.15380859375, 6.38653564453125, 6.6192626953125, 6.85198974609375, 7.084716796875, 7.31744384765625, 7.5501708984375, 7.78289794921875, 8.015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 7.0, 3.0, 6.0, 6.0, 9.0, 20.0, 13.0, 38.0, 45.0, 69.0, 95.0, 196.0, 360.0, 706.0, 1268.0, 523.0, 261.0, 162.0, 97.0, 62.0, 36.0, 25.0, 31.0, 13.0, 7.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3515625, -4.18621826171875, -4.0208740234375, -3.85552978515625, -3.690185546875, -3.52484130859375, -3.3594970703125, -3.19415283203125, -3.02880859375, -2.86346435546875, -2.6981201171875, -2.53277587890625, -2.367431640625, -2.20208740234375, -2.0367431640625, -1.87139892578125, -1.7060546875, -1.54071044921875, -1.3753662109375, -1.21002197265625, -1.044677734375, -0.87933349609375, -0.7139892578125, -0.54864501953125, -0.38330078125, -0.21795654296875, -0.0526123046875, 0.11273193359375, 0.278076171875, 0.44342041015625, 0.6087646484375, 0.77410888671875, 0.939453125, 1.10479736328125, 1.2701416015625, 1.43548583984375, 1.600830078125, 1.76617431640625, 1.9315185546875, 2.09686279296875, 2.26220703125, 2.42755126953125, 2.5928955078125, 2.75823974609375, 2.923583984375, 3.08892822265625, 3.2542724609375, 3.41961669921875, 3.5849609375, 3.75030517578125, 3.9156494140625, 4.08099365234375, 4.246337890625, 4.41168212890625, 4.5770263671875, 4.74237060546875, 4.90771484375, 5.07305908203125, 5.2384033203125, 5.40374755859375, 5.569091796875, 5.73443603515625, 5.8997802734375, 6.06512451171875, 6.23046875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 17.0, 64.0, 141.0, 206.0, 222.0, 173.0, 100.0, 41.0, 22.0, 9.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.925148010253906, -52.00737380981445, -50.089599609375, -48.17182159423828, -46.25404739379883, -44.336273193359375, -42.41849899291992, -40.50072479248047, -38.582950592041016, -36.66517639160156, -34.74740219116211, -32.829627990722656, -30.91185188293457, -28.994075775146484, -27.07630157470703, -25.158527374267578, -23.240751266479492, -21.32297706604004, -19.405200958251953, -17.4874267578125, -15.569652557373047, -13.651877403259277, -11.734102249145508, -9.816328048706055, -7.898552894592285, -5.980778217315674, -4.0630035400390625, -2.145228385925293, -0.22745370864868164, 1.6903209686279297, 3.608096122741699, 5.525870323181152, 7.443645477294922, 9.361420631408691, 11.279194831848145, 13.196969985961914, 15.114744186401367, 17.032520294189453, 18.950294494628906, 20.86806869506836, 22.785842895507812, 24.703617095947266, 26.62139320373535, 28.539167404174805, 30.456941604614258, 32.374717712402344, 34.2924919128418, 36.21026611328125, 38.12804412841797, 40.04581832885742, 41.963592529296875, 43.881370544433594, 45.79914474487305, 47.7169189453125, 49.63469314575195, 51.552467346191406, 53.47024154663086, 55.38801574707031, 57.305789947509766, 59.22356414794922, 61.14134216308594, 63.05911636352539, 64.97689056396484, 66.89466857910156, 68.81243896484375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 9.0, 9.0, 12.0, 16.0, 17.0, 19.0, 28.0, 23.0, 35.0, 33.0, 35.0, 42.0, 42.0, 47.0, 55.0, 40.0, 49.0, 48.0, 45.0, 58.0, 27.0, 43.0, 24.0, 30.0, 28.0, 29.0, 29.0, 27.0, 19.0, 16.0, 12.0, 10.0, 6.0, 7.0, 4.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.17355728149414, -15.631606101989746, -15.089654922485352, -14.547703742980957, -14.005752563476562, -13.463801383972168, -12.921850204467773, -12.379898071289062, -11.837947845458984, -11.29599666595459, -10.754045486450195, -10.2120943069458, -9.670143127441406, -9.128191947937012, -8.586240768432617, -8.044288635253906, -7.502337455749512, -6.960386276245117, -6.418435096740723, -5.876483917236328, -5.334532737731934, -4.792581558227539, -4.250629901885986, -3.708678722381592, -3.1667275428771973, -2.6247763633728027, -2.082825183868408, -1.5408737659454346, -0.99892258644104, -0.4569714069366455, 0.08498001098632812, 0.6269311904907227, 1.1688823699951172, 1.7108335494995117, 2.2527847290039062, 2.79473614692688, 3.3366873264312744, 3.878638505935669, 4.420589923858643, 4.962541103363037, 5.504492282867432, 6.046443462371826, 6.588394641876221, 7.130346298217773, 7.672297477722168, 8.214248657226562, 8.756199836730957, 9.298151016235352, 9.840102195739746, 10.38205337524414, 10.924004554748535, 11.46595573425293, 12.007906913757324, 12.549858093261719, 13.09181022644043, 13.633760452270508, 14.175712585449219, 14.717663764953613, 15.259614944458008, 15.801566123962402, 16.343517303466797, 16.885469436645508, 17.427419662475586, 17.969371795654297, 18.511322021484375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 10.0, 9.0, 7.0, 11.0, 32.0, 36.0, 58.0, 100.0, 161.0, 273.0, 427.0, 909.0, 1897.0, 4312.0, 10912.0, 30168.0, 91742.0, 258401.0, 372018.0, 181608.0, 60736.0, 20778.0, 7653.0, 3148.0, 1438.0, 717.0, 393.0, 224.0, 134.0, 85.0, 48.0, 38.0, 24.0, 10.0, 17.0, 2.0, 7.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4296875, -8.12109375, -7.8125, -7.50390625, -7.1953125, -6.88671875, -6.578125, -6.26953125, -5.9609375, -5.65234375, -5.34375, -5.03515625, -4.7265625, -4.41796875, -4.109375, -3.80078125, -3.4921875, -3.18359375, -2.875, -2.56640625, -2.2578125, -1.94921875, -1.640625, -1.33203125, -1.0234375, -0.71484375, -0.40625, -0.09765625, 0.2109375, 0.51953125, 0.828125, 1.13671875, 1.4453125, 1.75390625, 2.0625, 2.37109375, 2.6796875, 2.98828125, 3.296875, 3.60546875, 3.9140625, 4.22265625, 4.53125, 4.83984375, 5.1484375, 5.45703125, 5.765625, 6.07421875, 6.3828125, 6.69140625, 7.0, 7.30859375, 7.6171875, 7.92578125, 8.234375, 8.54296875, 8.8515625, 9.16015625, 9.46875, 9.77734375, 10.0859375, 10.39453125, 10.703125, 11.01171875, 11.3203125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 8.0, 8.0, 12.0, 18.0, 23.0, 23.0, 30.0, 46.0, 39.0, 49.0, 37.0, 49.0, 46.0, 53.0, 45.0, 51.0, 62.0, 58.0, 43.0, 42.0, 28.0, 32.0, 33.0, 32.0, 19.0, 17.0, 15.0, 15.0, 10.0, 12.0, 6.0, 2.0, 6.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-2.498046875, -2.428314208984375, -2.35858154296875, -2.288848876953125, -2.2191162109375, -2.149383544921875, -2.07965087890625, -2.009918212890625, -1.940185546875, -1.870452880859375, -1.80072021484375, -1.730987548828125, -1.6612548828125, -1.591522216796875, -1.52178955078125, -1.452056884765625, -1.38232421875, -1.312591552734375, -1.24285888671875, -1.173126220703125, -1.1033935546875, -1.033660888671875, -0.96392822265625, -0.894195556640625, -0.824462890625, -0.754730224609375, -0.68499755859375, -0.615264892578125, -0.5455322265625, -0.475799560546875, -0.40606689453125, -0.336334228515625, -0.2666015625, -0.196868896484375, -0.12713623046875, -0.057403564453125, 0.0123291015625, 0.082061767578125, 0.15179443359375, 0.221527099609375, 0.291259765625, 0.360992431640625, 0.43072509765625, 0.500457763671875, 0.5701904296875, 0.639923095703125, 0.70965576171875, 0.779388427734375, 0.84912109375, 0.918853759765625, 0.98858642578125, 1.058319091796875, 1.1280517578125, 1.197784423828125, 1.26751708984375, 1.337249755859375, 1.406982421875, 1.476715087890625, 1.54644775390625, 1.616180419921875, 1.6859130859375, 1.755645751953125, 1.82537841796875, 1.895111083984375, 1.96484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 0.0, 5.0, 4.0, 3.0, 5.0, 8.0, 6.0, 17.0, 18.0, 27.0, 33.0, 39.0, 57.0, 59.0, 77.0, 116.0, 151.0, 174.0, 208.0, 354.0, 469.0, 727.0, 1285.0, 3080.0, 11619.0, 67514.0, 430131.0, 442980.0, 70207.0, 12103.0, 3063.0, 1334.0, 785.0, 507.0, 313.0, 232.0, 198.0, 149.0, 114.0, 99.0, 71.0, 52.0, 37.0, 25.0, 27.0, 17.0, 18.0, 13.0, 7.0, 9.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-13.7265625, -13.283935546875, -12.84130859375, -12.398681640625, -11.9560546875, -11.513427734375, -11.07080078125, -10.628173828125, -10.185546875, -9.742919921875, -9.30029296875, -8.857666015625, -8.4150390625, -7.972412109375, -7.52978515625, -7.087158203125, -6.64453125, -6.201904296875, -5.75927734375, -5.316650390625, -4.8740234375, -4.431396484375, -3.98876953125, -3.546142578125, -3.103515625, -2.660888671875, -2.21826171875, -1.775634765625, -1.3330078125, -0.890380859375, -0.44775390625, -0.005126953125, 0.4375, 0.880126953125, 1.32275390625, 1.765380859375, 2.2080078125, 2.650634765625, 3.09326171875, 3.535888671875, 3.978515625, 4.421142578125, 4.86376953125, 5.306396484375, 5.7490234375, 6.191650390625, 6.63427734375, 7.076904296875, 7.51953125, 7.962158203125, 8.40478515625, 8.847412109375, 9.2900390625, 9.732666015625, 10.17529296875, 10.617919921875, 11.060546875, 11.503173828125, 11.94580078125, 12.388427734375, 12.8310546875, 13.273681640625, 13.71630859375, 14.158935546875, 14.6015625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 5.0, 7.0, 7.0, 11.0, 6.0, 17.0, 12.0, 17.0, 20.0, 22.0, 30.0, 29.0, 24.0, 44.0, 38.0, 41.0, 33.0, 45.0, 39.0, 37.0, 41.0, 54.0, 51.0, 46.0, 38.0, 38.0, 35.0, 27.0, 27.0, 26.0, 27.0, 22.0, 13.0, 16.0, 10.0, 9.0, 5.0, 7.0, 6.0, 4.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0703125, -7.7738037109375, -7.477294921875, -7.1807861328125, -6.88427734375, -6.5877685546875, -6.291259765625, -5.9947509765625, -5.6982421875, -5.4017333984375, -5.105224609375, -4.8087158203125, -4.51220703125, -4.2156982421875, -3.919189453125, -3.6226806640625, -3.326171875, -3.0296630859375, -2.733154296875, -2.4366455078125, -2.14013671875, -1.8436279296875, -1.547119140625, -1.2506103515625, -0.9541015625, -0.6575927734375, -0.361083984375, -0.0645751953125, 0.23193359375, 0.5284423828125, 0.824951171875, 1.1214599609375, 1.41796875, 1.7144775390625, 2.010986328125, 2.3074951171875, 2.60400390625, 2.9005126953125, 3.197021484375, 3.4935302734375, 3.7900390625, 4.0865478515625, 4.383056640625, 4.6795654296875, 4.97607421875, 5.2725830078125, 5.569091796875, 5.8656005859375, 6.162109375, 6.4586181640625, 6.755126953125, 7.0516357421875, 7.34814453125, 7.6446533203125, 7.941162109375, 8.2376708984375, 8.5341796875, 8.8306884765625, 9.127197265625, 9.4237060546875, 9.72021484375, 10.0167236328125, 10.313232421875, 10.6097412109375, 10.90625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 1.0, 4.0, 11.0, 8.0, 7.0, 26.0, 35.0, 83.0, 203.0, 542.0, 2439.0, 21764.0, 381120.0, 600378.0, 37199.0, 3621.0, 672.0, 226.0, 85.0, 47.0, 27.0, 11.0, 14.0, 11.0, 6.0, 9.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.5703125, -9.229736328125, -8.88916015625, -8.548583984375, -8.2080078125, -7.867431640625, -7.52685546875, -7.186279296875, -6.845703125, -6.505126953125, -6.16455078125, -5.823974609375, -5.4833984375, -5.142822265625, -4.80224609375, -4.461669921875, -4.12109375, -3.780517578125, -3.43994140625, -3.099365234375, -2.7587890625, -2.418212890625, -2.07763671875, -1.737060546875, -1.396484375, -1.055908203125, -0.71533203125, -0.374755859375, -0.0341796875, 0.306396484375, 0.64697265625, 0.987548828125, 1.328125, 1.668701171875, 2.00927734375, 2.349853515625, 2.6904296875, 3.031005859375, 3.37158203125, 3.712158203125, 4.052734375, 4.393310546875, 4.73388671875, 5.074462890625, 5.4150390625, 5.755615234375, 6.09619140625, 6.436767578125, 6.77734375, 7.117919921875, 7.45849609375, 7.799072265625, 8.1396484375, 8.480224609375, 8.82080078125, 9.161376953125, 9.501953125, 9.842529296875, 10.18310546875, 10.523681640625, 10.8642578125, 11.204833984375, 11.54541015625, 11.885986328125, 12.2265625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 6.0, 9.0, 6.0, 9.0, 16.0, 19.0, 25.0, 29.0, 36.0, 51.0, 45.0, 53.0, 51.0, 72.0, 84.0, 85.0, 77.0, 55.0, 66.0, 34.0, 33.0, 27.0, 22.0, 23.0, 16.0, 8.0, 9.0, 10.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007224082946777344, -0.0007015466690063477, -0.0006806850433349609, -0.0006598234176635742, -0.0006389617919921875, -0.0006181001663208008, -0.0005972385406494141, -0.0005763769149780273, -0.0005555152893066406, -0.0005346536636352539, -0.0005137920379638672, -0.0004929304122924805, -0.00047206878662109375, -0.00045120716094970703, -0.0004303455352783203, -0.0004094839096069336, -0.0003886222839355469, -0.00036776065826416016, -0.00034689903259277344, -0.0003260374069213867, -0.00030517578125, -0.0002843141555786133, -0.00026345252990722656, -0.00024259090423583984, -0.00022172927856445312, -0.0002008676528930664, -0.0001800060272216797, -0.00015914440155029297, -0.00013828277587890625, -0.00011742115020751953, -9.655952453613281e-05, -7.56978988647461e-05, -5.4836273193359375e-05, -3.3974647521972656e-05, -1.3113021850585938e-05, 7.748603820800781e-06, 2.86102294921875e-05, 4.947185516357422e-05, 7.033348083496094e-05, 9.119510650634766e-05, 0.00011205673217773438, 0.0001329183578491211, 0.0001537799835205078, 0.00017464160919189453, 0.00019550323486328125, 0.00021636486053466797, 0.0002372264862060547, 0.0002580881118774414, 0.0002789497375488281, 0.00029981136322021484, 0.00032067298889160156, 0.0003415346145629883, 0.000362396240234375, 0.0003832578659057617, 0.00040411949157714844, 0.00042498111724853516, 0.0004458427429199219, 0.0004667043685913086, 0.0004875659942626953, 0.000508427619934082, 0.0005292892456054688, 0.0005501508712768555, 0.0005710124969482422, 0.0005918741226196289, 0.0006127357482910156]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 8.0, 6.0, 5.0, 17.0, 20.0, 18.0, 30.0, 53.0, 48.0, 90.0, 123.0, 222.0, 317.0, 557.0, 1060.0, 2570.0, 8877.0, 54462.0, 431681.0, 471997.0, 61314.0, 9776.0, 2631.0, 1144.0, 538.0, 340.0, 207.0, 143.0, 101.0, 45.0, 50.0, 34.0, 20.0, 12.0, 9.0, 8.0, 3.0, 13.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.5234375, -8.286865234375, -8.05029296875, -7.813720703125, -7.5771484375, -7.340576171875, -7.10400390625, -6.867431640625, -6.630859375, -6.394287109375, -6.15771484375, -5.921142578125, -5.6845703125, -5.447998046875, -5.21142578125, -4.974853515625, -4.73828125, -4.501708984375, -4.26513671875, -4.028564453125, -3.7919921875, -3.555419921875, -3.31884765625, -3.082275390625, -2.845703125, -2.609130859375, -2.37255859375, -2.135986328125, -1.8994140625, -1.662841796875, -1.42626953125, -1.189697265625, -0.953125, -0.716552734375, -0.47998046875, -0.243408203125, -0.0068359375, 0.229736328125, 0.46630859375, 0.702880859375, 0.939453125, 1.176025390625, 1.41259765625, 1.649169921875, 1.8857421875, 2.122314453125, 2.35888671875, 2.595458984375, 2.83203125, 3.068603515625, 3.30517578125, 3.541748046875, 3.7783203125, 4.014892578125, 4.25146484375, 4.488037109375, 4.724609375, 4.961181640625, 5.19775390625, 5.434326171875, 5.6708984375, 5.907470703125, 6.14404296875, 6.380615234375, 6.6171875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 7.0, 2.0, 3.0, 3.0, 4.0, 9.0, 11.0, 18.0, 15.0, 28.0, 23.0, 27.0, 29.0, 46.0, 53.0, 74.0, 57.0, 74.0, 66.0, 64.0, 70.0, 47.0, 67.0, 41.0, 27.0, 28.0, 30.0, 20.0, 19.0, 9.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.91015625, -4.779266357421875, -4.64837646484375, -4.517486572265625, -4.3865966796875, -4.255706787109375, -4.12481689453125, -3.993927001953125, -3.863037109375, -3.732147216796875, -3.60125732421875, -3.470367431640625, -3.3394775390625, -3.208587646484375, -3.07769775390625, -2.946807861328125, -2.81591796875, -2.685028076171875, -2.55413818359375, -2.423248291015625, -2.2923583984375, -2.161468505859375, -2.03057861328125, -1.899688720703125, -1.768798828125, -1.637908935546875, -1.50701904296875, -1.376129150390625, -1.2452392578125, -1.114349365234375, -0.98345947265625, -0.852569580078125, -0.7216796875, -0.590789794921875, -0.45989990234375, -0.329010009765625, -0.1981201171875, -0.067230224609375, 0.06365966796875, 0.194549560546875, 0.325439453125, 0.456329345703125, 0.58721923828125, 0.718109130859375, 0.8489990234375, 0.979888916015625, 1.11077880859375, 1.241668701171875, 1.37255859375, 1.503448486328125, 1.63433837890625, 1.765228271484375, 1.8961181640625, 2.027008056640625, 2.15789794921875, 2.288787841796875, 2.419677734375, 2.550567626953125, 2.68145751953125, 2.812347412109375, 2.9432373046875, 3.074127197265625, 3.20501708984375, 3.335906982421875, 3.466796875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 9.0, 11.0, 24.0, 48.0, 93.0, 140.0, 174.0, 159.0, 152.0, 90.0, 44.0, 34.0, 18.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.52593231201172, -37.353511810302734, -34.181095123291016, -31.00867462158203, -27.83625602722168, -24.663837432861328, -21.491416931152344, -18.318998336791992, -15.14657974243164, -11.974161148071289, -8.801741600036621, -5.629322052001953, -2.4569034576416016, 0.71551513671875, 3.8879356384277344, 7.060354232788086, 10.232772827148438, 13.405191421508789, 16.57761001586914, 19.750030517578125, 22.922449111938477, 26.094867706298828, 29.267288208007812, 32.43970489501953, 35.612125396728516, 38.7845458984375, 41.95696258544922, 45.1293830871582, 48.30180358886719, 51.474220275878906, 54.64664077758789, 57.819061279296875, 60.991485595703125, 64.16390228271484, 67.3363265991211, 70.50874328613281, 73.68115997314453, 76.85357666015625, 80.0260009765625, 83.19841766357422, 86.37083435058594, 89.54325103759766, 92.7156753540039, 95.88809204101562, 99.06050872802734, 102.23292541503906, 105.40534973144531, 108.57776641845703, 111.75019073486328, 114.922607421875, 118.09503173828125, 121.26744842529297, 124.43986511230469, 127.61228942871094, 130.78469848632812, 133.95712280273438, 137.12954711914062, 140.30197143554688, 143.47438049316406, 146.6468048095703, 149.81922912597656, 152.99163818359375, 156.1640625, 159.33648681640625, 162.50889587402344]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 6.0, 5.0, 11.0, 12.0, 11.0, 11.0, 10.0, 19.0, 22.0, 34.0, 32.0, 29.0, 51.0, 41.0, 43.0, 49.0, 42.0, 47.0, 43.0, 53.0, 52.0, 39.0, 42.0, 32.0, 42.0, 36.0, 31.0, 26.0, 21.0, 22.0, 13.0, 18.0, 15.0, 9.0, 10.0, 10.0, 6.0, 3.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.214202880859375, -51.633819580078125, -50.053436279296875, -48.473052978515625, -46.892669677734375, -45.31228256225586, -43.73189926147461, -42.15151596069336, -40.57113265991211, -38.99074935913086, -37.41036605834961, -35.82998275756836, -34.249595642089844, -32.669212341308594, -31.088829040527344, -29.508445739746094, -27.928062438964844, -26.347679138183594, -24.767295837402344, -23.18691062927246, -21.60652732849121, -20.02614402770996, -18.445758819580078, -16.865375518798828, -15.284992218017578, -13.704608917236328, -12.124224662780762, -10.543840408325195, -8.963457107543945, -7.383073329925537, -5.802689552307129, -4.2223052978515625, -2.6419219970703125, -1.0615382194519043, 0.5188455581665039, 2.099229335784912, 3.6796131134033203, 5.2599968910217285, 6.840380668640137, 8.420764923095703, 10.001148223876953, 11.581531524658203, 13.16191577911377, 14.742300033569336, 16.322683334350586, 17.903066635131836, 19.48345184326172, 21.06383514404297, 22.64421844482422, 24.22460174560547, 25.80498504638672, 27.3853702545166, 28.96575355529785, 30.5461368560791, 32.126522064208984, 33.706905364990234, 35.287288665771484, 36.867671966552734, 38.448055267333984, 40.028438568115234, 41.60882568359375, 43.189208984375, 44.76959228515625, 46.3499755859375, 47.93035888671875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 6.0, 6.0, 12.0, 18.0, 22.0, 34.0, 51.0, 88.0, 141.0, 241.0, 529.0, 1124.0, 3159.0, 13661.0, 187536.0, 3947898.0, 30919.0, 5566.0, 1718.0, 712.0, 328.0, 188.0, 114.0, 76.0, 43.0, 32.0, 17.0, 8.0, 12.0, 9.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.4375, -19.626708984375, -18.81591796875, -18.005126953125, -17.1943359375, -16.383544921875, -15.57275390625, -14.761962890625, -13.951171875, -13.140380859375, -12.32958984375, -11.518798828125, -10.7080078125, -9.897216796875, -9.08642578125, -8.275634765625, -7.46484375, -6.654052734375, -5.84326171875, -5.032470703125, -4.2216796875, -3.410888671875, -2.60009765625, -1.789306640625, -0.978515625, -0.167724609375, 0.64306640625, 1.453857421875, 2.2646484375, 3.075439453125, 3.88623046875, 4.697021484375, 5.5078125, 6.318603515625, 7.12939453125, 7.940185546875, 8.7509765625, 9.561767578125, 10.37255859375, 11.183349609375, 11.994140625, 12.804931640625, 13.61572265625, 14.426513671875, 15.2373046875, 16.048095703125, 16.85888671875, 17.669677734375, 18.48046875, 19.291259765625, 20.10205078125, 20.912841796875, 21.7236328125, 22.534423828125, 23.34521484375, 24.156005859375, 24.966796875, 25.777587890625, 26.58837890625, 27.399169921875, 28.2099609375, 29.020751953125, 29.83154296875, 30.642333984375, 31.453125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 8.0, 3.0, 7.0, 8.0, 5.0, 7.0, 8.0, 12.0, 12.0, 28.0, 28.0, 27.0, 37.0, 38.0, 49.0, 51.0, 53.0, 48.0, 49.0, 53.0, 52.0, 43.0, 36.0, 46.0, 42.0, 31.0, 36.0, 31.0, 21.0, 27.0, 18.0, 19.0, 13.0, 14.0, 12.0, 10.0, 10.0, 4.0, 2.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.625, -2.549560546875, -2.47412109375, -2.398681640625, -2.3232421875, -2.247802734375, -2.17236328125, -2.096923828125, -2.021484375, -1.946044921875, -1.87060546875, -1.795166015625, -1.7197265625, -1.644287109375, -1.56884765625, -1.493408203125, -1.41796875, -1.342529296875, -1.26708984375, -1.191650390625, -1.1162109375, -1.040771484375, -0.96533203125, -0.889892578125, -0.814453125, -0.739013671875, -0.66357421875, -0.588134765625, -0.5126953125, -0.437255859375, -0.36181640625, -0.286376953125, -0.2109375, -0.135498046875, -0.06005859375, 0.015380859375, 0.0908203125, 0.166259765625, 0.24169921875, 0.317138671875, 0.392578125, 0.468017578125, 0.54345703125, 0.618896484375, 0.6943359375, 0.769775390625, 0.84521484375, 0.920654296875, 0.99609375, 1.071533203125, 1.14697265625, 1.222412109375, 1.2978515625, 1.373291015625, 1.44873046875, 1.524169921875, 1.599609375, 1.675048828125, 1.75048828125, 1.825927734375, 1.9013671875, 1.976806640625, 2.05224609375, 2.127685546875, 2.203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 9.0, 5.0, 13.0, 18.0, 23.0, 32.0, 42.0, 47.0, 74.0, 93.0, 150.0, 192.0, 317.0, 479.0, 709.0, 1134.0, 1954.0, 3432.0, 6593.0, 14675.0, 41752.0, 206909.0, 3690713.0, 160885.0, 36294.0, 13495.0, 6218.0, 3114.0, 1796.0, 1066.0, 713.0, 440.0, 262.0, 184.0, 136.0, 84.0, 66.0, 38.0, 38.0, 17.0, 19.0, 12.0, 10.0, 8.0, 7.0, 6.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0859375, -7.8203125, -7.5546875, -7.2890625, -7.0234375, -6.7578125, -6.4921875, -6.2265625, -5.9609375, -5.6953125, -5.4296875, -5.1640625, -4.8984375, -4.6328125, -4.3671875, -4.1015625, -3.8359375, -3.5703125, -3.3046875, -3.0390625, -2.7734375, -2.5078125, -2.2421875, -1.9765625, -1.7109375, -1.4453125, -1.1796875, -0.9140625, -0.6484375, -0.3828125, -0.1171875, 0.1484375, 0.4140625, 0.6796875, 0.9453125, 1.2109375, 1.4765625, 1.7421875, 2.0078125, 2.2734375, 2.5390625, 2.8046875, 3.0703125, 3.3359375, 3.6015625, 3.8671875, 4.1328125, 4.3984375, 4.6640625, 4.9296875, 5.1953125, 5.4609375, 5.7265625, 5.9921875, 6.2578125, 6.5234375, 6.7890625, 7.0546875, 7.3203125, 7.5859375, 7.8515625, 8.1171875, 8.3828125, 8.6484375, 8.9140625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 6.0, 6.0, 9.0, 15.0, 13.0, 19.0, 20.0, 53.0, 98.0, 172.0, 482.0, 2619.0, 227.0, 126.0, 61.0, 34.0, 29.0, 27.0, 13.0, 11.0, 2.0, 4.0, 9.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05859375, -1.998443603515625, -1.93829345703125, -1.878143310546875, -1.8179931640625, -1.757843017578125, -1.69769287109375, -1.637542724609375, -1.577392578125, -1.517242431640625, -1.45709228515625, -1.396942138671875, -1.3367919921875, -1.276641845703125, -1.21649169921875, -1.156341552734375, -1.09619140625, -1.036041259765625, -0.97589111328125, -0.915740966796875, -0.8555908203125, -0.795440673828125, -0.73529052734375, -0.675140380859375, -0.614990234375, -0.554840087890625, -0.49468994140625, -0.434539794921875, -0.3743896484375, -0.314239501953125, -0.25408935546875, -0.193939208984375, -0.1337890625, -0.073638916015625, -0.01348876953125, 0.046661376953125, 0.1068115234375, 0.166961669921875, 0.22711181640625, 0.287261962890625, 0.347412109375, 0.407562255859375, 0.46771240234375, 0.527862548828125, 0.5880126953125, 0.648162841796875, 0.70831298828125, 0.768463134765625, 0.82861328125, 0.888763427734375, 0.94891357421875, 1.009063720703125, 1.0692138671875, 1.129364013671875, 1.18951416015625, 1.249664306640625, 1.309814453125, 1.369964599609375, 1.43011474609375, 1.490264892578125, 1.5504150390625, 1.610565185546875, 1.67071533203125, 1.730865478515625, 1.791015625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 10.0, 8.0, 17.0, 34.0, 48.0, 72.0, 91.0, 115.0, 140.0, 95.0, 115.0, 78.0, 64.0, 46.0, 26.0, 10.0, 12.0, 8.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.410139083862305, -11.070477485656738, -10.730814933776855, -10.391153335571289, -10.051491737365723, -9.711830139160156, -9.372167587280273, -9.032505989074707, -8.69284439086914, -8.353182792663574, -8.013520240783691, -7.673858642578125, -7.334197044372559, -6.994534969329834, -6.654872894287109, -6.315211296081543, -5.97554874420166, -5.6358866691589355, -5.296225070953369, -4.9565629959106445, -4.616901397705078, -4.2772393226623535, -3.937577247619629, -3.5979154109954834, -3.258253574371338, -2.9185917377471924, -2.578929901123047, -2.2392678260803223, -1.8996059894561768, -1.5599441528320312, -1.2202820777893066, -0.8806202411651611, -0.5409584045410156, -0.20129650831222534, 0.13836538791656494, 0.47802734375, 0.8176891803741455, 1.157351016998291, 1.4970130920410156, 1.8366749286651611, 2.1763367652893066, 2.515998601913452, 2.8556604385375977, 3.1953225135803223, 3.5349843502044678, 3.8746461868286133, 4.214308261871338, 4.5539703369140625, 4.893631935119629, 5.2332940101623535, 5.57295560836792, 5.9126176834106445, 6.252279281616211, 6.5919413566589355, 6.93160343170166, 7.271265029907227, 7.610927104949951, 7.950589179992676, 8.290250778198242, 8.629913330078125, 8.969574928283691, 9.309236526489258, 9.64889907836914, 9.988560676574707, 10.328222274780273]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 7.0, 11.0, 18.0, 14.0, 24.0, 23.0, 23.0, 25.0, 23.0, 38.0, 27.0, 32.0, 31.0, 36.0, 47.0, 55.0, 47.0, 53.0, 36.0, 52.0, 41.0, 33.0, 33.0, 43.0, 21.0, 46.0, 28.0, 18.0, 22.0, 16.0, 13.0, 11.0, 5.0, 2.0, 5.0, 7.0, 8.0, 5.0, 4.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.415430068969727, -4.279882907867432, -4.144335746765137, -4.008788585662842, -3.873241424560547, -3.737694263458252, -3.602147340774536, -3.466600179672241, -3.3310530185699463, -3.1955058574676514, -3.0599586963653564, -2.9244115352630615, -2.7888646125793457, -2.653317451477051, -2.517770290374756, -2.382223129272461, -2.246675968170166, -2.111128807067871, -1.9755816459655762, -1.8400346040725708, -1.7044874429702759, -1.568940281867981, -1.4333932399749756, -1.2978460788726807, -1.1622989177703857, -1.0267517566680908, -0.8912046551704407, -0.7556575536727905, -0.6201103925704956, -0.4845632314682007, -0.34901612997055054, -0.2134690284729004, -0.07792186737060547, 0.057625263929367065, 0.1931723952293396, 0.32871952652931213, 0.46426665782928467, 0.5998138189315796, 0.7353609204292297, 0.8709080219268799, 1.0064551830291748, 1.1420023441314697, 1.2775495052337646, 1.41309654712677, 1.548643708229065, 1.6841908693313599, 1.8197379112243652, 1.9552850723266602, 2.090832233428955, 2.22637939453125, 2.361926555633545, 2.49747371673584, 2.6330208778381348, 2.7685680389404297, 2.9041149616241455, 3.0396621227264404, 3.1752092838287354, 3.3107564449310303, 3.446303606033325, 3.58185076713562, 3.717397689819336, 3.852944850921631, 3.988492012023926, 4.124039173126221, 4.259586334228516]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 14.0, 8.0, 18.0, 30.0, 44.0, 63.0, 83.0, 173.0, 289.0, 557.0, 988.0, 2307.0, 5515.0, 14224.0, 38736.0, 106931.0, 247877.0, 321451.0, 190615.0, 74384.0, 26766.0, 9928.0, 4001.0, 1676.0, 867.0, 413.0, 229.0, 144.0, 83.0, 61.0, 19.0, 21.0, 15.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.93359375, -5.67913818359375, -5.4246826171875, -5.17022705078125, -4.915771484375, -4.66131591796875, -4.4068603515625, -4.15240478515625, -3.89794921875, -3.64349365234375, -3.3890380859375, -3.13458251953125, -2.880126953125, -2.62567138671875, -2.3712158203125, -2.11676025390625, -1.8623046875, -1.60784912109375, -1.3533935546875, -1.09893798828125, -0.844482421875, -0.59002685546875, -0.3355712890625, -0.08111572265625, 0.17333984375, 0.42779541015625, 0.6822509765625, 0.93670654296875, 1.191162109375, 1.44561767578125, 1.7000732421875, 1.95452880859375, 2.208984375, 2.46343994140625, 2.7178955078125, 2.97235107421875, 3.226806640625, 3.48126220703125, 3.7357177734375, 3.99017333984375, 4.24462890625, 4.49908447265625, 4.7535400390625, 5.00799560546875, 5.262451171875, 5.51690673828125, 5.7713623046875, 6.02581787109375, 6.2802734375, 6.53472900390625, 6.7891845703125, 7.04364013671875, 7.298095703125, 7.55255126953125, 7.8070068359375, 8.06146240234375, 8.31591796875, 8.57037353515625, 8.8248291015625, 9.07928466796875, 9.333740234375, 9.58819580078125, 9.8426513671875, 10.09710693359375, 10.3515625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 9.0, 11.0, 5.0, 9.0, 19.0, 13.0, 17.0, 32.0, 27.0, 41.0, 40.0, 51.0, 45.0, 43.0, 42.0, 42.0, 52.0, 46.0, 43.0, 37.0, 58.0, 48.0, 32.0, 31.0, 27.0, 25.0, 28.0, 22.0, 15.0, 12.0, 18.0, 11.0, 8.0, 8.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.609375, -2.532379150390625, -2.45538330078125, -2.378387451171875, -2.3013916015625, -2.224395751953125, -2.14739990234375, -2.070404052734375, -1.993408203125, -1.916412353515625, -1.83941650390625, -1.762420654296875, -1.6854248046875, -1.608428955078125, -1.53143310546875, -1.454437255859375, -1.37744140625, -1.300445556640625, -1.22344970703125, -1.146453857421875, -1.0694580078125, -0.992462158203125, -0.91546630859375, -0.838470458984375, -0.761474609375, -0.684478759765625, -0.60748291015625, -0.530487060546875, -0.4534912109375, -0.376495361328125, -0.29949951171875, -0.222503662109375, -0.1455078125, -0.068511962890625, 0.00848388671875, 0.085479736328125, 0.1624755859375, 0.239471435546875, 0.31646728515625, 0.393463134765625, 0.470458984375, 0.547454833984375, 0.62445068359375, 0.701446533203125, 0.7784423828125, 0.855438232421875, 0.93243408203125, 1.009429931640625, 1.08642578125, 1.163421630859375, 1.24041748046875, 1.317413330078125, 1.3944091796875, 1.471405029296875, 1.54840087890625, 1.625396728515625, 1.702392578125, 1.779388427734375, 1.85638427734375, 1.933380126953125, 2.0103759765625, 2.087371826171875, 2.16436767578125, 2.241363525390625, 2.318359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 2.0, 8.0, 11.0, 6.0, 24.0, 16.0, 43.0, 59.0, 68.0, 97.0, 137.0, 225.0, 308.0, 390.0, 620.0, 1021.0, 1820.0, 5869.0, 48450.0, 613377.0, 343209.0, 24620.0, 4020.0, 1460.0, 880.0, 556.0, 345.0, 232.0, 189.0, 132.0, 102.0, 76.0, 56.0, 29.0, 34.0, 12.0, 13.0, 5.0, 9.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-18.109375, -17.541015625, -16.97265625, -16.404296875, -15.8359375, -15.267578125, -14.69921875, -14.130859375, -13.5625, -12.994140625, -12.42578125, -11.857421875, -11.2890625, -10.720703125, -10.15234375, -9.583984375, -9.015625, -8.447265625, -7.87890625, -7.310546875, -6.7421875, -6.173828125, -5.60546875, -5.037109375, -4.46875, -3.900390625, -3.33203125, -2.763671875, -2.1953125, -1.626953125, -1.05859375, -0.490234375, 0.078125, 0.646484375, 1.21484375, 1.783203125, 2.3515625, 2.919921875, 3.48828125, 4.056640625, 4.625, 5.193359375, 5.76171875, 6.330078125, 6.8984375, 7.466796875, 8.03515625, 8.603515625, 9.171875, 9.740234375, 10.30859375, 10.876953125, 11.4453125, 12.013671875, 12.58203125, 13.150390625, 13.71875, 14.287109375, 14.85546875, 15.423828125, 15.9921875, 16.560546875, 17.12890625, 17.697265625, 18.265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 2.0, 4.0, 7.0, 9.0, 8.0, 7.0, 9.0, 13.0, 14.0, 25.0, 21.0, 21.0, 29.0, 28.0, 27.0, 41.0, 46.0, 45.0, 43.0, 45.0, 51.0, 46.0, 39.0, 38.0, 38.0, 38.0, 34.0, 31.0, 35.0, 28.0, 35.0, 17.0, 24.0, 26.0, 16.0, 8.0, 12.0, 11.0, 5.0, 7.0, 8.0, 2.0, 4.0, 3.0, 0.0, 0.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-11.109375, -10.7779541015625, -10.446533203125, -10.1151123046875, -9.78369140625, -9.4522705078125, -9.120849609375, -8.7894287109375, -8.4580078125, -8.1265869140625, -7.795166015625, -7.4637451171875, -7.13232421875, -6.8009033203125, -6.469482421875, -6.1380615234375, -5.806640625, -5.4752197265625, -5.143798828125, -4.8123779296875, -4.48095703125, -4.1495361328125, -3.818115234375, -3.4866943359375, -3.1552734375, -2.8238525390625, -2.492431640625, -2.1610107421875, -1.82958984375, -1.4981689453125, -1.166748046875, -0.8353271484375, -0.50390625, -0.1724853515625, 0.158935546875, 0.4903564453125, 0.82177734375, 1.1531982421875, 1.484619140625, 1.8160400390625, 2.1474609375, 2.4788818359375, 2.810302734375, 3.1417236328125, 3.47314453125, 3.8045654296875, 4.135986328125, 4.4674072265625, 4.798828125, 5.1302490234375, 5.461669921875, 5.7930908203125, 6.12451171875, 6.4559326171875, 6.787353515625, 7.1187744140625, 7.4501953125, 7.7816162109375, 8.113037109375, 8.4444580078125, 8.77587890625, 9.1072998046875, 9.438720703125, 9.7701416015625, 10.1015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 7.0, 8.0, 10.0, 17.0, 26.0, 23.0, 36.0, 40.0, 59.0, 103.0, 182.0, 377.0, 834.0, 2742.0, 12621.0, 105025.0, 691926.0, 206760.0, 21667.0, 3931.0, 1142.0, 426.0, 214.0, 126.0, 61.0, 50.0, 39.0, 23.0, 18.0, 10.0, 5.0, 11.0, 9.0, 7.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.28778076171875, -6.0325927734375, -5.77740478515625, -5.522216796875, -5.26702880859375, -5.0118408203125, -4.75665283203125, -4.50146484375, -4.24627685546875, -3.9910888671875, -3.73590087890625, -3.480712890625, -3.22552490234375, -2.9703369140625, -2.71514892578125, -2.4599609375, -2.20477294921875, -1.9495849609375, -1.69439697265625, -1.439208984375, -1.18402099609375, -0.9288330078125, -0.67364501953125, -0.41845703125, -0.16326904296875, 0.0919189453125, 0.34710693359375, 0.602294921875, 0.85748291015625, 1.1126708984375, 1.36785888671875, 1.623046875, 1.87823486328125, 2.1334228515625, 2.38861083984375, 2.643798828125, 2.89898681640625, 3.1541748046875, 3.40936279296875, 3.66455078125, 3.91973876953125, 4.1749267578125, 4.43011474609375, 4.685302734375, 4.94049072265625, 5.1956787109375, 5.45086669921875, 5.7060546875, 5.96124267578125, 6.2164306640625, 6.47161865234375, 6.726806640625, 6.98199462890625, 7.2371826171875, 7.49237060546875, 7.74755859375, 8.00274658203125, 8.2579345703125, 8.51312255859375, 8.768310546875, 9.02349853515625, 9.2786865234375, 9.53387451171875, 9.7890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 8.0, 10.0, 7.0, 15.0, 21.0, 24.0, 54.0, 59.0, 62.0, 88.0, 84.0, 92.0, 88.0, 86.0, 69.0, 61.0, 46.0, 31.0, 23.0, 18.0, 11.0, 11.0, 5.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007295608520507812, -0.0007030069828033447, -0.0006764531135559082, -0.0006498992443084717, -0.0006233453750610352, -0.0005967915058135986, -0.0005702376365661621, -0.0005436837673187256, -0.0005171298980712891, -0.0004905760288238525, -0.000464022159576416, -0.0004374682903289795, -0.00041091442108154297, -0.00038436055183410645, -0.0003578066825866699, -0.0003312528133392334, -0.0003046989440917969, -0.00027814507484436035, -0.00025159120559692383, -0.0002250373363494873, -0.00019848346710205078, -0.00017192959785461426, -0.00014537572860717773, -0.00011882185935974121, -9.226799011230469e-05, -6.571412086486816e-05, -3.916025161743164e-05, -1.2606382369995117e-05, 1.3947486877441406e-05, 4.050135612487793e-05, 6.705522537231445e-05, 9.360909461975098e-05, 0.0001201629638671875, 0.00014671683311462402, 0.00017327070236206055, 0.00019982457160949707, 0.0002263784408569336, 0.0002529323101043701, 0.00027948617935180664, 0.00030604004859924316, 0.0003325939178466797, 0.0003591477870941162, 0.00038570165634155273, 0.00041225552558898926, 0.0004388093948364258, 0.0004653632640838623, 0.0004919171333312988, 0.0005184710025787354, 0.0005450248718261719, 0.0005715787410736084, 0.0005981326103210449, 0.0006246864795684814, 0.000651240348815918, 0.0006777942180633545, 0.000704348087310791, 0.0007309019565582275, 0.0007574558258056641, 0.0007840096950531006, 0.0008105635643005371, 0.0008371174335479736, 0.0008636713027954102, 0.0008902251720428467, 0.0009167790412902832, 0.0009433329105377197, 0.0009698867797851562]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 4.0, 3.0, 11.0, 7.0, 16.0, 14.0, 22.0, 47.0, 64.0, 92.0, 151.0, 298.0, 584.0, 1307.0, 3646.0, 16533.0, 216654.0, 729916.0, 66842.0, 8067.0, 2255.0, 962.0, 446.0, 219.0, 120.0, 64.0, 57.0, 36.0, 28.0, 19.0, 18.0, 14.0, 9.0, 5.0, 5.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.6953125, -10.400634765625, -10.10595703125, -9.811279296875, -9.5166015625, -9.221923828125, -8.92724609375, -8.632568359375, -8.337890625, -8.043212890625, -7.74853515625, -7.453857421875, -7.1591796875, -6.864501953125, -6.56982421875, -6.275146484375, -5.98046875, -5.685791015625, -5.39111328125, -5.096435546875, -4.8017578125, -4.507080078125, -4.21240234375, -3.917724609375, -3.623046875, -3.328369140625, -3.03369140625, -2.739013671875, -2.4443359375, -2.149658203125, -1.85498046875, -1.560302734375, -1.265625, -0.970947265625, -0.67626953125, -0.381591796875, -0.0869140625, 0.207763671875, 0.50244140625, 0.797119140625, 1.091796875, 1.386474609375, 1.68115234375, 1.975830078125, 2.2705078125, 2.565185546875, 2.85986328125, 3.154541015625, 3.44921875, 3.743896484375, 4.03857421875, 4.333251953125, 4.6279296875, 4.922607421875, 5.21728515625, 5.511962890625, 5.806640625, 6.101318359375, 6.39599609375, 6.690673828125, 6.9853515625, 7.280029296875, 7.57470703125, 7.869384765625, 8.1640625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 3.0, 14.0, 14.0, 27.0, 44.0, 76.0, 80.0, 119.0, 114.0, 111.0, 119.0, 107.0, 50.0, 40.0, 26.0, 21.0, 14.0, 7.0, 3.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.70703125, -7.45819091796875, -7.2093505859375, -6.96051025390625, -6.711669921875, -6.46282958984375, -6.2139892578125, -5.96514892578125, -5.71630859375, -5.46746826171875, -5.2186279296875, -4.96978759765625, -4.720947265625, -4.47210693359375, -4.2232666015625, -3.97442626953125, -3.7255859375, -3.47674560546875, -3.2279052734375, -2.97906494140625, -2.730224609375, -2.48138427734375, -2.2325439453125, -1.98370361328125, -1.73486328125, -1.48602294921875, -1.2371826171875, -0.98834228515625, -0.739501953125, -0.49066162109375, -0.2418212890625, 0.00701904296875, 0.255859375, 0.50469970703125, 0.7535400390625, 1.00238037109375, 1.251220703125, 1.50006103515625, 1.7489013671875, 1.99774169921875, 2.24658203125, 2.49542236328125, 2.7442626953125, 2.99310302734375, 3.241943359375, 3.49078369140625, 3.7396240234375, 3.98846435546875, 4.2373046875, 4.48614501953125, 4.7349853515625, 4.98382568359375, 5.232666015625, 5.48150634765625, 5.7303466796875, 5.97918701171875, 6.22802734375, 6.47686767578125, 6.7257080078125, 6.97454833984375, 7.223388671875, 7.47222900390625, 7.7210693359375, 7.96990966796875, 8.21875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 20.0, 35.0, 55.0, 114.0, 200.0, 185.0, 189.0, 108.0, 56.0, 24.0, 8.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.13990783691406, -140.05184936523438, -135.9637908935547, -131.875732421875, -127.78766632080078, -123.6996078491211, -119.61154174804688, -115.52348327636719, -111.4354248046875, -107.34736633300781, -103.25930786132812, -99.1712417602539, -95.08318328857422, -90.99512481689453, -86.90705871582031, -82.81900024414062, -78.73094177246094, -74.64288330078125, -70.55482482910156, -66.46675872802734, -62.378700256347656, -58.29064178466797, -54.202579498291016, -50.11451721191406, -46.026458740234375, -41.93840026855469, -37.850337982177734, -33.76227569580078, -29.674217224121094, -25.586156845092773, -21.498096466064453, -17.410036087036133, -13.321968078613281, -9.233907699584961, -5.145847320556641, -1.0577869415283203, 3.0302734375, 7.11833381652832, 11.20639419555664, 15.294454574584961, 19.38251495361328, 23.4705753326416, 27.558635711669922, 31.646696090698242, 35.73475646972656, 39.82281494140625, 43.9108772277832, 47.998939514160156, 52.086997985839844, 56.17505645751953, 60.263118743896484, 64.35118103027344, 68.43923950195312, 72.52729797363281, 76.6153564453125, 80.70342254638672, 84.7914810180664, 88.8795394897461, 92.96760559082031, 97.0556640625, 101.14372253417969, 105.23178100585938, 109.31983947753906, 113.40790557861328, 117.49596405029297]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 6.0, 2.0, 7.0, 8.0, 7.0, 11.0, 12.0, 17.0, 14.0, 28.0, 37.0, 30.0, 30.0, 42.0, 40.0, 41.0, 47.0, 38.0, 56.0, 41.0, 47.0, 46.0, 48.0, 40.0, 39.0, 37.0, 32.0, 40.0, 29.0, 18.0, 17.0, 15.0, 16.0, 13.0, 12.0, 10.0, 10.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-55.38923645019531, -53.77009201049805, -52.15094757080078, -50.53179931640625, -48.912654876708984, -47.29351043701172, -45.67436599731445, -44.05522155761719, -42.436073303222656, -40.81692886352539, -39.197784423828125, -37.578636169433594, -35.95949172973633, -34.34034729003906, -32.7212028503418, -31.10205841064453, -29.482913970947266, -27.86376953125, -26.2446231842041, -24.625478744506836, -23.006332397460938, -21.387187957763672, -19.768043518066406, -18.14889907836914, -16.529752731323242, -14.91060733795166, -13.291461944580078, -11.672317504882812, -10.05317211151123, -8.434026718139648, -6.814882278442383, -5.195736885070801, -3.5765953063964844, -1.9574501514434814, -0.3383049964904785, 1.2808399200439453, 2.8999853134155273, 4.519130706787109, 6.138275146484375, 7.757420539855957, 9.376565933227539, 10.995711326599121, 12.614856719970703, 14.234001159667969, 15.85314655303955, 17.472291946411133, 19.0914363861084, 20.710582733154297, 22.329727172851562, 23.948871612548828, 25.568017959594727, 27.187162399291992, 28.80630874633789, 30.425453186035156, 32.04459762573242, 33.66374206542969, 35.28289031982422, 36.902034759521484, 38.52117919921875, 40.14032745361328, 41.75947189331055, 43.37861633300781, 44.99776077270508, 46.616905212402344, 48.23604965209961]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 3.0, 7.0, 6.0, 12.0, 13.0, 27.0, 47.0, 49.0, 93.0, 136.0, 239.0, 434.0, 856.0, 1779.0, 4173.0, 12804.0, 89582.0, 3971405.0, 91547.0, 13056.0, 4198.0, 1816.0, 849.0, 478.0, 258.0, 150.0, 76.0, 53.0, 33.0, 26.0, 18.0, 13.0, 10.0, 6.0, 4.0, 4.0, 6.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3125, -12.79052734375, -12.2685546875, -11.74658203125, -11.224609375, -10.70263671875, -10.1806640625, -9.65869140625, -9.13671875, -8.61474609375, -8.0927734375, -7.57080078125, -7.048828125, -6.52685546875, -6.0048828125, -5.48291015625, -4.9609375, -4.43896484375, -3.9169921875, -3.39501953125, -2.873046875, -2.35107421875, -1.8291015625, -1.30712890625, -0.78515625, -0.26318359375, 0.2587890625, 0.78076171875, 1.302734375, 1.82470703125, 2.3466796875, 2.86865234375, 3.390625, 3.91259765625, 4.4345703125, 4.95654296875, 5.478515625, 6.00048828125, 6.5224609375, 7.04443359375, 7.56640625, 8.08837890625, 8.6103515625, 9.13232421875, 9.654296875, 10.17626953125, 10.6982421875, 11.22021484375, 11.7421875, 12.26416015625, 12.7861328125, 13.30810546875, 13.830078125, 14.35205078125, 14.8740234375, 15.39599609375, 15.91796875, 16.43994140625, 16.9619140625, 17.48388671875, 18.005859375, 18.52783203125, 19.0498046875, 19.57177734375, 20.09375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 10.0, 11.0, 11.0, 20.0, 22.0, 22.0, 22.0, 33.0, 31.0, 29.0, 32.0, 46.0, 46.0, 53.0, 54.0, 44.0, 59.0, 45.0, 39.0, 40.0, 45.0, 36.0, 35.0, 29.0, 33.0, 15.0, 22.0, 21.0, 12.0, 16.0, 8.0, 9.0, 9.0, 10.0, 4.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.6328125, -2.5555419921875, -2.478271484375, -2.4010009765625, -2.32373046875, -2.2464599609375, -2.169189453125, -2.0919189453125, -2.0146484375, -1.9373779296875, -1.860107421875, -1.7828369140625, -1.70556640625, -1.6282958984375, -1.551025390625, -1.4737548828125, -1.396484375, -1.3192138671875, -1.241943359375, -1.1646728515625, -1.08740234375, -1.0101318359375, -0.932861328125, -0.8555908203125, -0.7783203125, -0.7010498046875, -0.623779296875, -0.5465087890625, -0.46923828125, -0.3919677734375, -0.314697265625, -0.2374267578125, -0.16015625, -0.0828857421875, -0.005615234375, 0.0716552734375, 0.14892578125, 0.2261962890625, 0.303466796875, 0.3807373046875, 0.4580078125, 0.5352783203125, 0.612548828125, 0.6898193359375, 0.76708984375, 0.8443603515625, 0.921630859375, 0.9989013671875, 1.076171875, 1.1534423828125, 1.230712890625, 1.3079833984375, 1.38525390625, 1.4625244140625, 1.539794921875, 1.6170654296875, 1.6943359375, 1.7716064453125, 1.848876953125, 1.9261474609375, 2.00341796875, 2.0806884765625, 2.157958984375, 2.2352294921875, 2.3125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 7.0, 12.0, 12.0, 19.0, 17.0, 27.0, 27.0, 47.0, 48.0, 74.0, 112.0, 186.0, 242.0, 369.0, 543.0, 928.0, 1606.0, 3251.0, 7040.0, 21010.0, 102946.0, 3776841.0, 227750.0, 32016.0, 10010.0, 3969.0, 2069.0, 1093.0, 672.0, 388.0, 272.0, 157.0, 141.0, 113.0, 69.0, 50.0, 31.0, 33.0, 23.0, 13.0, 12.0, 3.0, 13.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.96875, -11.6131591796875, -11.257568359375, -10.9019775390625, -10.54638671875, -10.1907958984375, -9.835205078125, -9.4796142578125, -9.1240234375, -8.7684326171875, -8.412841796875, -8.0572509765625, -7.70166015625, -7.3460693359375, -6.990478515625, -6.6348876953125, -6.279296875, -5.9237060546875, -5.568115234375, -5.2125244140625, -4.85693359375, -4.5013427734375, -4.145751953125, -3.7901611328125, -3.4345703125, -3.0789794921875, -2.723388671875, -2.3677978515625, -2.01220703125, -1.6566162109375, -1.301025390625, -0.9454345703125, -0.58984375, -0.2342529296875, 0.121337890625, 0.4769287109375, 0.83251953125, 1.1881103515625, 1.543701171875, 1.8992919921875, 2.2548828125, 2.6104736328125, 2.966064453125, 3.3216552734375, 3.67724609375, 4.0328369140625, 4.388427734375, 4.7440185546875, 5.099609375, 5.4552001953125, 5.810791015625, 6.1663818359375, 6.52197265625, 6.8775634765625, 7.233154296875, 7.5887451171875, 7.9443359375, 8.2999267578125, 8.655517578125, 9.0111083984375, 9.36669921875, 9.7222900390625, 10.077880859375, 10.4334716796875, 10.7890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 5.0, 6.0, 2.0, 7.0, 8.0, 19.0, 26.0, 48.0, 84.0, 160.0, 759.0, 2516.0, 221.0, 95.0, 40.0, 24.0, 24.0, 8.0, 8.0, 7.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.908203125, -2.808197021484375, -2.70819091796875, -2.608184814453125, -2.5081787109375, -2.408172607421875, -2.30816650390625, -2.208160400390625, -2.108154296875, -2.008148193359375, -1.90814208984375, -1.808135986328125, -1.7081298828125, -1.608123779296875, -1.50811767578125, -1.408111572265625, -1.30810546875, -1.208099365234375, -1.10809326171875, -1.008087158203125, -0.9080810546875, -0.808074951171875, -0.70806884765625, -0.608062744140625, -0.508056640625, -0.408050537109375, -0.30804443359375, -0.208038330078125, -0.1080322265625, -0.008026123046875, 0.09197998046875, 0.191986083984375, 0.2919921875, 0.391998291015625, 0.49200439453125, 0.592010498046875, 0.6920166015625, 0.792022705078125, 0.89202880859375, 0.992034912109375, 1.092041015625, 1.192047119140625, 1.29205322265625, 1.392059326171875, 1.4920654296875, 1.592071533203125, 1.69207763671875, 1.792083740234375, 1.89208984375, 1.992095947265625, 2.09210205078125, 2.192108154296875, 2.2921142578125, 2.392120361328125, 2.49212646484375, 2.592132568359375, 2.692138671875, 2.792144775390625, 2.89215087890625, 2.992156982421875, 3.0921630859375, 3.192169189453125, 3.29217529296875, 3.392181396484375, 3.4921875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 7.0, 14.0, 12.0, 22.0, 18.0, 23.0, 29.0, 34.0, 52.0, 60.0, 69.0, 64.0, 69.0, 75.0, 69.0, 55.0, 62.0, 49.0, 41.0, 40.0, 36.0, 31.0, 19.0, 8.0, 10.0, 7.0, 4.0, 0.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.038154125213623, -6.782145023345947, -6.526135444641113, -6.2701263427734375, -6.0141167640686035, -5.758107662200928, -5.502098083496094, -5.246088981628418, -4.990079879760742, -4.734070777893066, -4.478061199188232, -4.222052097320557, -3.9660425186157227, -3.710033416748047, -3.454024076461792, -3.198014736175537, -2.942005157470703, -2.6859958171844482, -2.4299864768981934, -2.1739773750305176, -1.9179679155349731, -1.6619585752487183, -1.405949354171753, -1.149940013885498, -0.8939306735992432, -0.6379213333129883, -0.3819120526313782, -0.12590277194976807, 0.13010656833648682, 0.3861159086227417, 0.642125129699707, 0.8981344699859619, 1.1541433334350586, 1.4101526737213135, 1.6661620140075684, 1.9221712350845337, 2.178180694580078, 2.434189796447754, 2.690199136734009, 2.9462084770202637, 3.2022178173065186, 3.4582271575927734, 3.7142364978790283, 3.970245838165283, 4.226254940032959, 4.482264518737793, 4.738273620605469, 4.9942827224731445, 5.2502923011779785, 5.506301403045654, 5.762310981750488, 6.018320083618164, 6.274329662322998, 6.530338764190674, 6.786348342895508, 7.042357444763184, 7.298366546630859, 7.554375648498535, 7.810385227203369, 8.066394805908203, 8.322403907775879, 8.578413009643555, 8.83442211151123, 9.090431213378906, 9.346441268920898]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 5.0, 5.0, 20.0, 12.0, 12.0, 19.0, 11.0, 26.0, 22.0, 20.0, 29.0, 31.0, 35.0, 37.0, 37.0, 39.0, 35.0, 40.0, 53.0, 45.0, 58.0, 46.0, 30.0, 25.0, 35.0, 33.0, 32.0, 24.0, 20.0, 20.0, 29.0, 24.0, 14.0, 9.0, 11.0, 9.0, 7.0, 9.0, 6.0, 4.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-6.410158157348633, -6.222423553466797, -6.034688949584961, -5.846954345703125, -5.659219741821289, -5.471485137939453, -5.283750534057617, -5.096015930175781, -4.908281326293945, -4.720546722412109, -4.532812118530273, -4.3450775146484375, -4.157342910766602, -3.9696083068847656, -3.781873941421509, -3.594139337539673, -3.406404972076416, -3.21867036819458, -3.030935764312744, -2.843201160430908, -2.6554665565490723, -2.4677319526672363, -2.2799975872039795, -2.0922629833221436, -1.9045283794403076, -1.7167937755584717, -1.5290591716766357, -1.3413246870040894, -1.1535900831222534, -0.9658554792404175, -0.7781209945678711, -0.5903863906860352, -0.4026517868041992, -0.21491721272468567, -0.02718263864517212, 0.16055190563201904, 0.348286509513855, 0.5360211133956909, 0.7237555980682373, 0.9114902019500732, 1.0992248058319092, 1.2869594097137451, 1.474694013595581, 1.6624284982681274, 1.8501631021499634, 2.0378975868225098, 2.2256321907043457, 2.4133667945861816, 2.6011013984680176, 2.7888360023498535, 2.9765706062316895, 3.1643052101135254, 3.3520398139953613, 3.5397744178771973, 3.727508783340454, 3.91524338722229, 4.102977752685547, 4.290712356567383, 4.478446960449219, 4.666181564331055, 4.853916168212891, 5.041650772094727, 5.2293853759765625, 5.417119979858398, 5.604854583740234]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 6.0, 10.0, 10.0, 14.0, 20.0, 32.0, 48.0, 54.0, 96.0, 148.0, 257.0, 413.0, 696.0, 1193.0, 2198.0, 4321.0, 9469.0, 22358.0, 58429.0, 147224.0, 283885.0, 278959.0, 142129.0, 56388.0, 21825.0, 9199.0, 4166.0, 2170.0, 1134.0, 656.0, 393.0, 235.0, 150.0, 91.0, 53.0, 33.0, 27.0, 15.0, 20.0, 7.0, 11.0, 6.0, 3.0, 1.0, 0.0, 2.0, 4.0], "bins": [-7.05859375, -6.87274169921875, -6.6868896484375, -6.50103759765625, -6.315185546875, -6.12933349609375, -5.9434814453125, -5.75762939453125, -5.57177734375, -5.38592529296875, -5.2000732421875, -5.01422119140625, -4.828369140625, -4.64251708984375, -4.4566650390625, -4.27081298828125, -4.0849609375, -3.89910888671875, -3.7132568359375, -3.52740478515625, -3.341552734375, -3.15570068359375, -2.9698486328125, -2.78399658203125, -2.59814453125, -2.41229248046875, -2.2264404296875, -2.04058837890625, -1.854736328125, -1.66888427734375, -1.4830322265625, -1.29718017578125, -1.111328125, -0.92547607421875, -0.7396240234375, -0.55377197265625, -0.367919921875, -0.18206787109375, 0.0037841796875, 0.18963623046875, 0.37548828125, 0.56134033203125, 0.7471923828125, 0.93304443359375, 1.118896484375, 1.30474853515625, 1.4906005859375, 1.67645263671875, 1.8623046875, 2.04815673828125, 2.2340087890625, 2.41986083984375, 2.605712890625, 2.79156494140625, 2.9774169921875, 3.16326904296875, 3.34912109375, 3.53497314453125, 3.7208251953125, 3.90667724609375, 4.092529296875, 4.27838134765625, 4.4642333984375, 4.65008544921875, 4.8359375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 12.0, 8.0, 5.0, 8.0, 14.0, 11.0, 26.0, 17.0, 29.0, 27.0, 35.0, 35.0, 37.0, 35.0, 47.0, 40.0, 51.0, 56.0, 38.0, 48.0, 49.0, 41.0, 36.0, 39.0, 36.0, 25.0, 25.0, 23.0, 26.0, 18.0, 21.0, 15.0, 9.0, 15.0, 9.0, 12.0, 3.0, 3.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.482421875, -2.4034423828125, -2.324462890625, -2.2454833984375, -2.16650390625, -2.0875244140625, -2.008544921875, -1.9295654296875, -1.8505859375, -1.7716064453125, -1.692626953125, -1.6136474609375, -1.53466796875, -1.4556884765625, -1.376708984375, -1.2977294921875, -1.21875, -1.1397705078125, -1.060791015625, -0.9818115234375, -0.90283203125, -0.8238525390625, -0.744873046875, -0.6658935546875, -0.5869140625, -0.5079345703125, -0.428955078125, -0.3499755859375, -0.27099609375, -0.1920166015625, -0.113037109375, -0.0340576171875, 0.044921875, 0.1239013671875, 0.202880859375, 0.2818603515625, 0.36083984375, 0.4398193359375, 0.518798828125, 0.5977783203125, 0.6767578125, 0.7557373046875, 0.834716796875, 0.9136962890625, 0.99267578125, 1.0716552734375, 1.150634765625, 1.2296142578125, 1.30859375, 1.3875732421875, 1.466552734375, 1.5455322265625, 1.62451171875, 1.7034912109375, 1.782470703125, 1.8614501953125, 1.9404296875, 2.0194091796875, 2.098388671875, 2.1773681640625, 2.25634765625, 2.3353271484375, 2.414306640625, 2.4932861328125, 2.572265625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 5.0, 10.0, 16.0, 21.0, 24.0, 24.0, 43.0, 49.0, 88.0, 94.0, 158.0, 232.0, 270.0, 440.0, 602.0, 863.0, 1381.0, 3098.0, 12630.0, 134399.0, 760477.0, 115099.0, 11352.0, 2986.0, 1385.0, 865.0, 574.0, 385.0, 263.0, 219.0, 107.0, 94.0, 84.0, 65.0, 35.0, 27.0, 17.0, 18.0, 12.0, 6.0, 10.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.703125, -12.2569580078125, -11.810791015625, -11.3646240234375, -10.91845703125, -10.4722900390625, -10.026123046875, -9.5799560546875, -9.1337890625, -8.6876220703125, -8.241455078125, -7.7952880859375, -7.34912109375, -6.9029541015625, -6.456787109375, -6.0106201171875, -5.564453125, -5.1182861328125, -4.672119140625, -4.2259521484375, -3.77978515625, -3.3336181640625, -2.887451171875, -2.4412841796875, -1.9951171875, -1.5489501953125, -1.102783203125, -0.6566162109375, -0.21044921875, 0.2357177734375, 0.681884765625, 1.1280517578125, 1.57421875, 2.0203857421875, 2.466552734375, 2.9127197265625, 3.35888671875, 3.8050537109375, 4.251220703125, 4.6973876953125, 5.1435546875, 5.5897216796875, 6.035888671875, 6.4820556640625, 6.92822265625, 7.3743896484375, 7.820556640625, 8.2667236328125, 8.712890625, 9.1590576171875, 9.605224609375, 10.0513916015625, 10.49755859375, 10.9437255859375, 11.389892578125, 11.8360595703125, 12.2822265625, 12.7283935546875, 13.174560546875, 13.6207275390625, 14.06689453125, 14.5130615234375, 14.959228515625, 15.4053955078125, 15.8515625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 5.0, 15.0, 14.0, 7.0, 13.0, 16.0, 23.0, 23.0, 39.0, 30.0, 29.0, 27.0, 31.0, 43.0, 45.0, 56.0, 45.0, 50.0, 52.0, 42.0, 45.0, 35.0, 34.0, 38.0, 33.0, 29.0, 31.0, 19.0, 19.0, 17.0, 16.0, 15.0, 18.0, 9.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-12.875, -12.5174560546875, -12.159912109375, -11.8023681640625, -11.44482421875, -11.0872802734375, -10.729736328125, -10.3721923828125, -10.0146484375, -9.6571044921875, -9.299560546875, -8.9420166015625, -8.58447265625, -8.2269287109375, -7.869384765625, -7.5118408203125, -7.154296875, -6.7967529296875, -6.439208984375, -6.0816650390625, -5.72412109375, -5.3665771484375, -5.009033203125, -4.6514892578125, -4.2939453125, -3.9364013671875, -3.578857421875, -3.2213134765625, -2.86376953125, -2.5062255859375, -2.148681640625, -1.7911376953125, -1.43359375, -1.0760498046875, -0.718505859375, -0.3609619140625, -0.00341796875, 0.3541259765625, 0.711669921875, 1.0692138671875, 1.4267578125, 1.7843017578125, 2.141845703125, 2.4993896484375, 2.85693359375, 3.2144775390625, 3.572021484375, 3.9295654296875, 4.287109375, 4.6446533203125, 5.002197265625, 5.3597412109375, 5.71728515625, 6.0748291015625, 6.432373046875, 6.7899169921875, 7.1474609375, 7.5050048828125, 7.862548828125, 8.2200927734375, 8.57763671875, 8.9351806640625, 9.292724609375, 9.6502685546875, 10.0078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 7.0, 6.0, 15.0, 23.0, 35.0, 53.0, 86.0, 174.0, 351.0, 905.0, 3515.0, 54568.0, 955350.0, 29509.0, 2580.0, 720.0, 285.0, 169.0, 82.0, 41.0, 19.0, 20.0, 11.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3828125, -13.8582763671875, -13.333740234375, -12.8092041015625, -12.28466796875, -11.7601318359375, -11.235595703125, -10.7110595703125, -10.1865234375, -9.6619873046875, -9.137451171875, -8.6129150390625, -8.08837890625, -7.5638427734375, -7.039306640625, -6.5147705078125, -5.990234375, -5.4656982421875, -4.941162109375, -4.4166259765625, -3.89208984375, -3.3675537109375, -2.843017578125, -2.3184814453125, -1.7939453125, -1.2694091796875, -0.744873046875, -0.2203369140625, 0.30419921875, 0.8287353515625, 1.353271484375, 1.8778076171875, 2.40234375, 2.9268798828125, 3.451416015625, 3.9759521484375, 4.50048828125, 5.0250244140625, 5.549560546875, 6.0740966796875, 6.5986328125, 7.1231689453125, 7.647705078125, 8.1722412109375, 8.69677734375, 9.2213134765625, 9.745849609375, 10.2703857421875, 10.794921875, 11.3194580078125, 11.843994140625, 12.3685302734375, 12.89306640625, 13.4176025390625, 13.942138671875, 14.4666748046875, 14.9912109375, 15.5157470703125, 16.040283203125, 16.5648193359375, 17.08935546875, 17.6138916015625, 18.138427734375, 18.6629638671875, 19.1875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 9.0, 13.0, 12.0, 25.0, 31.0, 52.0, 84.0, 105.0, 171.0, 154.0, 109.0, 77.0, 49.0, 47.0, 25.0, 14.0, 10.0, 3.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010347366333007812, -0.0009977370500564575, -0.0009607374668121338, -0.0009237378835678101, -0.0008867383003234863, -0.0008497387170791626, -0.0008127391338348389, -0.0007757395505905151, -0.0007387399673461914, -0.0007017403841018677, -0.0006647408008575439, -0.0006277412176132202, -0.0005907416343688965, -0.0005537420511245728, -0.000516742467880249, -0.0004797428846359253, -0.00044274330139160156, -0.00040574371814727783, -0.0003687441349029541, -0.00033174455165863037, -0.00029474496841430664, -0.0002577453851699829, -0.00022074580192565918, -0.00018374621868133545, -0.00014674663543701172, -0.00010974705219268799, -7.274746894836426e-05, -3.574788570404053e-05, 1.2516975402832031e-06, 3.8251280784606934e-05, 7.525086402893066e-05, 0.0001122504472732544, 0.00014925003051757812, 0.00018624961376190186, 0.00022324919700622559, 0.0002602487802505493, 0.00029724836349487305, 0.0003342479467391968, 0.0003712475299835205, 0.00040824711322784424, 0.00044524669647216797, 0.0004822462797164917, 0.0005192458629608154, 0.0005562454462051392, 0.0005932450294494629, 0.0006302446126937866, 0.0006672441959381104, 0.0007042437791824341, 0.0007412433624267578, 0.0007782429456710815, 0.0008152425289154053, 0.000852242112159729, 0.0008892416954040527, 0.0009262412786483765, 0.0009632408618927002, 0.001000240445137024, 0.0010372400283813477, 0.0010742396116256714, 0.0011112391948699951, 0.0011482387781143188, 0.0011852383613586426, 0.0012222379446029663, 0.00125923752784729, 0.0012962371110916138, 0.0013332366943359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 9.0, 23.0, 18.0, 27.0, 33.0, 71.0, 140.0, 273.0, 785.0, 2718.0, 31832.0, 976543.0, 31933.0, 2826.0, 745.0, 291.0, 118.0, 77.0, 39.0, 19.0, 11.0, 3.0, 9.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.421875, -25.71728515625, -25.0126953125, -24.30810546875, -23.603515625, -22.89892578125, -22.1943359375, -21.48974609375, -20.78515625, -20.08056640625, -19.3759765625, -18.67138671875, -17.966796875, -17.26220703125, -16.5576171875, -15.85302734375, -15.1484375, -14.44384765625, -13.7392578125, -13.03466796875, -12.330078125, -11.62548828125, -10.9208984375, -10.21630859375, -9.51171875, -8.80712890625, -8.1025390625, -7.39794921875, -6.693359375, -5.98876953125, -5.2841796875, -4.57958984375, -3.875, -3.17041015625, -2.4658203125, -1.76123046875, -1.056640625, -0.35205078125, 0.3525390625, 1.05712890625, 1.76171875, 2.46630859375, 3.1708984375, 3.87548828125, 4.580078125, 5.28466796875, 5.9892578125, 6.69384765625, 7.3984375, 8.10302734375, 8.8076171875, 9.51220703125, 10.216796875, 10.92138671875, 11.6259765625, 12.33056640625, 13.03515625, 13.73974609375, 14.4443359375, 15.14892578125, 15.853515625, 16.55810546875, 17.2626953125, 17.96728515625, 18.671875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 9.0, 26.0, 24.0, 33.0, 48.0, 82.0, 104.0, 160.0, 150.0, 112.0, 89.0, 57.0, 31.0, 20.0, 24.0, 10.0, 5.0, 7.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0859375, -10.740234375, -10.39453125, -10.048828125, -9.703125, -9.357421875, -9.01171875, -8.666015625, -8.3203125, -7.974609375, -7.62890625, -7.283203125, -6.9375, -6.591796875, -6.24609375, -5.900390625, -5.5546875, -5.208984375, -4.86328125, -4.517578125, -4.171875, -3.826171875, -3.48046875, -3.134765625, -2.7890625, -2.443359375, -2.09765625, -1.751953125, -1.40625, -1.060546875, -0.71484375, -0.369140625, -0.0234375, 0.322265625, 0.66796875, 1.013671875, 1.359375, 1.705078125, 2.05078125, 2.396484375, 2.7421875, 3.087890625, 3.43359375, 3.779296875, 4.125, 4.470703125, 4.81640625, 5.162109375, 5.5078125, 5.853515625, 6.19921875, 6.544921875, 6.890625, 7.236328125, 7.58203125, 7.927734375, 8.2734375, 8.619140625, 8.96484375, 9.310546875, 9.65625, 10.001953125, 10.34765625, 10.693359375, 11.0390625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 11.0, 20.0, 56.0, 156.0, 271.0, 284.0, 130.0, 50.0, 15.0, 9.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.652587890625, -127.0541763305664, -121.45575714111328, -115.85734558105469, -110.25892639160156, -104.66051483154297, -99.06210327148438, -93.46368408203125, -87.86526489257812, -82.26685333251953, -76.6684341430664, -71.07002258300781, -65.47160339355469, -59.873191833496094, -54.274776458740234, -48.676361083984375, -43.07794952392578, -37.47953414916992, -31.881118774414062, -26.282705307006836, -20.684289932250977, -15.085874557495117, -9.48746109008789, -3.8890457153320312, 1.7093696594238281, 7.307784557342529, 12.90619945526123, 18.504613876342773, 24.103029251098633, 29.701444625854492, 35.29985809326172, 40.89827346801758, 46.49668884277344, 52.0951042175293, 57.693519592285156, 63.29193115234375, 68.89035034179688, 74.48876190185547, 80.08717346191406, 85.68559265136719, 91.28401184082031, 96.8824234008789, 102.48084259033203, 108.07925415039062, 113.67767333984375, 119.27608489990234, 124.87449645996094, 130.47291564941406, 136.07131958007812, 141.66973876953125, 147.2681427001953, 152.86656188964844, 158.46498107910156, 164.0634002685547, 169.66180419921875, 175.26022338867188, 180.858642578125, 186.45706176757812, 192.0554656982422, 197.6538848876953, 203.25230407714844, 208.85072326660156, 214.44912719726562, 220.04754638671875, 225.64596557617188]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 11.0, 8.0, 7.0, 5.0, 17.0, 18.0, 15.0, 28.0, 36.0, 27.0, 33.0, 41.0, 42.0, 47.0, 53.0, 45.0, 41.0, 50.0, 41.0, 34.0, 45.0, 43.0, 40.0, 43.0, 24.0, 36.0, 32.0, 26.0, 24.0, 10.0, 20.0, 14.0, 11.0, 11.0, 3.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.297813415527344, -55.48482131958008, -53.67182922363281, -51.85883712768555, -50.04584503173828, -48.232852935791016, -46.41986083984375, -44.606868743896484, -42.79387664794922, -40.98088455200195, -39.16789245605469, -37.35490036010742, -35.541908264160156, -33.72891616821289, -31.915924072265625, -30.10293197631836, -28.28993797302246, -26.476945877075195, -24.66395378112793, -22.850961685180664, -21.0379695892334, -19.2249755859375, -17.411983489990234, -15.598992347717285, -13.78600025177002, -11.973008155822754, -10.160016059875488, -8.347023010253906, -6.534031391143799, -4.721038818359375, -2.9080467224121094, -1.0950546264648438, 0.7179374694824219, 2.5309295654296875, 4.343921661376953, 6.156914234161377, 7.969906330108643, 9.782898902893066, 11.595890998840332, 13.408883094787598, 15.221875190734863, 17.034868240356445, 18.84786033630371, 20.660852432250977, 22.473844528198242, 24.286836624145508, 26.099828720092773, 27.91282081604004, 29.725812911987305, 31.53880500793457, 33.35179901123047, 35.164791107177734, 36.977783203125, 38.790775299072266, 40.60376739501953, 42.4167594909668, 44.22975158691406, 46.04274368286133, 47.855735778808594, 49.66872787475586, 51.481719970703125, 53.29471206665039, 55.107704162597656, 56.92069625854492, 58.73368835449219]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 2.0, 3.0, 4.0, 9.0, 9.0, 14.0, 23.0, 49.0, 60.0, 105.0, 166.0, 249.0, 396.0, 716.0, 1306.0, 2677.0, 8370.0, 47398.0, 4059162.0, 58008.0, 9372.0, 2933.0, 1309.0, 788.0, 443.0, 275.0, 175.0, 86.0, 64.0, 33.0, 22.0, 21.0, 10.0, 9.0, 8.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.71875, -18.16064453125, -17.6025390625, -17.04443359375, -16.486328125, -15.92822265625, -15.3701171875, -14.81201171875, -14.25390625, -13.69580078125, -13.1376953125, -12.57958984375, -12.021484375, -11.46337890625, -10.9052734375, -10.34716796875, -9.7890625, -9.23095703125, -8.6728515625, -8.11474609375, -7.556640625, -6.99853515625, -6.4404296875, -5.88232421875, -5.32421875, -4.76611328125, -4.2080078125, -3.64990234375, -3.091796875, -2.53369140625, -1.9755859375, -1.41748046875, -0.859375, -0.30126953125, 0.2568359375, 0.81494140625, 1.373046875, 1.93115234375, 2.4892578125, 3.04736328125, 3.60546875, 4.16357421875, 4.7216796875, 5.27978515625, 5.837890625, 6.39599609375, 6.9541015625, 7.51220703125, 8.0703125, 8.62841796875, 9.1865234375, 9.74462890625, 10.302734375, 10.86083984375, 11.4189453125, 11.97705078125, 12.53515625, 13.09326171875, 13.6513671875, 14.20947265625, 14.767578125, 15.32568359375, 15.8837890625, 16.44189453125, 17.0]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 4.0, 9.0, 13.0, 8.0, 22.0, 30.0, 31.0, 36.0, 46.0, 34.0, 53.0, 49.0, 54.0, 63.0, 58.0, 51.0, 56.0, 51.0, 49.0, 43.0, 33.0, 40.0, 30.0, 22.0, 18.0, 21.0, 8.0, 15.0, 9.0, 10.0, 5.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.892578125, -2.79168701171875, -2.6907958984375, -2.58990478515625, -2.489013671875, -2.38812255859375, -2.2872314453125, -2.18634033203125, -2.08544921875, -1.98455810546875, -1.8836669921875, -1.78277587890625, -1.681884765625, -1.58099365234375, -1.4801025390625, -1.37921142578125, -1.2783203125, -1.17742919921875, -1.0765380859375, -0.97564697265625, -0.874755859375, -0.77386474609375, -0.6729736328125, -0.57208251953125, -0.47119140625, -0.37030029296875, -0.2694091796875, -0.16851806640625, -0.067626953125, 0.03326416015625, 0.1341552734375, 0.23504638671875, 0.3359375, 0.43682861328125, 0.5377197265625, 0.63861083984375, 0.739501953125, 0.84039306640625, 0.9412841796875, 1.04217529296875, 1.14306640625, 1.24395751953125, 1.3448486328125, 1.44573974609375, 1.546630859375, 1.64752197265625, 1.7484130859375, 1.84930419921875, 1.9501953125, 2.05108642578125, 2.1519775390625, 2.25286865234375, 2.353759765625, 2.45465087890625, 2.5555419921875, 2.65643310546875, 2.75732421875, 2.85821533203125, 2.9591064453125, 3.05999755859375, 3.160888671875, 3.26177978515625, 3.3626708984375, 3.46356201171875, 3.564453125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 4.0, 0.0, 6.0, 4.0, 3.0, 7.0, 6.0, 1.0, 8.0, 8.0, 5.0, 9.0, 12.0, 14.0, 18.0, 17.0, 32.0, 26.0, 43.0, 39.0, 69.0, 96.0, 147.0, 249.0, 520.0, 1158.0, 3204.0, 12547.0, 325323.0, 3828703.0, 15692.0, 3619.0, 1244.0, 575.0, 273.0, 150.0, 115.0, 74.0, 54.0, 32.0, 26.0, 23.0, 19.0, 19.0, 17.0, 15.0, 13.0, 11.0, 5.0, 12.0, 9.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.609375, -19.966552734375, -19.32373046875, -18.680908203125, -18.0380859375, -17.395263671875, -16.75244140625, -16.109619140625, -15.466796875, -14.823974609375, -14.18115234375, -13.538330078125, -12.8955078125, -12.252685546875, -11.60986328125, -10.967041015625, -10.32421875, -9.681396484375, -9.03857421875, -8.395751953125, -7.7529296875, -7.110107421875, -6.46728515625, -5.824462890625, -5.181640625, -4.538818359375, -3.89599609375, -3.253173828125, -2.6103515625, -1.967529296875, -1.32470703125, -0.681884765625, -0.0390625, 0.603759765625, 1.24658203125, 1.889404296875, 2.5322265625, 3.175048828125, 3.81787109375, 4.460693359375, 5.103515625, 5.746337890625, 6.38916015625, 7.031982421875, 7.6748046875, 8.317626953125, 8.96044921875, 9.603271484375, 10.24609375, 10.888916015625, 11.53173828125, 12.174560546875, 12.8173828125, 13.460205078125, 14.10302734375, 14.745849609375, 15.388671875, 16.031494140625, 16.67431640625, 17.317138671875, 17.9599609375, 18.602783203125, 19.24560546875, 19.888427734375, 20.53125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 10.0, 23.0, 50.0, 197.0, 3541.0, 165.0, 40.0, 22.0, 8.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.263671875, -3.111541748046875, -2.95941162109375, -2.807281494140625, -2.6551513671875, -2.503021240234375, -2.35089111328125, -2.198760986328125, -2.046630859375, -1.894500732421875, -1.74237060546875, -1.590240478515625, -1.4381103515625, -1.285980224609375, -1.13385009765625, -0.981719970703125, -0.82958984375, -0.677459716796875, -0.52532958984375, -0.373199462890625, -0.2210693359375, -0.068939208984375, 0.08319091796875, 0.235321044921875, 0.387451171875, 0.539581298828125, 0.69171142578125, 0.843841552734375, 0.9959716796875, 1.148101806640625, 1.30023193359375, 1.452362060546875, 1.6044921875, 1.756622314453125, 1.90875244140625, 2.060882568359375, 2.2130126953125, 2.365142822265625, 2.51727294921875, 2.669403076171875, 2.821533203125, 2.973663330078125, 3.12579345703125, 3.277923583984375, 3.4300537109375, 3.582183837890625, 3.73431396484375, 3.886444091796875, 4.03857421875, 4.190704345703125, 4.34283447265625, 4.494964599609375, 4.6470947265625, 4.799224853515625, 4.95135498046875, 5.103485107421875, 5.255615234375, 5.407745361328125, 5.55987548828125, 5.712005615234375, 5.8641357421875, 6.016265869140625, 6.16839599609375, 6.320526123046875, 6.47265625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 8.0, 8.0, 33.0, 57.0, 83.0, 126.0, 144.0, 148.0, 146.0, 95.0, 57.0, 39.0, 22.0, 15.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.874612808227539, -15.409102439880371, -14.943591117858887, -14.478080749511719, -14.012569427490234, -13.547059059143066, -13.081548690795898, -12.616037368774414, -12.15052604675293, -11.685015678405762, -11.219504356384277, -10.75399398803711, -10.288482666015625, -9.822972297668457, -9.357461929321289, -8.891950607299805, -8.426440238952637, -7.9609293937683105, -7.495418548583984, -7.029908180236816, -6.564396858215332, -6.098886489868164, -5.633375644683838, -5.167864799499512, -4.7023539543151855, -4.236843109130859, -3.771332263946533, -3.305821657180786, -2.84031081199646, -2.374799966812134, -1.9092893600463867, -1.4437785148620605, -0.978266716003418, -0.5127559304237366, -0.047245144844055176, 0.41826558113098145, 0.8837764263153076, 1.3492872714996338, 1.8147978782653809, 2.280308723449707, 2.745819568634033, 3.2113304138183594, 3.6768412590026855, 4.142352104187012, 4.60786247253418, 5.073373794555664, 5.538884162902832, 6.004395008087158, 6.469905853271484, 6.9354166984558105, 7.400927543640137, 7.866437911987305, 8.331949234008789, 8.797459602355957, 9.262969970703125, 9.72848129272461, 10.193992614746094, 10.659502983093262, 11.125014305114746, 11.590524673461914, 12.056035995483398, 12.521546363830566, 12.987056732177734, 13.452568054199219, 13.918078422546387]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 9.0, 5.0, 12.0, 9.0, 10.0, 17.0, 16.0, 13.0, 26.0, 28.0, 31.0, 22.0, 35.0, 35.0, 35.0, 49.0, 35.0, 29.0, 39.0, 45.0, 40.0, 38.0, 27.0, 44.0, 36.0, 35.0, 22.0, 26.0, 38.0, 30.0, 28.0, 30.0, 12.0, 19.0, 14.0, 10.0, 7.0, 8.0, 6.0, 9.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-5.357210159301758, -5.199270248413086, -5.041330337524414, -4.8833909034729, -4.7254509925842285, -4.567511081695557, -4.409571647644043, -4.251631736755371, -4.093691825866699, -3.9357519149780273, -3.7778122425079346, -3.619872570037842, -3.46193265914917, -3.303992748260498, -3.1460530757904053, -2.9881134033203125, -2.8301734924316406, -2.6722335815429688, -2.514293909072876, -2.356354236602783, -2.1984143257141113, -2.0404744148254395, -1.8825347423553467, -1.7245949506759644, -1.566655158996582, -1.4087153673171997, -1.2507755756378174, -1.092835783958435, -0.9348959922790527, -0.7769562005996704, -0.6190164089202881, -0.46107661724090576, -0.30313634872436523, -0.1451965570449829, 0.012743234634399414, 0.17068302631378174, 0.32862281799316406, 0.4865626096725464, 0.6445024013519287, 0.802442193031311, 0.9603819847106934, 1.1183217763900757, 1.276261568069458, 1.4342013597488403, 1.5921411514282227, 1.750080943107605, 1.9080207347869873, 2.06596040725708, 2.223900318145752, 2.381840229034424, 2.5397799015045166, 2.6977195739746094, 2.8556594848632812, 3.013599395751953, 3.171539068222046, 3.3294787406921387, 3.4874186515808105, 3.6453585624694824, 3.803298234939575, 3.961237907409668, 4.11917781829834, 4.277117729187012, 4.435057640075684, 4.592997074127197, 4.750936985015869]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 11.0, 13.0, 20.0, 19.0, 20.0, 42.0, 75.0, 118.0, 191.0, 377.0, 735.0, 1694.0, 4536.0, 14710.0, 57599.0, 242718.0, 490131.0, 176305.0, 41805.0, 11161.0, 3546.0, 1328.0, 649.0, 318.0, 168.0, 82.0, 73.0, 29.0, 20.0, 23.0, 11.0, 8.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6171875, -9.34539794921875, -9.0736083984375, -8.80181884765625, -8.530029296875, -8.25823974609375, -7.9864501953125, -7.71466064453125, -7.44287109375, -7.17108154296875, -6.8992919921875, -6.62750244140625, -6.355712890625, -6.08392333984375, -5.8121337890625, -5.54034423828125, -5.2685546875, -4.99676513671875, -4.7249755859375, -4.45318603515625, -4.181396484375, -3.90960693359375, -3.6378173828125, -3.36602783203125, -3.09423828125, -2.82244873046875, -2.5506591796875, -2.27886962890625, -2.007080078125, -1.73529052734375, -1.4635009765625, -1.19171142578125, -0.919921875, -0.64813232421875, -0.3763427734375, -0.10455322265625, 0.167236328125, 0.43902587890625, 0.7108154296875, 0.98260498046875, 1.25439453125, 1.52618408203125, 1.7979736328125, 2.06976318359375, 2.341552734375, 2.61334228515625, 2.8851318359375, 3.15692138671875, 3.4287109375, 3.70050048828125, 3.9722900390625, 4.24407958984375, 4.515869140625, 4.78765869140625, 5.0594482421875, 5.33123779296875, 5.60302734375, 5.87481689453125, 6.1466064453125, 6.41839599609375, 6.690185546875, 6.96197509765625, 7.2337646484375, 7.50555419921875, 7.77734375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 7.0, 3.0, 7.0, 9.0, 9.0, 14.0, 17.0, 28.0, 32.0, 39.0, 38.0, 36.0, 48.0, 43.0, 52.0, 51.0, 59.0, 64.0, 59.0, 49.0, 52.0, 42.0, 43.0, 36.0, 34.0, 33.0, 19.0, 12.0, 14.0, 10.0, 13.0, 11.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.203125, -3.096527099609375, -2.98992919921875, -2.883331298828125, -2.7767333984375, -2.670135498046875, -2.56353759765625, -2.456939697265625, -2.350341796875, -2.243743896484375, -2.13714599609375, -2.030548095703125, -1.9239501953125, -1.817352294921875, -1.71075439453125, -1.604156494140625, -1.49755859375, -1.390960693359375, -1.28436279296875, -1.177764892578125, -1.0711669921875, -0.964569091796875, -0.85797119140625, -0.751373291015625, -0.644775390625, -0.538177490234375, -0.43157958984375, -0.324981689453125, -0.2183837890625, -0.111785888671875, -0.00518798828125, 0.101409912109375, 0.2080078125, 0.314605712890625, 0.42120361328125, 0.527801513671875, 0.6343994140625, 0.740997314453125, 0.84759521484375, 0.954193115234375, 1.060791015625, 1.167388916015625, 1.27398681640625, 1.380584716796875, 1.4871826171875, 1.593780517578125, 1.70037841796875, 1.806976318359375, 1.91357421875, 2.020172119140625, 2.12677001953125, 2.233367919921875, 2.3399658203125, 2.446563720703125, 2.55316162109375, 2.659759521484375, 2.766357421875, 2.872955322265625, 2.97955322265625, 3.086151123046875, 3.1927490234375, 3.299346923828125, 3.40594482421875, 3.512542724609375, 3.619140625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 4.0, 10.0, 19.0, 36.0, 57.0, 94.0, 170.0, 346.0, 637.0, 1643.0, 9568.0, 765231.0, 262785.0, 5484.0, 1329.0, 538.0, 255.0, 145.0, 68.0, 42.0, 38.0, 16.0, 10.0, 8.0, 7.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.375, -26.458984375, -25.54296875, -24.626953125, -23.7109375, -22.794921875, -21.87890625, -20.962890625, -20.046875, -19.130859375, -18.21484375, -17.298828125, -16.3828125, -15.466796875, -14.55078125, -13.634765625, -12.71875, -11.802734375, -10.88671875, -9.970703125, -9.0546875, -8.138671875, -7.22265625, -6.306640625, -5.390625, -4.474609375, -3.55859375, -2.642578125, -1.7265625, -0.810546875, 0.10546875, 1.021484375, 1.9375, 2.853515625, 3.76953125, 4.685546875, 5.6015625, 6.517578125, 7.43359375, 8.349609375, 9.265625, 10.181640625, 11.09765625, 12.013671875, 12.9296875, 13.845703125, 14.76171875, 15.677734375, 16.59375, 17.509765625, 18.42578125, 19.341796875, 20.2578125, 21.173828125, 22.08984375, 23.005859375, 23.921875, 24.837890625, 25.75390625, 26.669921875, 27.5859375, 28.501953125, 29.41796875, 30.333984375, 31.25]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 15.0, 25.0, 23.0, 29.0, 43.0, 43.0, 58.0, 72.0, 83.0, 93.0, 67.0, 66.0, 66.0, 53.0, 47.0, 45.0, 34.0, 31.0, 28.0, 15.0, 16.0, 5.0, 13.0, 8.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.625, -18.95068359375, -18.2763671875, -17.60205078125, -16.927734375, -16.25341796875, -15.5791015625, -14.90478515625, -14.23046875, -13.55615234375, -12.8818359375, -12.20751953125, -11.533203125, -10.85888671875, -10.1845703125, -9.51025390625, -8.8359375, -8.16162109375, -7.4873046875, -6.81298828125, -6.138671875, -5.46435546875, -4.7900390625, -4.11572265625, -3.44140625, -2.76708984375, -2.0927734375, -1.41845703125, -0.744140625, -0.06982421875, 0.6044921875, 1.27880859375, 1.953125, 2.62744140625, 3.3017578125, 3.97607421875, 4.650390625, 5.32470703125, 5.9990234375, 6.67333984375, 7.34765625, 8.02197265625, 8.6962890625, 9.37060546875, 10.044921875, 10.71923828125, 11.3935546875, 12.06787109375, 12.7421875, 13.41650390625, 14.0908203125, 14.76513671875, 15.439453125, 16.11376953125, 16.7880859375, 17.46240234375, 18.13671875, 18.81103515625, 19.4853515625, 20.15966796875, 20.833984375, 21.50830078125, 22.1826171875, 22.85693359375, 23.53125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 3.0, 1.0, 3.0, 9.0, 7.0, 8.0, 10.0, 13.0, 26.0, 31.0, 42.0, 75.0, 104.0, 194.0, 388.0, 986.0, 3880.0, 36743.0, 941442.0, 57802.0, 4540.0, 1224.0, 440.0, 212.0, 140.0, 82.0, 48.0, 28.0, 21.0, 17.0, 7.0, 11.0, 3.0, 6.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9140625, -12.5048828125, -12.095703125, -11.6865234375, -11.27734375, -10.8681640625, -10.458984375, -10.0498046875, -9.640625, -9.2314453125, -8.822265625, -8.4130859375, -8.00390625, -7.5947265625, -7.185546875, -6.7763671875, -6.3671875, -5.9580078125, -5.548828125, -5.1396484375, -4.73046875, -4.3212890625, -3.912109375, -3.5029296875, -3.09375, -2.6845703125, -2.275390625, -1.8662109375, -1.45703125, -1.0478515625, -0.638671875, -0.2294921875, 0.1796875, 0.5888671875, 0.998046875, 1.4072265625, 1.81640625, 2.2255859375, 2.634765625, 3.0439453125, 3.453125, 3.8623046875, 4.271484375, 4.6806640625, 5.08984375, 5.4990234375, 5.908203125, 6.3173828125, 6.7265625, 7.1357421875, 7.544921875, 7.9541015625, 8.36328125, 8.7724609375, 9.181640625, 9.5908203125, 10.0, 10.4091796875, 10.818359375, 11.2275390625, 11.63671875, 12.0458984375, 12.455078125, 12.8642578125, 13.2734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 4.0, 16.0, 16.0, 20.0, 46.0, 62.0, 117.0, 179.0, 253.0, 108.0, 60.0, 39.0, 30.0, 12.0, 18.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014667510986328125, -0.0014225691556930542, -0.001378387212753296, -0.0013342052698135376, -0.0012900233268737793, -0.001245841383934021, -0.0012016594409942627, -0.0011574774980545044, -0.001113295555114746, -0.0010691136121749878, -0.0010249316692352295, -0.0009807497262954712, -0.0009365677833557129, -0.0008923858404159546, -0.0008482038974761963, -0.000804021954536438, -0.0007598400115966797, -0.0007156580686569214, -0.0006714761257171631, -0.0006272941827774048, -0.0005831122398376465, -0.0005389302968978882, -0.0004947483539581299, -0.0004505664110183716, -0.0004063844680786133, -0.000362202525138855, -0.0003180205821990967, -0.0002738386392593384, -0.00022965669631958008, -0.00018547475337982178, -0.00014129281044006348, -9.711086750030518e-05, -5.2928924560546875e-05, -8.746981620788574e-06, 3.5434961318969727e-05, 7.961690425872803e-05, 0.00012379884719848633, 0.00016798079013824463, 0.00021216273307800293, 0.00025634467601776123, 0.00030052661895751953, 0.00034470856189727783, 0.00038889050483703613, 0.00043307244777679443, 0.00047725439071655273, 0.000521436333656311, 0.0005656182765960693, 0.0006098002195358276, 0.0006539821624755859, 0.0006981641054153442, 0.0007423460483551025, 0.0007865279912948608, 0.0008307099342346191, 0.0008748918771743774, 0.0009190738201141357, 0.000963255763053894, 0.0010074377059936523, 0.0010516196489334106, 0.001095801591873169, 0.0011399835348129272, 0.0011841654777526855, 0.0012283474206924438, 0.0012725293636322021, 0.0013167113065719604, 0.0013608932495117188]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 11.0, 11.0, 9.0, 17.0, 32.0, 50.0, 78.0, 119.0, 197.0, 349.0, 792.0, 1661.0, 5023.0, 28470.0, 630954.0, 353961.0, 19842.0, 3993.0, 1450.0, 695.0, 335.0, 183.0, 89.0, 73.0, 49.0, 36.0, 15.0, 11.0, 10.0, 13.0, 6.0, 2.0, 6.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4140625, -8.1014404296875, -7.788818359375, -7.4761962890625, -7.16357421875, -6.8509521484375, -6.538330078125, -6.2257080078125, -5.9130859375, -5.6004638671875, -5.287841796875, -4.9752197265625, -4.66259765625, -4.3499755859375, -4.037353515625, -3.7247314453125, -3.412109375, -3.0994873046875, -2.786865234375, -2.4742431640625, -2.16162109375, -1.8489990234375, -1.536376953125, -1.2237548828125, -0.9111328125, -0.5985107421875, -0.285888671875, 0.0267333984375, 0.33935546875, 0.6519775390625, 0.964599609375, 1.2772216796875, 1.58984375, 1.9024658203125, 2.215087890625, 2.5277099609375, 2.84033203125, 3.1529541015625, 3.465576171875, 3.7781982421875, 4.0908203125, 4.4034423828125, 4.716064453125, 5.0286865234375, 5.34130859375, 5.6539306640625, 5.966552734375, 6.2791748046875, 6.591796875, 6.9044189453125, 7.217041015625, 7.5296630859375, 7.84228515625, 8.1549072265625, 8.467529296875, 8.7801513671875, 9.0927734375, 9.4053955078125, 9.718017578125, 10.0306396484375, 10.34326171875, 10.6558837890625, 10.968505859375, 11.2811279296875, 11.59375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 0.0, 4.0, 3.0, 5.0, 12.0, 11.0, 15.0, 19.0, 28.0, 51.0, 62.0, 98.0, 140.0, 150.0, 102.0, 75.0, 64.0, 48.0, 26.0, 26.0, 21.0, 9.0, 7.0, 4.0, 3.0, 1.0, 4.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.528564453125, -6.26806640625, -6.007568359375, -5.7470703125, -5.486572265625, -5.22607421875, -4.965576171875, -4.705078125, -4.444580078125, -4.18408203125, -3.923583984375, -3.6630859375, -3.402587890625, -3.14208984375, -2.881591796875, -2.62109375, -2.360595703125, -2.10009765625, -1.839599609375, -1.5791015625, -1.318603515625, -1.05810546875, -0.797607421875, -0.537109375, -0.276611328125, -0.01611328125, 0.244384765625, 0.5048828125, 0.765380859375, 1.02587890625, 1.286376953125, 1.546875, 1.807373046875, 2.06787109375, 2.328369140625, 2.5888671875, 2.849365234375, 3.10986328125, 3.370361328125, 3.630859375, 3.891357421875, 4.15185546875, 4.412353515625, 4.6728515625, 4.933349609375, 5.19384765625, 5.454345703125, 5.71484375, 5.975341796875, 6.23583984375, 6.496337890625, 6.7568359375, 7.017333984375, 7.27783203125, 7.538330078125, 7.798828125, 8.059326171875, 8.31982421875, 8.580322265625, 8.8408203125, 9.101318359375, 9.36181640625, 9.622314453125, 9.8828125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 11.0, 50.0, 152.0, 286.0, 291.0, 141.0, 44.0, 13.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.44915771484375, -137.2250213623047, -131.00086975097656, -124.77672576904297, -118.55258178710938, -112.32843780517578, -106.10429382324219, -99.88015747070312, -93.656005859375, -87.4318618774414, -81.20771789550781, -74.98357391357422, -68.75942993164062, -62.53528594970703, -56.3111457824707, -50.08700180053711, -43.86286163330078, -37.63871765136719, -31.414573669433594, -25.190431594848633, -18.96628761291504, -12.742143630981445, -6.518001556396484, -0.2938575744628906, 5.930286407470703, 12.154430389404297, 18.37857437133789, 24.60271644592285, 30.826860427856445, 37.051002502441406, 43.275146484375, 49.499290466308594, 55.72343444824219, 61.94757843017578, 68.17172241210938, 74.39586639404297, 80.62001037597656, 86.84415435791016, 93.06829833984375, 99.29243469238281, 105.51658630371094, 111.74073028564453, 117.96487426757812, 124.18901824951172, 130.4131622314453, 136.63729858398438, 142.8614501953125, 149.08558654785156, 155.30972290039062, 161.5338592529297, 167.7580108642578, 173.98214721679688, 180.206298828125, 186.43043518066406, 192.6545867919922, 198.87872314453125, 205.10287475585938, 211.32701110839844, 217.55116271972656, 223.77529907226562, 229.99945068359375, 236.2235870361328, 242.44773864746094, 248.671875, 254.89602661132812]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 4.0, 8.0, 11.0, 10.0, 13.0, 11.0, 14.0, 14.0, 33.0, 24.0, 30.0, 30.0, 56.0, 40.0, 43.0, 52.0, 43.0, 53.0, 62.0, 39.0, 53.0, 38.0, 47.0, 33.0, 34.0, 31.0, 30.0, 17.0, 21.0, 28.0, 16.0, 12.0, 13.0, 11.0, 6.0, 7.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.47263717651367, -61.5108757019043, -59.54911422729492, -57.58735275268555, -55.62559127807617, -53.6638298034668, -51.70207214355469, -49.74031066894531, -47.77854919433594, -45.81678771972656, -43.85502624511719, -41.89326477050781, -39.93150329589844, -37.96974182128906, -36.00798034667969, -34.04621887207031, -32.08445739746094, -30.122695922851562, -28.160934448242188, -26.199172973632812, -24.237411499023438, -22.275650024414062, -20.31389045715332, -18.352128982543945, -16.39036750793457, -14.428606033325195, -12.46684455871582, -10.505084037780762, -8.543322563171387, -6.581561088562012, -4.619800567626953, -2.658039093017578, -0.6962776184082031, 1.2654836177825928, 3.2272448539733887, 5.1890058517456055, 7.1507673263549805, 9.112528800964355, 11.074289321899414, 13.036050796508789, 14.997812271118164, 16.95957374572754, 18.921335220336914, 20.883094787597656, 22.84485626220703, 24.806617736816406, 26.76837921142578, 28.730140686035156, 30.69190216064453, 32.653663635253906, 34.61542510986328, 36.577186584472656, 38.53894805908203, 40.500709533691406, 42.46247100830078, 44.424232482910156, 46.38599395751953, 48.347755432128906, 50.30951690673828, 52.271278381347656, 54.23303985595703, 56.194801330566406, 58.15656280517578, 60.118324279785156, 62.080081939697266]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 4.0, 9.0, 8.0, 11.0, 15.0, 14.0, 40.0, 48.0, 57.0, 114.0, 163.0, 233.0, 388.0, 530.0, 975.0, 1627.0, 2937.0, 6700.0, 21905.0, 185031.0, 3892474.0, 58408.0, 12267.0, 4694.0, 2329.0, 1197.0, 765.0, 446.0, 288.0, 185.0, 125.0, 85.0, 68.0, 37.0, 32.0, 22.0, 11.0, 10.0, 9.0, 7.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.09375, -11.7071533203125, -11.320556640625, -10.9339599609375, -10.54736328125, -10.1607666015625, -9.774169921875, -9.3875732421875, -9.0009765625, -8.6143798828125, -8.227783203125, -7.8411865234375, -7.45458984375, -7.0679931640625, -6.681396484375, -6.2947998046875, -5.908203125, -5.5216064453125, -5.135009765625, -4.7484130859375, -4.36181640625, -3.9752197265625, -3.588623046875, -3.2020263671875, -2.8154296875, -2.4288330078125, -2.042236328125, -1.6556396484375, -1.26904296875, -0.8824462890625, -0.495849609375, -0.1092529296875, 0.27734375, 0.6639404296875, 1.050537109375, 1.4371337890625, 1.82373046875, 2.2103271484375, 2.596923828125, 2.9835205078125, 3.3701171875, 3.7567138671875, 4.143310546875, 4.5299072265625, 4.91650390625, 5.3031005859375, 5.689697265625, 6.0762939453125, 6.462890625, 6.8494873046875, 7.236083984375, 7.6226806640625, 8.00927734375, 8.3958740234375, 8.782470703125, 9.1690673828125, 9.5556640625, 9.9422607421875, 10.328857421875, 10.7154541015625, 11.10205078125, 11.4886474609375, 11.875244140625, 12.2618408203125, 12.6484375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 3.0, 6.0, 7.0, 12.0, 8.0, 15.0, 23.0, 19.0, 21.0, 34.0, 30.0, 41.0, 46.0, 37.0, 52.0, 70.0, 65.0, 59.0, 64.0, 43.0, 50.0, 38.0, 35.0, 43.0, 37.0, 33.0, 20.0, 21.0, 15.0, 13.0, 9.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.23046875, -3.129852294921875, -3.02923583984375, -2.928619384765625, -2.8280029296875, -2.727386474609375, -2.62677001953125, -2.526153564453125, -2.425537109375, -2.324920654296875, -2.22430419921875, -2.123687744140625, -2.0230712890625, -1.922454833984375, -1.82183837890625, -1.721221923828125, -1.62060546875, -1.519989013671875, -1.41937255859375, -1.318756103515625, -1.2181396484375, -1.117523193359375, -1.01690673828125, -0.916290283203125, -0.815673828125, -0.715057373046875, -0.61444091796875, -0.513824462890625, -0.4132080078125, -0.312591552734375, -0.21197509765625, -0.111358642578125, -0.0107421875, 0.089874267578125, 0.19049072265625, 0.291107177734375, 0.3917236328125, 0.492340087890625, 0.59295654296875, 0.693572998046875, 0.794189453125, 0.894805908203125, 0.99542236328125, 1.096038818359375, 1.1966552734375, 1.297271728515625, 1.39788818359375, 1.498504638671875, 1.59912109375, 1.699737548828125, 1.80035400390625, 1.900970458984375, 2.0015869140625, 2.102203369140625, 2.20281982421875, 2.303436279296875, 2.404052734375, 2.504669189453125, 2.60528564453125, 2.705902099609375, 2.8065185546875, 2.907135009765625, 3.00775146484375, 3.108367919921875, 3.208984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 8.0, 6.0, 12.0, 8.0, 15.0, 12.0, 16.0, 28.0, 26.0, 29.0, 69.0, 99.0, 182.0, 291.0, 648.0, 1394.0, 4048.0, 17027.0, 327715.0, 3807366.0, 26360.0, 5418.0, 1801.0, 760.0, 366.0, 198.0, 102.0, 64.0, 56.0, 31.0, 20.0, 13.0, 15.0, 11.0, 8.0, 9.0, 17.0, 5.0, 6.0, 3.0, 3.0, 7.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.078125, -18.5499267578125, -18.021728515625, -17.4935302734375, -16.96533203125, -16.4371337890625, -15.908935546875, -15.3807373046875, -14.8525390625, -14.3243408203125, -13.796142578125, -13.2679443359375, -12.73974609375, -12.2115478515625, -11.683349609375, -11.1551513671875, -10.626953125, -10.0987548828125, -9.570556640625, -9.0423583984375, -8.51416015625, -7.9859619140625, -7.457763671875, -6.9295654296875, -6.4013671875, -5.8731689453125, -5.344970703125, -4.8167724609375, -4.28857421875, -3.7603759765625, -3.232177734375, -2.7039794921875, -2.17578125, -1.6475830078125, -1.119384765625, -0.5911865234375, -0.06298828125, 0.4652099609375, 0.993408203125, 1.5216064453125, 2.0498046875, 2.5780029296875, 3.106201171875, 3.6343994140625, 4.16259765625, 4.6907958984375, 5.218994140625, 5.7471923828125, 6.275390625, 6.8035888671875, 7.331787109375, 7.8599853515625, 8.38818359375, 8.9163818359375, 9.444580078125, 9.9727783203125, 10.5009765625, 11.0291748046875, 11.557373046875, 12.0855712890625, 12.61376953125, 13.1419677734375, 13.670166015625, 14.1983642578125, 14.7265625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 7.0, 11.0, 19.0, 38.0, 85.0, 273.0, 3154.0, 313.0, 89.0, 26.0, 19.0, 11.0, 10.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91015625, -4.70159912109375, -4.4930419921875, -4.28448486328125, -4.075927734375, -3.86737060546875, -3.6588134765625, -3.45025634765625, -3.24169921875, -3.03314208984375, -2.8245849609375, -2.61602783203125, -2.407470703125, -2.19891357421875, -1.9903564453125, -1.78179931640625, -1.5732421875, -1.36468505859375, -1.1561279296875, -0.94757080078125, -0.739013671875, -0.53045654296875, -0.3218994140625, -0.11334228515625, 0.09521484375, 0.30377197265625, 0.5123291015625, 0.72088623046875, 0.929443359375, 1.13800048828125, 1.3465576171875, 1.55511474609375, 1.763671875, 1.97222900390625, 2.1807861328125, 2.38934326171875, 2.597900390625, 2.80645751953125, 3.0150146484375, 3.22357177734375, 3.43212890625, 3.64068603515625, 3.8492431640625, 4.05780029296875, 4.266357421875, 4.47491455078125, 4.6834716796875, 4.89202880859375, 5.1005859375, 5.30914306640625, 5.5177001953125, 5.72625732421875, 5.934814453125, 6.14337158203125, 6.3519287109375, 6.56048583984375, 6.76904296875, 6.97760009765625, 7.1861572265625, 7.39471435546875, 7.603271484375, 7.81182861328125, 8.0203857421875, 8.22894287109375, 8.4375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 6.0, 7.0, 9.0, 12.0, 21.0, 37.0, 55.0, 99.0, 130.0, 157.0, 158.0, 119.0, 75.0, 47.0, 34.0, 13.0, 13.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.69977569580078, -30.904190063476562, -30.10860252380371, -29.313016891479492, -28.517431259155273, -27.721845626831055, -26.926258087158203, -26.130672454833984, -25.335086822509766, -24.539501190185547, -23.743913650512695, -22.948328018188477, -22.152742385864258, -21.35715675354004, -20.561569213867188, -19.76598358154297, -18.97039794921875, -18.17481231689453, -17.37922477722168, -16.58363914489746, -15.788053512573242, -14.992466926574707, -14.196880340576172, -13.401294708251953, -12.605707168579102, -11.810120582580566, -11.014534950256348, -10.218948364257812, -9.423362731933594, -8.627776145935059, -7.832190036773682, -7.036603927612305, -6.241018295288086, -5.445432186126709, -4.649846076965332, -3.854259729385376, -3.058673620223999, -2.263087511062622, -1.467501163482666, -0.6719150543212891, 0.12367105484008789, 0.9192572236061096, 1.7148433923721313, 2.510429620742798, 3.306015729904175, 4.101601600646973, 4.897188186645508, 5.692774295806885, 6.488360404968262, 7.283946514129639, 8.079532623291016, 8.87511920928955, 9.67070484161377, 10.466291427612305, 11.261877059936523, 12.057463645935059, 12.853050231933594, 13.648636817932129, 14.444222450256348, 15.239809036254883, 16.0353946685791, 16.83098030090332, 17.626567840576172, 18.42215347290039, 19.21773910522461]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 7.0, 3.0, 5.0, 9.0, 11.0, 6.0, 12.0, 16.0, 15.0, 15.0, 23.0, 46.0, 38.0, 41.0, 36.0, 41.0, 42.0, 36.0, 50.0, 32.0, 38.0, 35.0, 44.0, 40.0, 33.0, 37.0, 34.0, 52.0, 33.0, 22.0, 21.0, 20.0, 18.0, 16.0, 18.0, 13.0, 7.0, 6.0, 9.0, 4.0, 5.0, 4.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-9.77528190612793, -9.477632522583008, -9.179983139038086, -8.882333755493164, -8.584684371948242, -8.28703498840332, -7.989386081695557, -7.691737174987793, -7.394087791442871, -7.096438407897949, -6.798789024353027, -6.5011396408081055, -6.203490734100342, -5.90584135055542, -5.608191967010498, -5.310543060302734, -5.012893199920654, -4.715243816375732, -4.4175944328308105, -4.119945526123047, -3.822296142578125, -3.524646759033203, -3.2269973754882812, -2.9293482303619385, -2.6316988468170166, -2.3340494632720947, -2.036400318145752, -1.73875093460083, -1.4411016702651978, -1.1434524059295654, -0.8458030223846436, -0.5481538772583008, -0.2505044937133789, 0.047144800424575806, 0.3447940945625305, 0.6424434185028076, 0.9400926828384399, 1.2377419471740723, 1.5353913307189941, 1.833040475845337, 2.130689859390259, 2.4283392429351807, 2.7259883880615234, 3.0236377716064453, 3.321287155151367, 3.61893630027771, 3.916585683822632, 4.214234828948975, 4.5118842124938965, 4.809533596038818, 5.10718297958374, 5.404831886291504, 5.702481269836426, 6.000130653381348, 6.2977800369262695, 6.595429420471191, 6.893078804016113, 7.190728187561035, 7.488377571105957, 7.786026954650879, 8.0836763381958, 8.381324768066406, 8.678974151611328, 8.97662353515625, 9.274272918701172]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 7.0, 2.0, 9.0, 14.0, 17.0, 30.0, 55.0, 82.0, 179.0, 372.0, 679.0, 1513.0, 4020.0, 13001.0, 52889.0, 238275.0, 524980.0, 161407.0, 36063.0, 9444.0, 3058.0, 1264.0, 587.0, 258.0, 140.0, 82.0, 56.0, 27.0, 22.0, 10.0, 8.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.59375, -8.2095947265625, -7.825439453125, -7.4412841796875, -7.05712890625, -6.6729736328125, -6.288818359375, -5.9046630859375, -5.5205078125, -5.1363525390625, -4.752197265625, -4.3680419921875, -3.98388671875, -3.5997314453125, -3.215576171875, -2.8314208984375, -2.447265625, -2.0631103515625, -1.678955078125, -1.2947998046875, -0.91064453125, -0.5264892578125, -0.142333984375, 0.2418212890625, 0.6259765625, 1.0101318359375, 1.394287109375, 1.7784423828125, 2.16259765625, 2.5467529296875, 2.930908203125, 3.3150634765625, 3.69921875, 4.0833740234375, 4.467529296875, 4.8516845703125, 5.23583984375, 5.6199951171875, 6.004150390625, 6.3883056640625, 6.7724609375, 7.1566162109375, 7.540771484375, 7.9249267578125, 8.30908203125, 8.6932373046875, 9.077392578125, 9.4615478515625, 9.845703125, 10.2298583984375, 10.614013671875, 10.9981689453125, 11.38232421875, 11.7664794921875, 12.150634765625, 12.5347900390625, 12.9189453125, 13.3031005859375, 13.687255859375, 14.0714111328125, 14.45556640625, 14.8397216796875, 15.223876953125, 15.6080322265625, 15.9921875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 9.0, 10.0, 4.0, 10.0, 11.0, 14.0, 14.0, 16.0, 30.0, 30.0, 28.0, 47.0, 38.0, 42.0, 50.0, 52.0, 59.0, 50.0, 59.0, 55.0, 46.0, 45.0, 35.0, 40.0, 31.0, 47.0, 30.0, 16.0, 17.0, 12.0, 6.0, 9.0, 13.0, 6.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.90740966796875, -2.8089599609375, -2.71051025390625, -2.612060546875, -2.51361083984375, -2.4151611328125, -2.31671142578125, -2.21826171875, -2.11981201171875, -2.0213623046875, -1.92291259765625, -1.824462890625, -1.72601318359375, -1.6275634765625, -1.52911376953125, -1.4306640625, -1.33221435546875, -1.2337646484375, -1.13531494140625, -1.036865234375, -0.93841552734375, -0.8399658203125, -0.74151611328125, -0.64306640625, -0.54461669921875, -0.4461669921875, -0.34771728515625, -0.249267578125, -0.15081787109375, -0.0523681640625, 0.04608154296875, 0.14453125, 0.24298095703125, 0.3414306640625, 0.43988037109375, 0.538330078125, 0.63677978515625, 0.7352294921875, 0.83367919921875, 0.93212890625, 1.03057861328125, 1.1290283203125, 1.22747802734375, 1.325927734375, 1.42437744140625, 1.5228271484375, 1.62127685546875, 1.7197265625, 1.81817626953125, 1.9166259765625, 2.01507568359375, 2.113525390625, 2.21197509765625, 2.3104248046875, 2.40887451171875, 2.50732421875, 2.60577392578125, 2.7042236328125, 2.80267333984375, 2.901123046875, 2.99957275390625, 3.0980224609375, 3.19647216796875, 3.294921875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 1.0, 5.0, 13.0, 10.0, 14.0, 17.0, 19.0, 41.0, 57.0, 73.0, 127.0, 170.0, 251.0, 484.0, 1008.0, 3317.0, 30820.0, 853500.0, 148323.0, 7006.0, 1604.0, 668.0, 358.0, 181.0, 161.0, 96.0, 71.0, 42.0, 27.0, 18.0, 11.0, 15.0, 13.0, 4.0, 5.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-28.40625, -27.563720703125, -26.72119140625, -25.878662109375, -25.0361328125, -24.193603515625, -23.35107421875, -22.508544921875, -21.666015625, -20.823486328125, -19.98095703125, -19.138427734375, -18.2958984375, -17.453369140625, -16.61083984375, -15.768310546875, -14.92578125, -14.083251953125, -13.24072265625, -12.398193359375, -11.5556640625, -10.713134765625, -9.87060546875, -9.028076171875, -8.185546875, -7.343017578125, -6.50048828125, -5.657958984375, -4.8154296875, -3.972900390625, -3.13037109375, -2.287841796875, -1.4453125, -0.602783203125, 0.23974609375, 1.082275390625, 1.9248046875, 2.767333984375, 3.60986328125, 4.452392578125, 5.294921875, 6.137451171875, 6.97998046875, 7.822509765625, 8.6650390625, 9.507568359375, 10.35009765625, 11.192626953125, 12.03515625, 12.877685546875, 13.72021484375, 14.562744140625, 15.4052734375, 16.247802734375, 17.09033203125, 17.932861328125, 18.775390625, 19.617919921875, 20.46044921875, 21.302978515625, 22.1455078125, 22.988037109375, 23.83056640625, 24.673095703125, 25.515625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 3.0, 6.0, 8.0, 17.0, 12.0, 13.0, 25.0, 34.0, 53.0, 49.0, 43.0, 61.0, 73.0, 77.0, 68.0, 60.0, 68.0, 59.0, 43.0, 54.0, 38.0, 28.0, 31.0, 19.0, 21.0, 8.0, 7.0, 7.0, 4.0, 2.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.546875, -21.97607421875, -21.4052734375, -20.83447265625, -20.263671875, -19.69287109375, -19.1220703125, -18.55126953125, -17.98046875, -17.40966796875, -16.8388671875, -16.26806640625, -15.697265625, -15.12646484375, -14.5556640625, -13.98486328125, -13.4140625, -12.84326171875, -12.2724609375, -11.70166015625, -11.130859375, -10.56005859375, -9.9892578125, -9.41845703125, -8.84765625, -8.27685546875, -7.7060546875, -7.13525390625, -6.564453125, -5.99365234375, -5.4228515625, -4.85205078125, -4.28125, -3.71044921875, -3.1396484375, -2.56884765625, -1.998046875, -1.42724609375, -0.8564453125, -0.28564453125, 0.28515625, 0.85595703125, 1.4267578125, 1.99755859375, 2.568359375, 3.13916015625, 3.7099609375, 4.28076171875, 4.8515625, 5.42236328125, 5.9931640625, 6.56396484375, 7.134765625, 7.70556640625, 8.2763671875, 8.84716796875, 9.41796875, 9.98876953125, 10.5595703125, 11.13037109375, 11.701171875, 12.27197265625, 12.8427734375, 13.41357421875, 13.984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 10.0, 11.0, 24.0, 20.0, 35.0, 59.0, 81.0, 155.0, 292.0, 620.0, 1584.0, 5752.0, 31440.0, 342556.0, 602933.0, 51424.0, 7924.0, 2075.0, 770.0, 348.0, 149.0, 94.0, 65.0, 36.0, 23.0, 18.0, 16.0, 9.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2265625, -6.02642822265625, -5.8262939453125, -5.62615966796875, -5.426025390625, -5.22589111328125, -5.0257568359375, -4.82562255859375, -4.62548828125, -4.42535400390625, -4.2252197265625, -4.02508544921875, -3.824951171875, -3.62481689453125, -3.4246826171875, -3.22454833984375, -3.0244140625, -2.82427978515625, -2.6241455078125, -2.42401123046875, -2.223876953125, -2.02374267578125, -1.8236083984375, -1.62347412109375, -1.42333984375, -1.22320556640625, -1.0230712890625, -0.82293701171875, -0.622802734375, -0.42266845703125, -0.2225341796875, -0.02239990234375, 0.177734375, 0.37786865234375, 0.5780029296875, 0.77813720703125, 0.978271484375, 1.17840576171875, 1.3785400390625, 1.57867431640625, 1.77880859375, 1.97894287109375, 2.1790771484375, 2.37921142578125, 2.579345703125, 2.77947998046875, 2.9796142578125, 3.17974853515625, 3.3798828125, 3.58001708984375, 3.7801513671875, 3.98028564453125, 4.180419921875, 4.38055419921875, 4.5806884765625, 4.78082275390625, 4.98095703125, 5.18109130859375, 5.3812255859375, 5.58135986328125, 5.781494140625, 5.98162841796875, 6.1817626953125, 6.38189697265625, 6.58203125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 11.0, 5.0, 10.0, 14.0, 14.0, 23.0, 18.0, 42.0, 38.0, 48.0, 59.0, 112.0, 148.0, 117.0, 73.0, 55.0, 38.0, 27.0, 39.0, 31.0, 19.0, 9.0, 9.0, 2.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00104522705078125, -0.001012369990348816, -0.0009795129299163818, -0.0009466558694839478, -0.0009137988090515137, -0.0008809417486190796, -0.0008480846881866455, -0.0008152276277542114, -0.0007823705673217773, -0.0007495135068893433, -0.0007166564464569092, -0.0006837993860244751, -0.000650942325592041, -0.0006180852651596069, -0.0005852282047271729, -0.0005523711442947388, -0.0005195140838623047, -0.0004866570234298706, -0.0004537999629974365, -0.00042094290256500244, -0.00038808584213256836, -0.0003552287817001343, -0.0003223717212677002, -0.0002895146608352661, -0.00025665760040283203, -0.00022380053997039795, -0.00019094347953796387, -0.00015808641910552979, -0.0001252293586730957, -9.237229824066162e-05, -5.951523780822754e-05, -2.6658177375793457e-05, 6.198883056640625e-06, 3.905594348907471e-05, 7.191300392150879e-05, 0.00010477006435394287, 0.00013762712478637695, 0.00017048418521881104, 0.00020334124565124512, 0.0002361983060836792, 0.0002690553665161133, 0.00030191242694854736, 0.00033476948738098145, 0.00036762654781341553, 0.0004004836082458496, 0.0004333406686782837, 0.0004661977291107178, 0.0004990547895431519, 0.0005319118499755859, 0.00056476891040802, 0.0005976259708404541, 0.0006304830312728882, 0.0006633400917053223, 0.0006961971521377563, 0.0007290542125701904, 0.0007619112730026245, 0.0007947683334350586, 0.0008276253938674927, 0.0008604824542999268, 0.0008933395147323608, 0.0009261965751647949, 0.000959053635597229, 0.000991910696029663, 0.0010247677564620972, 0.0010576248168945312]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 5.0, 13.0, 15.0, 9.0, 21.0, 33.0, 38.0, 79.0, 102.0, 120.0, 222.0, 366.0, 601.0, 1372.0, 3890.0, 20518.0, 238107.0, 704697.0, 65677.0, 8246.0, 2319.0, 867.0, 469.0, 244.0, 183.0, 93.0, 56.0, 47.0, 51.0, 23.0, 21.0, 15.0, 7.0, 8.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.671875, -6.46502685546875, -6.2581787109375, -6.05133056640625, -5.844482421875, -5.63763427734375, -5.4307861328125, -5.22393798828125, -5.01708984375, -4.81024169921875, -4.6033935546875, -4.39654541015625, -4.189697265625, -3.98284912109375, -3.7760009765625, -3.56915283203125, -3.3623046875, -3.15545654296875, -2.9486083984375, -2.74176025390625, -2.534912109375, -2.32806396484375, -2.1212158203125, -1.91436767578125, -1.70751953125, -1.50067138671875, -1.2938232421875, -1.08697509765625, -0.880126953125, -0.67327880859375, -0.4664306640625, -0.25958251953125, -0.052734375, 0.15411376953125, 0.3609619140625, 0.56781005859375, 0.774658203125, 0.98150634765625, 1.1883544921875, 1.39520263671875, 1.60205078125, 1.80889892578125, 2.0157470703125, 2.22259521484375, 2.429443359375, 2.63629150390625, 2.8431396484375, 3.04998779296875, 3.2568359375, 3.46368408203125, 3.6705322265625, 3.87738037109375, 4.084228515625, 4.29107666015625, 4.4979248046875, 4.70477294921875, 4.91162109375, 5.11846923828125, 5.3253173828125, 5.53216552734375, 5.739013671875, 5.94586181640625, 6.1527099609375, 6.35955810546875, 6.56640625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 3.0, 7.0, 8.0, 9.0, 19.0, 5.0, 18.0, 25.0, 16.0, 29.0, 27.0, 28.0, 31.0, 29.0, 38.0, 57.0, 47.0, 59.0, 62.0, 53.0, 56.0, 46.0, 43.0, 37.0, 40.0, 33.0, 24.0, 19.0, 20.0, 16.0, 16.0, 10.0, 12.0, 12.0, 6.0, 5.0, 6.0, 5.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.26171875, -3.16217041015625, -3.0626220703125, -2.96307373046875, -2.863525390625, -2.76397705078125, -2.6644287109375, -2.56488037109375, -2.46533203125, -2.36578369140625, -2.2662353515625, -2.16668701171875, -2.067138671875, -1.96759033203125, -1.8680419921875, -1.76849365234375, -1.6689453125, -1.56939697265625, -1.4698486328125, -1.37030029296875, -1.270751953125, -1.17120361328125, -1.0716552734375, -0.97210693359375, -0.87255859375, -0.77301025390625, -0.6734619140625, -0.57391357421875, -0.474365234375, -0.37481689453125, -0.2752685546875, -0.17572021484375, -0.076171875, 0.02337646484375, 0.1229248046875, 0.22247314453125, 0.322021484375, 0.42156982421875, 0.5211181640625, 0.62066650390625, 0.72021484375, 0.81976318359375, 0.9193115234375, 1.01885986328125, 1.118408203125, 1.21795654296875, 1.3175048828125, 1.41705322265625, 1.5166015625, 1.61614990234375, 1.7156982421875, 1.81524658203125, 1.914794921875, 2.01434326171875, 2.1138916015625, 2.21343994140625, 2.31298828125, 2.41253662109375, 2.5120849609375, 2.61163330078125, 2.711181640625, 2.81072998046875, 2.9102783203125, 3.00982666015625, 3.109375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 22.0, 38.0, 105.0, 186.0, 267.0, 199.0, 105.0, 42.0, 15.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-189.07131958007812, -183.71221923828125, -178.35311889648438, -172.9940185546875, -167.6349334716797, -162.2758331298828, -156.91673278808594, -151.55763244628906, -146.19854736328125, -140.83944702148438, -135.4803466796875, -130.12124633789062, -124.76216125488281, -119.40306091308594, -114.04396057128906, -108.68486022949219, -103.32575988769531, -97.96665954589844, -92.6075668334961, -87.24846649169922, -81.88937377929688, -76.5302734375, -71.17117309570312, -65.81207275390625, -60.452980041503906, -55.0938835144043, -49.73478698730469, -44.37568664550781, -39.0165901184082, -33.657493591308594, -28.29839324951172, -22.93929672241211, -17.5802001953125, -12.221102714538574, -6.862005233764648, -1.5029067993164062, 3.856189727783203, 9.215286254882812, 14.574386596679688, 19.933483123779297, 25.292579650878906, 30.651676177978516, 36.010772705078125, 41.369873046875, 46.72896957397461, 52.08806610107422, 57.447166442871094, 62.8062629699707, 68.16535949707031, 73.52445983886719, 78.88355255126953, 84.2426528930664, 89.60174560546875, 94.96084594726562, 100.3199462890625, 105.67904663085938, 111.03813934326172, 116.3972396850586, 121.75633239746094, 127.11543273925781, 132.4745330810547, 137.8336181640625, 143.19271850585938, 148.55181884765625, 153.91091918945312]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 1.0, 4.0, 6.0, 4.0, 7.0, 11.0, 10.0, 14.0, 16.0, 16.0, 28.0, 29.0, 30.0, 51.0, 41.0, 50.0, 41.0, 59.0, 45.0, 52.0, 58.0, 38.0, 48.0, 40.0, 47.0, 27.0, 44.0, 32.0, 25.0, 28.0, 16.0, 16.0, 12.0, 14.0, 11.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-59.929161071777344, -58.04840850830078, -56.16765594482422, -54.286903381347656, -52.406150817871094, -50.52539825439453, -48.644649505615234, -46.76389694213867, -44.88314437866211, -43.00239181518555, -41.121639251708984, -39.24088668823242, -37.360137939453125, -35.47938537597656, -33.5986328125, -31.717880249023438, -29.837127685546875, -27.956375122070312, -26.07562255859375, -24.19487190246582, -22.314119338989258, -20.433366775512695, -18.552616119384766, -16.671863555908203, -14.79111099243164, -12.910358428955078, -11.029606819152832, -9.148855209350586, -7.268102645874023, -5.387350082397461, -3.506598472595215, -1.6258468627929688, 0.25490570068359375, 2.135657787322998, 4.016409873962402, 5.897161960601807, 7.777914047241211, 9.658666610717773, 11.53941822052002, 13.420169830322266, 15.300922393798828, 17.18167495727539, 19.062427520751953, 20.943178176879883, 22.823930740356445, 24.704683303833008, 26.585433959960938, 28.4661865234375, 30.346939086914062, 32.227691650390625, 34.10844421386719, 35.98919677734375, 37.86994934082031, 39.750701904296875, 41.63145065307617, 43.512203216552734, 45.3929557800293, 47.27370834350586, 49.15446090698242, 51.035213470458984, 52.91596221923828, 54.796714782714844, 56.677467346191406, 58.55821990966797, 60.43897247314453]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 7.0, 15.0, 16.0, 30.0, 51.0, 86.0, 133.0, 231.0, 413.0, 778.0, 1620.0, 3599.0, 9096.0, 26271.0, 107681.0, 1264759.0, 2557272.0, 166692.0, 36068.0, 11328.0, 4355.0, 1861.0, 841.0, 456.0, 266.0, 130.0, 90.0, 53.0, 33.0, 20.0, 11.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.45703125, -7.23187255859375, -7.0067138671875, -6.78155517578125, -6.556396484375, -6.33123779296875, -6.1060791015625, -5.88092041015625, -5.65576171875, -5.43060302734375, -5.2054443359375, -4.98028564453125, -4.755126953125, -4.52996826171875, -4.3048095703125, -4.07965087890625, -3.8544921875, -3.62933349609375, -3.4041748046875, -3.17901611328125, -2.953857421875, -2.72869873046875, -2.5035400390625, -2.27838134765625, -2.05322265625, -1.82806396484375, -1.6029052734375, -1.37774658203125, -1.152587890625, -0.92742919921875, -0.7022705078125, -0.47711181640625, -0.251953125, -0.02679443359375, 0.1983642578125, 0.42352294921875, 0.648681640625, 0.87384033203125, 1.0989990234375, 1.32415771484375, 1.54931640625, 1.77447509765625, 1.9996337890625, 2.22479248046875, 2.449951171875, 2.67510986328125, 2.9002685546875, 3.12542724609375, 3.3505859375, 3.57574462890625, 3.8009033203125, 4.02606201171875, 4.251220703125, 4.47637939453125, 4.7015380859375, 4.92669677734375, 5.15185546875, 5.37701416015625, 5.6021728515625, 5.82733154296875, 6.052490234375, 6.27764892578125, 6.5028076171875, 6.72796630859375, 6.953125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 6.0, 6.0, 6.0, 7.0, 8.0, 13.0, 14.0, 20.0, 21.0, 18.0, 33.0, 52.0, 36.0, 43.0, 54.0, 60.0, 57.0, 61.0, 56.0, 56.0, 49.0, 44.0, 45.0, 38.0, 49.0, 31.0, 26.0, 23.0, 18.0, 20.0, 9.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.806640625, -3.70263671875, -3.5986328125, -3.49462890625, -3.390625, -3.28662109375, -3.1826171875, -3.07861328125, -2.974609375, -2.87060546875, -2.7666015625, -2.66259765625, -2.55859375, -2.45458984375, -2.3505859375, -2.24658203125, -2.142578125, -2.03857421875, -1.9345703125, -1.83056640625, -1.7265625, -1.62255859375, -1.5185546875, -1.41455078125, -1.310546875, -1.20654296875, -1.1025390625, -0.99853515625, -0.89453125, -0.79052734375, -0.6865234375, -0.58251953125, -0.478515625, -0.37451171875, -0.2705078125, -0.16650390625, -0.0625, 0.04150390625, 0.1455078125, 0.24951171875, 0.353515625, 0.45751953125, 0.5615234375, 0.66552734375, 0.76953125, 0.87353515625, 0.9775390625, 1.08154296875, 1.185546875, 1.28955078125, 1.3935546875, 1.49755859375, 1.6015625, 1.70556640625, 1.8095703125, 1.91357421875, 2.017578125, 2.12158203125, 2.2255859375, 2.32958984375, 2.43359375, 2.53759765625, 2.6416015625, 2.74560546875, 2.849609375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 13.0, 9.0, 21.0, 51.0, 92.0, 178.0, 447.0, 1430.0, 5442.0, 29708.0, 405270.0, 3624568.0, 108096.0, 14249.0, 3145.0, 902.0, 319.0, 143.0, 86.0, 24.0, 29.0, 15.0, 9.0, 7.0, 2.0, 7.0, 2.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.828125, -14.4195556640625, -14.010986328125, -13.6024169921875, -13.19384765625, -12.7852783203125, -12.376708984375, -11.9681396484375, -11.5595703125, -11.1510009765625, -10.742431640625, -10.3338623046875, -9.92529296875, -9.5167236328125, -9.108154296875, -8.6995849609375, -8.291015625, -7.8824462890625, -7.473876953125, -7.0653076171875, -6.65673828125, -6.2481689453125, -5.839599609375, -5.4310302734375, -5.0224609375, -4.6138916015625, -4.205322265625, -3.7967529296875, -3.38818359375, -2.9796142578125, -2.571044921875, -2.1624755859375, -1.75390625, -1.3453369140625, -0.936767578125, -0.5281982421875, -0.11962890625, 0.2889404296875, 0.697509765625, 1.1060791015625, 1.5146484375, 1.9232177734375, 2.331787109375, 2.7403564453125, 3.14892578125, 3.5574951171875, 3.966064453125, 4.3746337890625, 4.783203125, 5.1917724609375, 5.600341796875, 6.0089111328125, 6.41748046875, 6.8260498046875, 7.234619140625, 7.6431884765625, 8.0517578125, 8.4603271484375, 8.868896484375, 9.2774658203125, 9.68603515625, 10.0946044921875, 10.503173828125, 10.9117431640625, 11.3203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 7.0, 5.0, 14.0, 26.0, 34.0, 52.0, 59.0, 86.0, 140.0, 281.0, 628.0, 1045.0, 787.0, 377.0, 174.0, 108.0, 64.0, 48.0, 35.0, 22.0, 21.0, 10.0, 11.0, 1.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3984375, -8.115478515625, -7.83251953125, -7.549560546875, -7.2666015625, -6.983642578125, -6.70068359375, -6.417724609375, -6.134765625, -5.851806640625, -5.56884765625, -5.285888671875, -5.0029296875, -4.719970703125, -4.43701171875, -4.154052734375, -3.87109375, -3.588134765625, -3.30517578125, -3.022216796875, -2.7392578125, -2.456298828125, -2.17333984375, -1.890380859375, -1.607421875, -1.324462890625, -1.04150390625, -0.758544921875, -0.4755859375, -0.192626953125, 0.09033203125, 0.373291015625, 0.65625, 0.939208984375, 1.22216796875, 1.505126953125, 1.7880859375, 2.071044921875, 2.35400390625, 2.636962890625, 2.919921875, 3.202880859375, 3.48583984375, 3.768798828125, 4.0517578125, 4.334716796875, 4.61767578125, 4.900634765625, 5.18359375, 5.466552734375, 5.74951171875, 6.032470703125, 6.3154296875, 6.598388671875, 6.88134765625, 7.164306640625, 7.447265625, 7.730224609375, 8.01318359375, 8.296142578125, 8.5791015625, 8.862060546875, 9.14501953125, 9.427978515625, 9.7109375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 12.0, 8.0, 19.0, 52.0, 100.0, 217.0, 238.0, 183.0, 99.0, 32.0, 14.0, 12.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.02342224121094, -89.48925018310547, -85.95508575439453, -82.42091369628906, -78.88674926757812, -75.35257720947266, -71.81840515136719, -68.28424072265625, -64.75006866455078, -61.21590042114258, -57.681732177734375, -54.147560119628906, -50.6133918762207, -47.0792236328125, -43.5450553894043, -40.010887145996094, -36.47671890258789, -32.94255065917969, -29.40838050842285, -25.87421226501465, -22.340042114257812, -18.80587387084961, -15.271705627441406, -11.73753547668457, -8.203367233276367, -4.669198036193848, -1.1350293159484863, 2.399139404296875, 5.9333086013793945, 9.467477798461914, 13.001646041870117, 16.535816192626953, 20.069984436035156, 23.60415267944336, 27.138322830200195, 30.6724910736084, 34.206661224365234, 37.74082946777344, 41.27499771118164, 44.809165954589844, 48.34333801269531, 51.877506256103516, 55.41167449951172, 58.94584655761719, 62.48001480102539, 66.0141830444336, 69.54835510253906, 73.08251953125, 76.61668395996094, 80.1508560180664, 83.68502044677734, 87.21919250488281, 90.75335693359375, 94.28752899169922, 97.82170104980469, 101.35586547851562, 104.8900375366211, 108.42420959472656, 111.9583740234375, 115.49254608154297, 119.0267105102539, 122.56088256835938, 126.09504699707031, 129.6292266845703, 133.16339111328125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 5.0, 3.0, 12.0, 13.0, 14.0, 6.0, 11.0, 21.0, 21.0, 24.0, 30.0, 35.0, 35.0, 35.0, 48.0, 41.0, 57.0, 42.0, 49.0, 55.0, 42.0, 41.0, 48.0, 43.0, 38.0, 34.0, 23.0, 27.0, 19.0, 27.0, 24.0, 19.0, 16.0, 7.0, 5.0, 7.0, 5.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-37.557533264160156, -36.48500442504883, -35.412471771240234, -34.339942932128906, -33.26741409301758, -32.194881439208984, -31.122352600097656, -30.049821853637695, -28.977291107177734, -27.904760360717773, -26.832231521606445, -25.759700775146484, -24.687170028686523, -23.614639282226562, -22.542110443115234, -21.469579696655273, -20.397050857543945, -19.324520111083984, -18.251991271972656, -17.179460525512695, -16.106929779052734, -15.03439998626709, -13.961870193481445, -12.889339447021484, -11.81680965423584, -10.744279861450195, -9.671749114990234, -8.59921932220459, -7.526689052581787, -6.454158782958984, -5.38162899017334, -4.309098720550537, -3.236570358276367, -2.1640400886535645, -1.0915100574493408, -0.018980026245117188, 1.0535502433776855, 2.1260805130004883, 3.198610305786133, 4.2711405754089355, 5.343670845031738, 6.416201114654541, 7.488731384277344, 8.561261177062988, 9.633790969848633, 10.706321716308594, 11.778851509094238, 12.851381301879883, 13.923912048339844, 14.996441841125488, 16.068971633911133, 17.141502380371094, 18.214033126831055, 19.286563873291016, 20.359092712402344, 21.431623458862305, 22.504154205322266, 23.576684951782227, 24.649213790893555, 25.721744537353516, 26.794275283813477, 27.866806030273438, 28.939334869384766, 30.011865615844727, 31.084394454956055]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 8.0, 19.0, 24.0, 36.0, 68.0, 85.0, 160.0, 232.0, 367.0, 640.0, 1051.0, 1803.0, 3281.0, 6007.0, 12021.0, 24831.0, 55095.0, 133859.0, 343133.0, 277241.0, 102737.0, 44168.0, 20144.0, 9715.0, 5128.0, 2652.0, 1573.0, 923.0, 556.0, 349.0, 224.0, 151.0, 75.0, 49.0, 36.0, 27.0, 20.0, 19.0, 10.0, 3.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-6.28125, -6.0841064453125, -5.886962890625, -5.6898193359375, -5.49267578125, -5.2955322265625, -5.098388671875, -4.9012451171875, -4.7041015625, -4.5069580078125, -4.309814453125, -4.1126708984375, -3.91552734375, -3.7183837890625, -3.521240234375, -3.3240966796875, -3.126953125, -2.9298095703125, -2.732666015625, -2.5355224609375, -2.33837890625, -2.1412353515625, -1.944091796875, -1.7469482421875, -1.5498046875, -1.3526611328125, -1.155517578125, -0.9583740234375, -0.76123046875, -0.5640869140625, -0.366943359375, -0.1697998046875, 0.02734375, 0.2244873046875, 0.421630859375, 0.6187744140625, 0.81591796875, 1.0130615234375, 1.210205078125, 1.4073486328125, 1.6044921875, 1.8016357421875, 1.998779296875, 2.1959228515625, 2.39306640625, 2.5902099609375, 2.787353515625, 2.9844970703125, 3.181640625, 3.3787841796875, 3.575927734375, 3.7730712890625, 3.97021484375, 4.1673583984375, 4.364501953125, 4.5616455078125, 4.7587890625, 4.9559326171875, 5.153076171875, 5.3502197265625, 5.54736328125, 5.7445068359375, 5.941650390625, 6.1387939453125, 6.3359375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 8.0, 6.0, 7.0, 6.0, 15.0, 15.0, 6.0, 17.0, 22.0, 25.0, 29.0, 31.0, 26.0, 32.0, 37.0, 48.0, 41.0, 61.0, 47.0, 43.0, 50.0, 44.0, 48.0, 40.0, 41.0, 29.0, 31.0, 27.0, 23.0, 29.0, 21.0, 21.0, 16.0, 15.0, 9.0, 9.0, 5.0, 4.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.4921875, -2.4073486328125, -2.322509765625, -2.2376708984375, -2.15283203125, -2.0679931640625, -1.983154296875, -1.8983154296875, -1.8134765625, -1.7286376953125, -1.643798828125, -1.5589599609375, -1.47412109375, -1.3892822265625, -1.304443359375, -1.2196044921875, -1.134765625, -1.0499267578125, -0.965087890625, -0.8802490234375, -0.79541015625, -0.7105712890625, -0.625732421875, -0.5408935546875, -0.4560546875, -0.3712158203125, -0.286376953125, -0.2015380859375, -0.11669921875, -0.0318603515625, 0.052978515625, 0.1378173828125, 0.22265625, 0.3074951171875, 0.392333984375, 0.4771728515625, 0.56201171875, 0.6468505859375, 0.731689453125, 0.8165283203125, 0.9013671875, 0.9862060546875, 1.071044921875, 1.1558837890625, 1.24072265625, 1.3255615234375, 1.410400390625, 1.4952392578125, 1.580078125, 1.6649169921875, 1.749755859375, 1.8345947265625, 1.91943359375, 2.0042724609375, 2.089111328125, 2.1739501953125, 2.2587890625, 2.3436279296875, 2.428466796875, 2.5133056640625, 2.59814453125, 2.6829833984375, 2.767822265625, 2.8526611328125, 2.9375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 6.0, 10.0, 11.0, 20.0, 20.0, 27.0, 38.0, 64.0, 96.0, 114.0, 183.0, 318.0, 573.0, 1520.0, 5880.0, 88029.0, 904499.0, 40662.0, 4034.0, 1145.0, 493.0, 258.0, 168.0, 104.0, 78.0, 47.0, 33.0, 27.0, 14.0, 18.0, 12.0, 11.0, 7.0, 2.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.15625, -21.375732421875, -20.59521484375, -19.814697265625, -19.0341796875, -18.253662109375, -17.47314453125, -16.692626953125, -15.912109375, -15.131591796875, -14.35107421875, -13.570556640625, -12.7900390625, -12.009521484375, -11.22900390625, -10.448486328125, -9.66796875, -8.887451171875, -8.10693359375, -7.326416015625, -6.5458984375, -5.765380859375, -4.98486328125, -4.204345703125, -3.423828125, -2.643310546875, -1.86279296875, -1.082275390625, -0.3017578125, 0.478759765625, 1.25927734375, 2.039794921875, 2.8203125, 3.600830078125, 4.38134765625, 5.161865234375, 5.9423828125, 6.722900390625, 7.50341796875, 8.283935546875, 9.064453125, 9.844970703125, 10.62548828125, 11.406005859375, 12.1865234375, 12.967041015625, 13.74755859375, 14.528076171875, 15.30859375, 16.089111328125, 16.86962890625, 17.650146484375, 18.4306640625, 19.211181640625, 19.99169921875, 20.772216796875, 21.552734375, 22.333251953125, 23.11376953125, 23.894287109375, 24.6748046875, 25.455322265625, 26.23583984375, 27.016357421875, 27.796875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 5.0, 9.0, 9.0, 18.0, 15.0, 15.0, 17.0, 19.0, 25.0, 21.0, 32.0, 31.0, 41.0, 36.0, 49.0, 40.0, 42.0, 48.0, 43.0, 45.0, 41.0, 46.0, 37.0, 35.0, 41.0, 32.0, 27.0, 17.0, 15.0, 18.0, 19.0, 20.0, 11.0, 10.0, 13.0, 10.0, 6.0, 6.0, 7.0, 2.0, 5.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.7734375, -11.4317626953125, -11.090087890625, -10.7484130859375, -10.40673828125, -10.0650634765625, -9.723388671875, -9.3817138671875, -9.0400390625, -8.6983642578125, -8.356689453125, -8.0150146484375, -7.67333984375, -7.3316650390625, -6.989990234375, -6.6483154296875, -6.306640625, -5.9649658203125, -5.623291015625, -5.2816162109375, -4.93994140625, -4.5982666015625, -4.256591796875, -3.9149169921875, -3.5732421875, -3.2315673828125, -2.889892578125, -2.5482177734375, -2.20654296875, -1.8648681640625, -1.523193359375, -1.1815185546875, -0.83984375, -0.4981689453125, -0.156494140625, 0.1851806640625, 0.52685546875, 0.8685302734375, 1.210205078125, 1.5518798828125, 1.8935546875, 2.2352294921875, 2.576904296875, 2.9185791015625, 3.26025390625, 3.6019287109375, 3.943603515625, 4.2852783203125, 4.626953125, 4.9686279296875, 5.310302734375, 5.6519775390625, 5.99365234375, 6.3353271484375, 6.677001953125, 7.0186767578125, 7.3603515625, 7.7020263671875, 8.043701171875, 8.3853759765625, 8.72705078125, 9.0687255859375, 9.410400390625, 9.7520751953125, 10.09375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 1.0, 1.0, 6.0, 16.0, 10.0, 14.0, 23.0, 34.0, 44.0, 74.0, 158.0, 263.0, 657.0, 2252.0, 12520.0, 232739.0, 768008.0, 26440.0, 3552.0, 966.0, 336.0, 185.0, 93.0, 63.0, 31.0, 17.0, 17.0, 8.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.91015625, -7.62921142578125, -7.3482666015625, -7.06732177734375, -6.786376953125, -6.50543212890625, -6.2244873046875, -5.94354248046875, -5.66259765625, -5.38165283203125, -5.1007080078125, -4.81976318359375, -4.538818359375, -4.25787353515625, -3.9769287109375, -3.69598388671875, -3.4150390625, -3.13409423828125, -2.8531494140625, -2.57220458984375, -2.291259765625, -2.01031494140625, -1.7293701171875, -1.44842529296875, -1.16748046875, -0.88653564453125, -0.6055908203125, -0.32464599609375, -0.043701171875, 0.23724365234375, 0.5181884765625, 0.79913330078125, 1.080078125, 1.36102294921875, 1.6419677734375, 1.92291259765625, 2.203857421875, 2.48480224609375, 2.7657470703125, 3.04669189453125, 3.32763671875, 3.60858154296875, 3.8895263671875, 4.17047119140625, 4.451416015625, 4.73236083984375, 5.0133056640625, 5.29425048828125, 5.5751953125, 5.85614013671875, 6.1370849609375, 6.41802978515625, 6.698974609375, 6.97991943359375, 7.2608642578125, 7.54180908203125, 7.82275390625, 8.10369873046875, 8.3846435546875, 8.66558837890625, 8.946533203125, 9.22747802734375, 9.5084228515625, 9.78936767578125, 10.0703125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 8.0, 5.0, 8.0, 12.0, 7.0, 17.0, 17.0, 24.0, 24.0, 43.0, 45.0, 68.0, 109.0, 147.0, 127.0, 75.0, 53.0, 26.0, 28.0, 17.0, 24.0, 18.0, 15.0, 17.0, 13.0, 13.0, 6.0, 7.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008487701416015625, -0.0008218884468078613, -0.0007950067520141602, -0.000768125057220459, -0.0007412433624267578, -0.0007143616676330566, -0.0006874799728393555, -0.0006605982780456543, -0.0006337165832519531, -0.000606834888458252, -0.0005799531936645508, -0.0005530714988708496, -0.0005261898040771484, -0.0004993081092834473, -0.0004724264144897461, -0.0004455447196960449, -0.00041866302490234375, -0.0003917813301086426, -0.0003648996353149414, -0.00033801794052124023, -0.00031113624572753906, -0.0002842545509338379, -0.0002573728561401367, -0.00023049116134643555, -0.00020360946655273438, -0.0001767277717590332, -0.00014984607696533203, -0.00012296438217163086, -9.608268737792969e-05, -6.920099258422852e-05, -4.2319297790527344e-05, -1.5437602996826172e-05, 1.1444091796875e-05, 3.832578659057617e-05, 6.520748138427734e-05, 9.208917617797852e-05, 0.00011897087097167969, 0.00014585256576538086, 0.00017273426055908203, 0.0001996159553527832, 0.00022649765014648438, 0.00025337934494018555, 0.0002802610397338867, 0.0003071427345275879, 0.00033402442932128906, 0.00036090612411499023, 0.0003877878189086914, 0.0004146695137023926, 0.00044155120849609375, 0.0004684329032897949, 0.0004953145980834961, 0.0005221962928771973, 0.0005490779876708984, 0.0005759596824645996, 0.0006028413772583008, 0.000629723072052002, 0.0006566047668457031, 0.0006834864616394043, 0.0007103681564331055, 0.0007372498512268066, 0.0007641315460205078, 0.000791013240814209, 0.0008178949356079102, 0.0008447766304016113, 0.0008716583251953125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 7.0, 9.0, 9.0, 14.0, 16.0, 33.0, 25.0, 44.0, 72.0, 128.0, 177.0, 330.0, 675.0, 1602.0, 5338.0, 36323.0, 766925.0, 216643.0, 14692.0, 3141.0, 1112.0, 517.0, 255.0, 167.0, 103.0, 51.0, 42.0, 43.0, 16.0, 16.0, 10.0, 4.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.70703125, -6.45672607421875, -6.2064208984375, -5.95611572265625, -5.705810546875, -5.45550537109375, -5.2052001953125, -4.95489501953125, -4.70458984375, -4.45428466796875, -4.2039794921875, -3.95367431640625, -3.703369140625, -3.45306396484375, -3.2027587890625, -2.95245361328125, -2.7021484375, -2.45184326171875, -2.2015380859375, -1.95123291015625, -1.700927734375, -1.45062255859375, -1.2003173828125, -0.95001220703125, -0.69970703125, -0.44940185546875, -0.1990966796875, 0.05120849609375, 0.301513671875, 0.55181884765625, 0.8021240234375, 1.05242919921875, 1.302734375, 1.55303955078125, 1.8033447265625, 2.05364990234375, 2.303955078125, 2.55426025390625, 2.8045654296875, 3.05487060546875, 3.30517578125, 3.55548095703125, 3.8057861328125, 4.05609130859375, 4.306396484375, 4.55670166015625, 4.8070068359375, 5.05731201171875, 5.3076171875, 5.55792236328125, 5.8082275390625, 6.05853271484375, 6.308837890625, 6.55914306640625, 6.8094482421875, 7.05975341796875, 7.31005859375, 7.56036376953125, 7.8106689453125, 8.06097412109375, 8.311279296875, 8.56158447265625, 8.8118896484375, 9.06219482421875, 9.3125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 10.0, 8.0, 9.0, 7.0, 18.0, 28.0, 22.0, 48.0, 64.0, 79.0, 105.0, 107.0, 121.0, 79.0, 76.0, 48.0, 36.0, 36.0, 21.0, 22.0, 12.0, 11.0, 12.0, 6.0, 2.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.9375, -3.77142333984375, -3.6053466796875, -3.43927001953125, -3.273193359375, -3.10711669921875, -2.9410400390625, -2.77496337890625, -2.60888671875, -2.44281005859375, -2.2767333984375, -2.11065673828125, -1.944580078125, -1.77850341796875, -1.6124267578125, -1.44635009765625, -1.2802734375, -1.11419677734375, -0.9481201171875, -0.78204345703125, -0.615966796875, -0.44989013671875, -0.2838134765625, -0.11773681640625, 0.04833984375, 0.21441650390625, 0.3804931640625, 0.54656982421875, 0.712646484375, 0.87872314453125, 1.0447998046875, 1.21087646484375, 1.376953125, 1.54302978515625, 1.7091064453125, 1.87518310546875, 2.041259765625, 2.20733642578125, 2.3734130859375, 2.53948974609375, 2.70556640625, 2.87164306640625, 3.0377197265625, 3.20379638671875, 3.369873046875, 3.53594970703125, 3.7020263671875, 3.86810302734375, 4.0341796875, 4.20025634765625, 4.3663330078125, 4.53240966796875, 4.698486328125, 4.86456298828125, 5.0306396484375, 5.19671630859375, 5.36279296875, 5.52886962890625, 5.6949462890625, 5.86102294921875, 6.027099609375, 6.19317626953125, 6.3592529296875, 6.52532958984375, 6.69140625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 7.0, 6.0, 11.0, 35.0, 83.0, 170.0, 259.0, 238.0, 101.0, 42.0, 16.0, 14.0, 6.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-123.66731262207031, -119.63440704345703, -115.60150146484375, -111.56859588623047, -107.53569030761719, -103.5027847290039, -99.46987915039062, -95.43698120117188, -91.40406799316406, -87.37116241455078, -83.3382568359375, -79.30535125732422, -75.27244567871094, -71.23954010009766, -67.20663452148438, -63.17373275756836, -59.140830993652344, -55.10792541503906, -51.07501983642578, -47.0421142578125, -43.00920867919922, -38.97630310058594, -34.94340133666992, -30.91049575805664, -26.87759017944336, -22.844684600830078, -18.811779022216797, -14.778875350952148, -10.745969772338867, -6.713064193725586, -2.6801605224609375, 1.3527450561523438, 5.385650634765625, 9.418556213378906, 13.451460838317871, 17.484365463256836, 21.517271041870117, 25.5501766204834, 29.583080291748047, 33.61598587036133, 37.64889144897461, 41.68179702758789, 45.71470260620117, 49.74760437011719, 53.78050994873047, 57.81341552734375, 61.84632110595703, 65.87922668457031, 69.9121322631836, 73.94503784179688, 77.97794342041016, 82.01084899902344, 86.04375457763672, 90.07666015625, 94.10955810546875, 98.14247131347656, 102.17536926269531, 106.2082748413086, 110.24118041992188, 114.27408599853516, 118.30699157714844, 122.33989715576172, 126.372802734375, 130.40570068359375, 134.43861389160156]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 6.0, 6.0, 9.0, 14.0, 10.0, 20.0, 19.0, 37.0, 23.0, 26.0, 36.0, 36.0, 42.0, 47.0, 66.0, 46.0, 58.0, 66.0, 48.0, 44.0, 58.0, 41.0, 42.0, 38.0, 34.0, 23.0, 22.0, 24.0, 12.0, 8.0, 9.0, 3.0, 10.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.27438735961914, -38.66165542602539, -37.04892349243164, -35.436187744140625, -33.823455810546875, -32.210723876953125, -30.597991943359375, -28.985260009765625, -27.372526168823242, -25.759794235229492, -24.14706039428711, -22.53432846069336, -20.92159652709961, -19.308862686157227, -17.696130752563477, -16.083396911621094, -14.470664978027344, -12.857932090759277, -11.245199203491211, -9.632467269897461, -8.019734382629395, -6.407001495361328, -4.794269561767578, -3.1815366744995117, -1.5688037872314453, 0.04392886161804199, 1.6566615104675293, 3.2693939208984375, 4.882126808166504, 6.49485969543457, 8.10759162902832, 9.720324516296387, 11.333053588867188, 12.945786476135254, 14.55851936340332, 16.17125129699707, 17.783985137939453, 19.396717071533203, 21.009449005126953, 22.622180938720703, 24.234914779663086, 25.847646713256836, 27.46038055419922, 29.07311248779297, 30.68584442138672, 32.29857635498047, 33.91130828857422, 35.524044036865234, 37.136775970458984, 38.749507904052734, 40.362239837646484, 41.9749755859375, 43.58770751953125, 45.200439453125, 46.81317138671875, 48.4259033203125, 50.03863525390625, 51.6513671875, 53.26409912109375, 54.8768310546875, 56.489566802978516, 58.102298736572266, 59.715030670166016, 61.327762603759766, 62.94049835205078]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 4.0, 15.0, 12.0, 19.0, 20.0, 19.0, 19.0, 32.0, 58.0, 59.0, 56.0, 88.0, 133.0, 153.0, 305.0, 1097.0, 13700.0, 4053043.0, 121080.0, 2984.0, 547.0, 233.0, 156.0, 95.0, 78.0, 57.0, 47.0, 40.0, 27.0, 18.0, 22.0, 12.0, 11.0, 4.0, 8.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.46875, -20.694580078125, -19.92041015625, -19.146240234375, -18.3720703125, -17.597900390625, -16.82373046875, -16.049560546875, -15.275390625, -14.501220703125, -13.72705078125, -12.952880859375, -12.1787109375, -11.404541015625, -10.63037109375, -9.856201171875, -9.08203125, -8.307861328125, -7.53369140625, -6.759521484375, -5.9853515625, -5.211181640625, -4.43701171875, -3.662841796875, -2.888671875, -2.114501953125, -1.34033203125, -0.566162109375, 0.2080078125, 0.982177734375, 1.75634765625, 2.530517578125, 3.3046875, 4.078857421875, 4.85302734375, 5.627197265625, 6.4013671875, 7.175537109375, 7.94970703125, 8.723876953125, 9.498046875, 10.272216796875, 11.04638671875, 11.820556640625, 12.5947265625, 13.368896484375, 14.14306640625, 14.917236328125, 15.69140625, 16.465576171875, 17.23974609375, 18.013916015625, 18.7880859375, 19.562255859375, 20.33642578125, 21.110595703125, 21.884765625, 22.658935546875, 23.43310546875, 24.207275390625, 24.9814453125, 25.755615234375, 26.52978515625, 27.303955078125, 28.078125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 9.0, 6.0, 3.0, 8.0, 13.0, 24.0, 24.0, 33.0, 41.0, 53.0, 54.0, 86.0, 90.0, 95.0, 92.0, 74.0, 74.0, 72.0, 39.0, 34.0, 27.0, 22.0, 16.0, 12.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.41015625, -5.25823974609375, -5.1063232421875, -4.95440673828125, -4.802490234375, -4.65057373046875, -4.4986572265625, -4.34674072265625, -4.19482421875, -4.04290771484375, -3.8909912109375, -3.73907470703125, -3.587158203125, -3.43524169921875, -3.2833251953125, -3.13140869140625, -2.9794921875, -2.82757568359375, -2.6756591796875, -2.52374267578125, -2.371826171875, -2.21990966796875, -2.0679931640625, -1.91607666015625, -1.76416015625, -1.61224365234375, -1.4603271484375, -1.30841064453125, -1.156494140625, -1.00457763671875, -0.8526611328125, -0.70074462890625, -0.548828125, -0.39691162109375, -0.2449951171875, -0.09307861328125, 0.058837890625, 0.21075439453125, 0.3626708984375, 0.51458740234375, 0.66650390625, 0.81842041015625, 0.9703369140625, 1.12225341796875, 1.274169921875, 1.42608642578125, 1.5780029296875, 1.72991943359375, 1.8818359375, 2.03375244140625, 2.1856689453125, 2.33758544921875, 2.489501953125, 2.64141845703125, 2.7933349609375, 2.94525146484375, 3.09716796875, 3.24908447265625, 3.4010009765625, 3.55291748046875, 3.704833984375, 3.85675048828125, 4.0086669921875, 4.16058349609375, 4.3125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 6.0, 9.0, 11.0, 16.0, 27.0, 50.0, 104.0, 206.0, 434.0, 858.0, 1800.0, 4175.0, 10360.0, 31446.0, 150956.0, 2469850.0, 1380529.0, 102452.0, 24516.0, 8740.0, 3857.0, 1858.0, 927.0, 507.0, 274.0, 136.0, 76.0, 44.0, 25.0, 14.0, 6.0, 5.0, 7.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.23828125, -7.0308837890625, -6.823486328125, -6.6160888671875, -6.40869140625, -6.2012939453125, -5.993896484375, -5.7864990234375, -5.5791015625, -5.3717041015625, -5.164306640625, -4.9569091796875, -4.74951171875, -4.5421142578125, -4.334716796875, -4.1273193359375, -3.919921875, -3.7125244140625, -3.505126953125, -3.2977294921875, -3.09033203125, -2.8829345703125, -2.675537109375, -2.4681396484375, -2.2607421875, -2.0533447265625, -1.845947265625, -1.6385498046875, -1.43115234375, -1.2237548828125, -1.016357421875, -0.8089599609375, -0.6015625, -0.3941650390625, -0.186767578125, 0.0206298828125, 0.22802734375, 0.4354248046875, 0.642822265625, 0.8502197265625, 1.0576171875, 1.2650146484375, 1.472412109375, 1.6798095703125, 1.88720703125, 2.0946044921875, 2.302001953125, 2.5093994140625, 2.716796875, 2.9241943359375, 3.131591796875, 3.3389892578125, 3.54638671875, 3.7537841796875, 3.961181640625, 4.1685791015625, 4.3759765625, 4.5833740234375, 4.790771484375, 4.9981689453125, 5.20556640625, 5.4129638671875, 5.620361328125, 5.8277587890625, 6.03515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 4.0, 7.0, 16.0, 11.0, 17.0, 28.0, 43.0, 54.0, 93.0, 165.0, 242.0, 479.0, 822.0, 775.0, 532.0, 293.0, 179.0, 84.0, 54.0, 47.0, 29.0, 16.0, 10.0, 9.0, 12.0, 6.0, 7.0, 1.0, 5.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.46484375, -5.26318359375, -5.0615234375, -4.85986328125, -4.658203125, -4.45654296875, -4.2548828125, -4.05322265625, -3.8515625, -3.64990234375, -3.4482421875, -3.24658203125, -3.044921875, -2.84326171875, -2.6416015625, -2.43994140625, -2.23828125, -2.03662109375, -1.8349609375, -1.63330078125, -1.431640625, -1.22998046875, -1.0283203125, -0.82666015625, -0.625, -0.42333984375, -0.2216796875, -0.02001953125, 0.181640625, 0.38330078125, 0.5849609375, 0.78662109375, 0.98828125, 1.18994140625, 1.3916015625, 1.59326171875, 1.794921875, 1.99658203125, 2.1982421875, 2.39990234375, 2.6015625, 2.80322265625, 3.0048828125, 3.20654296875, 3.408203125, 3.60986328125, 3.8115234375, 4.01318359375, 4.21484375, 4.41650390625, 4.6181640625, 4.81982421875, 5.021484375, 5.22314453125, 5.4248046875, 5.62646484375, 5.828125, 6.02978515625, 6.2314453125, 6.43310546875, 6.634765625, 6.83642578125, 7.0380859375, 7.23974609375, 7.44140625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 0.0, 3.0, 2.0, 6.0, 8.0, 17.0, 32.0, 68.0, 102.0, 208.0, 239.0, 173.0, 86.0, 29.0, 14.0, 8.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-107.73631286621094, -105.00628662109375, -102.2762680053711, -99.54624938964844, -96.81622314453125, -94.08619689941406, -91.3561782836914, -88.62615966796875, -85.89613342285156, -83.16610717773438, -80.43608856201172, -77.70606994628906, -74.97604370117188, -72.24601745605469, -69.51599884033203, -66.78598022460938, -64.05595397949219, -61.325931549072266, -58.595909118652344, -55.86588668823242, -53.1358642578125, -50.40584182739258, -47.675819396972656, -44.945796966552734, -42.21577453613281, -39.48575210571289, -36.75572967529297, -34.02570724487305, -31.295684814453125, -28.565662384033203, -25.83563995361328, -23.10561752319336, -20.375587463378906, -17.645565032958984, -14.915542602539062, -12.18552017211914, -9.455497741699219, -6.725475311279297, -3.995452880859375, -1.2654304504394531, 1.4645919799804688, 4.194614410400391, 6.9246368408203125, 9.654659271240234, 12.384681701660156, 15.114704132080078, 17.8447265625, 20.574748992919922, 23.304771423339844, 26.034793853759766, 28.764816284179688, 31.49483871459961, 34.22486114501953, 36.95488357543945, 39.684906005859375, 42.4149284362793, 45.14495086669922, 47.87497329711914, 50.60499572753906, 53.335018157958984, 56.065040588378906, 58.79506301879883, 61.52508544921875, 64.25511169433594, 66.9851303100586]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 6.0, 9.0, 9.0, 9.0, 15.0, 10.0, 18.0, 25.0, 28.0, 34.0, 33.0, 44.0, 43.0, 38.0, 52.0, 62.0, 49.0, 61.0, 56.0, 66.0, 41.0, 38.0, 28.0, 27.0, 36.0, 29.0, 31.0, 22.0, 13.0, 21.0, 15.0, 8.0, 10.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-30.920757293701172, -30.000701904296875, -29.080646514892578, -28.16058921813965, -27.24053382873535, -26.320478439331055, -25.400421142578125, -24.480365753173828, -23.56031036376953, -22.640254974365234, -21.720199584960938, -20.800142288208008, -19.88008689880371, -18.960031509399414, -18.039974212646484, -17.119918823242188, -16.19986343383789, -15.279808044433594, -14.35975170135498, -13.439695358276367, -12.51963996887207, -11.599584579467773, -10.67952823638916, -9.759471893310547, -8.83941650390625, -7.919360637664795, -6.99930477142334, -6.079248905181885, -5.15919303894043, -4.239137172698975, -3.3190813064575195, -2.3990254402160645, -1.4789695739746094, -0.5589137077331543, 0.3611421585083008, 1.2811980247497559, 2.201253890991211, 3.121309757232666, 4.041365623474121, 4.961421489715576, 5.881477355957031, 6.801533222198486, 7.721589088439941, 8.641645431518555, 9.561700820922852, 10.481756210327148, 11.401812553405762, 12.321868896484375, 13.241924285888672, 14.161979675292969, 15.082036018371582, 16.002092361450195, 16.922147750854492, 17.84220314025879, 18.76226043701172, 19.682315826416016, 20.602371215820312, 21.52242660522461, 22.442481994628906, 23.362539291381836, 24.282594680786133, 25.20265007019043, 26.12270736694336, 27.042762756347656, 27.962818145751953]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 2.0, 6.0, 14.0, 21.0, 27.0, 42.0, 68.0, 108.0, 177.0, 313.0, 591.0, 1042.0, 2092.0, 4260.0, 9477.0, 22316.0, 57484.0, 168194.0, 422462.0, 232522.0, 76062.0, 28543.0, 12028.0, 5340.0, 2595.0, 1292.0, 608.0, 361.0, 198.0, 117.0, 62.0, 52.0, 20.0, 27.0, 6.0, 10.0, 7.0, 7.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83203125, -5.63525390625, -5.4384765625, -5.24169921875, -5.044921875, -4.84814453125, -4.6513671875, -4.45458984375, -4.2578125, -4.06103515625, -3.8642578125, -3.66748046875, -3.470703125, -3.27392578125, -3.0771484375, -2.88037109375, -2.68359375, -2.48681640625, -2.2900390625, -2.09326171875, -1.896484375, -1.69970703125, -1.5029296875, -1.30615234375, -1.109375, -0.91259765625, -0.7158203125, -0.51904296875, -0.322265625, -0.12548828125, 0.0712890625, 0.26806640625, 0.46484375, 0.66162109375, 0.8583984375, 1.05517578125, 1.251953125, 1.44873046875, 1.6455078125, 1.84228515625, 2.0390625, 2.23583984375, 2.4326171875, 2.62939453125, 2.826171875, 3.02294921875, 3.2197265625, 3.41650390625, 3.61328125, 3.81005859375, 4.0068359375, 4.20361328125, 4.400390625, 4.59716796875, 4.7939453125, 4.99072265625, 5.1875, 5.38427734375, 5.5810546875, 5.77783203125, 5.974609375, 6.17138671875, 6.3681640625, 6.56494140625, 6.76171875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 8.0, 6.0, 5.0, 11.0, 10.0, 13.0, 15.0, 7.0, 21.0, 19.0, 17.0, 37.0, 38.0, 39.0, 42.0, 40.0, 49.0, 57.0, 60.0, 50.0, 49.0, 50.0, 50.0, 39.0, 40.0, 29.0, 35.0, 31.0, 22.0, 23.0, 16.0, 11.0, 19.0, 6.0, 9.0, 11.0, 2.0, 6.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.748046875, -2.6590576171875, -2.570068359375, -2.4810791015625, -2.39208984375, -2.3031005859375, -2.214111328125, -2.1251220703125, -2.0361328125, -1.9471435546875, -1.858154296875, -1.7691650390625, -1.68017578125, -1.5911865234375, -1.502197265625, -1.4132080078125, -1.32421875, -1.2352294921875, -1.146240234375, -1.0572509765625, -0.96826171875, -0.8792724609375, -0.790283203125, -0.7012939453125, -0.6123046875, -0.5233154296875, -0.434326171875, -0.3453369140625, -0.25634765625, -0.1673583984375, -0.078369140625, 0.0106201171875, 0.099609375, 0.1885986328125, 0.277587890625, 0.3665771484375, 0.45556640625, 0.5445556640625, 0.633544921875, 0.7225341796875, 0.8115234375, 0.9005126953125, 0.989501953125, 1.0784912109375, 1.16748046875, 1.2564697265625, 1.345458984375, 1.4344482421875, 1.5234375, 1.6124267578125, 1.701416015625, 1.7904052734375, 1.87939453125, 1.9683837890625, 2.057373046875, 2.1463623046875, 2.2353515625, 2.3243408203125, 2.413330078125, 2.5023193359375, 2.59130859375, 2.6802978515625, 2.769287109375, 2.8582763671875, 2.947265625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 1.0, 2.0, 6.0, 7.0, 9.0, 20.0, 17.0, 51.0, 62.0, 136.0, 229.0, 450.0, 1157.0, 4387.0, 38469.0, 776206.0, 210383.0, 13136.0, 2290.0, 765.0, 346.0, 166.0, 85.0, 61.0, 34.0, 25.0, 20.0, 13.0, 7.0, 4.0, 8.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.390625, -17.82958984375, -17.2685546875, -16.70751953125, -16.146484375, -15.58544921875, -15.0244140625, -14.46337890625, -13.90234375, -13.34130859375, -12.7802734375, -12.21923828125, -11.658203125, -11.09716796875, -10.5361328125, -9.97509765625, -9.4140625, -8.85302734375, -8.2919921875, -7.73095703125, -7.169921875, -6.60888671875, -6.0478515625, -5.48681640625, -4.92578125, -4.36474609375, -3.8037109375, -3.24267578125, -2.681640625, -2.12060546875, -1.5595703125, -0.99853515625, -0.4375, 0.12353515625, 0.6845703125, 1.24560546875, 1.806640625, 2.36767578125, 2.9287109375, 3.48974609375, 4.05078125, 4.61181640625, 5.1728515625, 5.73388671875, 6.294921875, 6.85595703125, 7.4169921875, 7.97802734375, 8.5390625, 9.10009765625, 9.6611328125, 10.22216796875, 10.783203125, 11.34423828125, 11.9052734375, 12.46630859375, 13.02734375, 13.58837890625, 14.1494140625, 14.71044921875, 15.271484375, 15.83251953125, 16.3935546875, 16.95458984375, 17.515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 6.0, 2.0, 6.0, 3.0, 6.0, 8.0, 9.0, 14.0, 16.0, 20.0, 18.0, 26.0, 31.0, 20.0, 32.0, 47.0, 37.0, 51.0, 49.0, 57.0, 47.0, 38.0, 52.0, 42.0, 43.0, 37.0, 34.0, 27.0, 34.0, 29.0, 26.0, 21.0, 19.0, 18.0, 18.0, 15.0, 6.0, 3.0, 8.0, 4.0, 2.0, 8.0, 5.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.34375, -9.033935546875, -8.72412109375, -8.414306640625, -8.1044921875, -7.794677734375, -7.48486328125, -7.175048828125, -6.865234375, -6.555419921875, -6.24560546875, -5.935791015625, -5.6259765625, -5.316162109375, -5.00634765625, -4.696533203125, -4.38671875, -4.076904296875, -3.76708984375, -3.457275390625, -3.1474609375, -2.837646484375, -2.52783203125, -2.218017578125, -1.908203125, -1.598388671875, -1.28857421875, -0.978759765625, -0.6689453125, -0.359130859375, -0.04931640625, 0.260498046875, 0.5703125, 0.880126953125, 1.18994140625, 1.499755859375, 1.8095703125, 2.119384765625, 2.42919921875, 2.739013671875, 3.048828125, 3.358642578125, 3.66845703125, 3.978271484375, 4.2880859375, 4.597900390625, 4.90771484375, 5.217529296875, 5.52734375, 5.837158203125, 6.14697265625, 6.456787109375, 6.7666015625, 7.076416015625, 7.38623046875, 7.696044921875, 8.005859375, 8.315673828125, 8.62548828125, 8.935302734375, 9.2451171875, 9.554931640625, 9.86474609375, 10.174560546875, 10.484375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 6.0, 10.0, 15.0, 23.0, 42.0, 43.0, 96.0, 217.0, 647.0, 2544.0, 23619.0, 967395.0, 48950.0, 3561.0, 788.0, 260.0, 123.0, 65.0, 43.0, 29.0, 20.0, 11.0, 12.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.1640625, -13.754638671875, -13.34521484375, -12.935791015625, -12.5263671875, -12.116943359375, -11.70751953125, -11.298095703125, -10.888671875, -10.479248046875, -10.06982421875, -9.660400390625, -9.2509765625, -8.841552734375, -8.43212890625, -8.022705078125, -7.61328125, -7.203857421875, -6.79443359375, -6.385009765625, -5.9755859375, -5.566162109375, -5.15673828125, -4.747314453125, -4.337890625, -3.928466796875, -3.51904296875, -3.109619140625, -2.7001953125, -2.290771484375, -1.88134765625, -1.471923828125, -1.0625, -0.653076171875, -0.24365234375, 0.165771484375, 0.5751953125, 0.984619140625, 1.39404296875, 1.803466796875, 2.212890625, 2.622314453125, 3.03173828125, 3.441162109375, 3.8505859375, 4.260009765625, 4.66943359375, 5.078857421875, 5.48828125, 5.897705078125, 6.30712890625, 6.716552734375, 7.1259765625, 7.535400390625, 7.94482421875, 8.354248046875, 8.763671875, 9.173095703125, 9.58251953125, 9.991943359375, 10.4013671875, 10.810791015625, 11.22021484375, 11.629638671875, 12.0390625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 7.0, 3.0, 8.0, 5.0, 3.0, 14.0, 9.0, 16.0, 18.0, 24.0, 29.0, 36.0, 59.0, 50.0, 80.0, 90.0, 106.0, 96.0, 82.0, 47.0, 43.0, 24.0, 28.0, 24.0, 10.0, 17.0, 10.0, 13.0, 11.0, 8.0, 4.0, 6.0, 3.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0006394386291503906, -0.0006213411688804626, -0.0006032437086105347, -0.0005851462483406067, -0.0005670487880706787, -0.0005489513278007507, -0.0005308538675308228, -0.0005127564072608948, -0.0004946589469909668, -0.0004765614867210388, -0.00045846402645111084, -0.00044036656618118286, -0.0004222691059112549, -0.0004041716456413269, -0.0003860741853713989, -0.00036797672510147095, -0.00034987926483154297, -0.000331781804561615, -0.000313684344291687, -0.00029558688402175903, -0.00027748942375183105, -0.0002593919634819031, -0.0002412945032119751, -0.00022319704294204712, -0.00020509958267211914, -0.00018700212240219116, -0.00016890466213226318, -0.0001508072018623352, -0.00013270974159240723, -0.00011461228132247925, -9.651482105255127e-05, -7.841736078262329e-05, -6.031990051269531e-05, -4.2222440242767334e-05, -2.4124979972839355e-05, -6.027519702911377e-06, 1.2069940567016602e-05, 3.016740083694458e-05, 4.826486110687256e-05, 6.636232137680054e-05, 8.445978164672852e-05, 0.0001025572419166565, 0.00012065470218658447, 0.00013875216245651245, 0.00015684962272644043, 0.0001749470829963684, 0.0001930445432662964, 0.00021114200353622437, 0.00022923946380615234, 0.0002473369240760803, 0.0002654343843460083, 0.0002835318446159363, 0.00030162930488586426, 0.00031972676515579224, 0.0003378242254257202, 0.0003559216856956482, 0.00037401914596557617, 0.00039211660623550415, 0.00041021406650543213, 0.0004283115267753601, 0.0004464089870452881, 0.00046450644731521606, 0.00048260390758514404, 0.000500701367855072, 0.000518798828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 8.0, 5.0, 9.0, 10.0, 17.0, 32.0, 34.0, 51.0, 89.0, 140.0, 218.0, 349.0, 695.0, 1492.0, 3492.0, 12651.0, 103249.0, 790575.0, 114887.0, 13630.0, 3696.0, 1528.0, 694.0, 370.0, 239.0, 107.0, 90.0, 55.0, 31.0, 26.0, 16.0, 20.0, 7.0, 6.0, 6.0, 9.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.04296875, -4.86614990234375, -4.6893310546875, -4.51251220703125, -4.335693359375, -4.15887451171875, -3.9820556640625, -3.80523681640625, -3.62841796875, -3.45159912109375, -3.2747802734375, -3.09796142578125, -2.921142578125, -2.74432373046875, -2.5675048828125, -2.39068603515625, -2.2138671875, -2.03704833984375, -1.8602294921875, -1.68341064453125, -1.506591796875, -1.32977294921875, -1.1529541015625, -0.97613525390625, -0.79931640625, -0.62249755859375, -0.4456787109375, -0.26885986328125, -0.092041015625, 0.08477783203125, 0.2615966796875, 0.43841552734375, 0.615234375, 0.79205322265625, 0.9688720703125, 1.14569091796875, 1.322509765625, 1.49932861328125, 1.6761474609375, 1.85296630859375, 2.02978515625, 2.20660400390625, 2.3834228515625, 2.56024169921875, 2.737060546875, 2.91387939453125, 3.0906982421875, 3.26751708984375, 3.4443359375, 3.62115478515625, 3.7979736328125, 3.97479248046875, 4.151611328125, 4.32843017578125, 4.5052490234375, 4.68206787109375, 4.85888671875, 5.03570556640625, 5.2125244140625, 5.38934326171875, 5.566162109375, 5.74298095703125, 5.9197998046875, 6.09661865234375, 6.2734375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 6.0, 9.0, 8.0, 15.0, 14.0, 17.0, 31.0, 38.0, 51.0, 53.0, 78.0, 69.0, 90.0, 95.0, 82.0, 78.0, 61.0, 48.0, 40.0, 27.0, 27.0, 16.0, 13.0, 13.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.4375, -4.320404052734375, -4.20330810546875, -4.086212158203125, -3.9691162109375, -3.852020263671875, -3.73492431640625, -3.617828369140625, -3.500732421875, -3.383636474609375, -3.26654052734375, -3.149444580078125, -3.0323486328125, -2.915252685546875, -2.79815673828125, -2.681060791015625, -2.56396484375, -2.446868896484375, -2.32977294921875, -2.212677001953125, -2.0955810546875, -1.978485107421875, -1.86138916015625, -1.744293212890625, -1.627197265625, -1.510101318359375, -1.39300537109375, -1.275909423828125, -1.1588134765625, -1.041717529296875, -0.92462158203125, -0.807525634765625, -0.6904296875, -0.573333740234375, -0.45623779296875, -0.339141845703125, -0.2220458984375, -0.104949951171875, 0.01214599609375, 0.129241943359375, 0.246337890625, 0.363433837890625, 0.48052978515625, 0.597625732421875, 0.7147216796875, 0.831817626953125, 0.94891357421875, 1.066009521484375, 1.18310546875, 1.300201416015625, 1.41729736328125, 1.534393310546875, 1.6514892578125, 1.768585205078125, 1.88568115234375, 2.002777099609375, 2.119873046875, 2.236968994140625, 2.35406494140625, 2.471160888671875, 2.5882568359375, 2.705352783203125, 2.82244873046875, 2.939544677734375, 3.056640625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 12.0, 11.0, 17.0, 80.0, 195.0, 348.0, 231.0, 73.0, 20.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.63168334960938, -139.75608825683594, -134.8804931640625, -130.00489807128906, -125.12930297851562, -120.25370788574219, -115.37811279296875, -110.50251770019531, -105.62692260742188, -100.75132751464844, -95.875732421875, -91.00013732910156, -86.12454223632812, -81.24894714355469, -76.37335205078125, -71.49775695800781, -66.62215423583984, -61.746559143066406, -56.87096405029297, -51.99536895751953, -47.119773864746094, -42.244178771972656, -37.36857986450195, -32.492984771728516, -27.617389678955078, -22.74179458618164, -17.866199493408203, -12.990602493286133, -8.115007400512695, -3.239412307739258, 1.6361846923828125, 6.51177978515625, 11.387374877929688, 16.262969970703125, 21.138565063476562, 26.014162063598633, 30.88975715637207, 35.765350341796875, 40.64094924926758, 45.516544342041016, 50.39213943481445, 55.26773452758789, 60.14332962036133, 65.01892852783203, 69.89452362060547, 74.7701187133789, 79.64571380615234, 84.52130889892578, 89.39690399169922, 94.27249908447266, 99.1480941772461, 104.02368927001953, 108.89928436279297, 113.7748794555664, 118.65048217773438, 123.52607727050781, 128.40167236328125, 133.2772674560547, 138.15286254882812, 143.02845764160156, 147.904052734375, 152.77964782714844, 157.65524291992188, 162.5308380126953, 167.40643310546875]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 9.0, 9.0, 14.0, 9.0, 15.0, 17.0, 25.0, 24.0, 21.0, 32.0, 30.0, 36.0, 63.0, 65.0, 54.0, 54.0, 67.0, 58.0, 60.0, 51.0, 34.0, 39.0, 24.0, 24.0, 25.0, 20.0, 18.0, 15.0, 19.0, 11.0, 9.0, 15.0, 11.0, 5.0, 6.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0], "bins": [-54.15583801269531, -52.63431930541992, -51.112796783447266, -49.591278076171875, -48.069759368896484, -46.54823684692383, -45.02671813964844, -43.50519561767578, -41.98367691040039, -40.462158203125, -38.940635681152344, -37.41911697387695, -35.89759826660156, -34.376075744628906, -32.854557037353516, -31.333036422729492, -29.8115177154541, -28.289997100830078, -26.768478393554688, -25.246957778930664, -23.72543716430664, -22.20391845703125, -20.682397842407227, -19.160877227783203, -17.639358520507812, -16.11783790588379, -14.596318244934082, -13.074798583984375, -11.553277969360352, -10.031758308410645, -8.510238647460938, -6.988718032836914, -5.467197418212891, -3.9456772804260254, -2.4241573810577393, -0.9026374816894531, 0.6188826560974121, 2.1404027938842773, 3.6619224548339844, 5.183443069458008, 6.704962730407715, 8.226482391357422, 9.748003005981445, 11.269522666931152, 12.79104232788086, 14.312562942504883, 15.83408260345459, 17.355602264404297, 18.87712287902832, 20.398643493652344, 21.920162200927734, 23.441682815551758, 24.96320343017578, 26.484722137451172, 28.006242752075195, 29.52776336669922, 31.04928207397461, 32.57080078125, 34.092323303222656, 35.61384201049805, 37.13536071777344, 38.656883239746094, 40.178401947021484, 41.699920654296875, 43.22144317626953]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 7.0, 7.0, 7.0, 16.0, 21.0, 36.0, 65.0, 100.0, 223.0, 507.0, 1694.0, 7806.0, 48856.0, 827523.0, 3122828.0, 161965.0, 17480.0, 3466.0, 940.0, 338.0, 139.0, 96.0, 52.0, 20.0, 21.0, 22.0, 9.0, 3.0, 4.0, 10.0, 4.0, 2.0, 0.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.9639892578125, -7.717041015625, -7.4700927734375, -7.22314453125, -6.9761962890625, -6.729248046875, -6.4822998046875, -6.2353515625, -5.9884033203125, -5.741455078125, -5.4945068359375, -5.24755859375, -5.0006103515625, -4.753662109375, -4.5067138671875, -4.259765625, -4.0128173828125, -3.765869140625, -3.5189208984375, -3.27197265625, -3.0250244140625, -2.778076171875, -2.5311279296875, -2.2841796875, -2.0372314453125, -1.790283203125, -1.5433349609375, -1.29638671875, -1.0494384765625, -0.802490234375, -0.5555419921875, -0.30859375, -0.0616455078125, 0.185302734375, 0.4322509765625, 0.67919921875, 0.9261474609375, 1.173095703125, 1.4200439453125, 1.6669921875, 1.9139404296875, 2.160888671875, 2.4078369140625, 2.65478515625, 2.9017333984375, 3.148681640625, 3.3956298828125, 3.642578125, 3.8895263671875, 4.136474609375, 4.3834228515625, 4.63037109375, 4.8773193359375, 5.124267578125, 5.3712158203125, 5.6181640625, 5.8651123046875, 6.112060546875, 6.3590087890625, 6.60595703125, 6.8529052734375, 7.099853515625, 7.3468017578125, 7.59375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 3.0, 9.0, 9.0, 20.0, 6.0, 32.0, 23.0, 39.0, 59.0, 61.0, 65.0, 95.0, 75.0, 76.0, 85.0, 82.0, 63.0, 56.0, 35.0, 38.0, 23.0, 18.0, 12.0, 10.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.10333251953125, -1.9722900390625, -1.84124755859375, -1.710205078125, -1.57916259765625, -1.4481201171875, -1.31707763671875, -1.18603515625, -1.05499267578125, -0.9239501953125, -0.79290771484375, -0.661865234375, -0.53082275390625, -0.3997802734375, -0.26873779296875, -0.1376953125, -0.00665283203125, 0.1243896484375, 0.25543212890625, 0.386474609375, 0.51751708984375, 0.6485595703125, 0.77960205078125, 0.91064453125, 1.04168701171875, 1.1727294921875, 1.30377197265625, 1.434814453125, 1.56585693359375, 1.6968994140625, 1.82794189453125, 1.958984375, 2.09002685546875, 2.2210693359375, 2.35211181640625, 2.483154296875, 2.61419677734375, 2.7452392578125, 2.87628173828125, 3.00732421875, 3.13836669921875, 3.2694091796875, 3.40045166015625, 3.531494140625, 3.66253662109375, 3.7935791015625, 3.92462158203125, 4.0556640625, 4.18670654296875, 4.3177490234375, 4.44879150390625, 4.579833984375, 4.71087646484375, 4.8419189453125, 4.97296142578125, 5.10400390625, 5.23504638671875, 5.3660888671875, 5.49713134765625, 5.628173828125, 5.75921630859375, 5.8902587890625, 6.02130126953125, 6.15234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 4.0, 10.0, 16.0, 27.0, 27.0, 38.0, 63.0, 120.0, 210.0, 385.0, 842.0, 1845.0, 4776.0, 13803.0, 49158.0, 248095.0, 2394157.0, 1266631.0, 154282.0, 38782.0, 12275.0, 4724.0, 1984.0, 885.0, 455.0, 255.0, 139.0, 91.0, 53.0, 41.0, 22.0, 21.0, 12.0, 17.0, 13.0, 9.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.18359375, -5.00994873046875, -4.8363037109375, -4.66265869140625, -4.489013671875, -4.31536865234375, -4.1417236328125, -3.96807861328125, -3.79443359375, -3.62078857421875, -3.4471435546875, -3.27349853515625, -3.099853515625, -2.92620849609375, -2.7525634765625, -2.57891845703125, -2.4052734375, -2.23162841796875, -2.0579833984375, -1.88433837890625, -1.710693359375, -1.53704833984375, -1.3634033203125, -1.18975830078125, -1.01611328125, -0.84246826171875, -0.6688232421875, -0.49517822265625, -0.321533203125, -0.14788818359375, 0.0257568359375, 0.19940185546875, 0.373046875, 0.54669189453125, 0.7203369140625, 0.89398193359375, 1.067626953125, 1.24127197265625, 1.4149169921875, 1.58856201171875, 1.76220703125, 1.93585205078125, 2.1094970703125, 2.28314208984375, 2.456787109375, 2.63043212890625, 2.8040771484375, 2.97772216796875, 3.1513671875, 3.32501220703125, 3.4986572265625, 3.67230224609375, 3.845947265625, 4.01959228515625, 4.1932373046875, 4.36688232421875, 4.54052734375, 4.71417236328125, 4.8878173828125, 5.06146240234375, 5.235107421875, 5.40875244140625, 5.5823974609375, 5.75604248046875, 5.9296875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 4.0, 8.0, 15.0, 8.0, 11.0, 18.0, 21.0, 31.0, 42.0, 66.0, 86.0, 97.0, 147.0, 191.0, 286.0, 409.0, 478.0, 506.0, 397.0, 308.0, 225.0, 151.0, 114.0, 76.0, 73.0, 59.0, 46.0, 40.0, 35.0, 20.0, 17.0, 11.0, 11.0, 15.0, 9.0, 11.0, 5.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.03125, -3.86480712890625, -3.6983642578125, -3.53192138671875, -3.365478515625, -3.19903564453125, -3.0325927734375, -2.86614990234375, -2.69970703125, -2.53326416015625, -2.3668212890625, -2.20037841796875, -2.033935546875, -1.86749267578125, -1.7010498046875, -1.53460693359375, -1.3681640625, -1.20172119140625, -1.0352783203125, -0.86883544921875, -0.702392578125, -0.53594970703125, -0.3695068359375, -0.20306396484375, -0.03662109375, 0.12982177734375, 0.2962646484375, 0.46270751953125, 0.629150390625, 0.79559326171875, 0.9620361328125, 1.12847900390625, 1.294921875, 1.46136474609375, 1.6278076171875, 1.79425048828125, 1.960693359375, 2.12713623046875, 2.2935791015625, 2.46002197265625, 2.62646484375, 2.79290771484375, 2.9593505859375, 3.12579345703125, 3.292236328125, 3.45867919921875, 3.6251220703125, 3.79156494140625, 3.9580078125, 4.12445068359375, 4.2908935546875, 4.45733642578125, 4.623779296875, 4.79022216796875, 4.9566650390625, 5.12310791015625, 5.28955078125, 5.45599365234375, 5.6224365234375, 5.78887939453125, 5.955322265625, 6.12176513671875, 6.2882080078125, 6.45465087890625, 6.62109375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 10.0, 41.0, 134.0, 278.0, 321.0, 141.0, 54.0, 9.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.74945068359375, -102.31724548339844, -97.88504791259766, -93.45284271240234, -89.02064514160156, -84.58843994140625, -80.15623474121094, -75.72402954101562, -71.29183197021484, -66.85962677001953, -62.42742919921875, -57.99522399902344, -53.56302261352539, -49.130821228027344, -44.69861602783203, -40.266414642333984, -35.83421325683594, -31.40201187133789, -26.96980857849121, -22.53760528564453, -18.105403900146484, -13.673202514648438, -9.240999221801758, -4.808795928955078, -0.37659454345703125, 4.055607795715332, 8.487810134887695, 12.920012474060059, 17.352214813232422, 21.78441619873047, 26.21661949157715, 30.648822784423828, 35.081024169921875, 39.51322555541992, 43.94542694091797, 48.37763214111328, 52.80983352661133, 57.242034912109375, 61.67424011230469, 66.1064453125, 70.53864288330078, 74.9708480834961, 79.40304565429688, 83.83525085449219, 88.2674560546875, 92.69965362548828, 97.1318588256836, 101.56405639648438, 105.99626159667969, 110.428466796875, 114.86066436767578, 119.2928695678711, 123.72506713867188, 128.1572723388672, 132.5894775390625, 137.0216827392578, 141.45388793945312, 145.88609313964844, 150.31829833984375, 154.75048828125, 159.1826934814453, 163.61489868164062, 168.04710388183594, 172.47930908203125, 176.9114990234375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 6.0, 8.0, 10.0, 10.0, 20.0, 23.0, 25.0, 33.0, 27.0, 48.0, 48.0, 50.0, 47.0, 68.0, 49.0, 54.0, 61.0, 55.0, 43.0, 62.0, 38.0, 38.0, 30.0, 29.0, 26.0, 24.0, 20.0, 17.0, 5.0, 3.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-54.768924713134766, -53.43083572387695, -52.09274673461914, -50.75465774536133, -49.416568756103516, -48.07848358154297, -46.740394592285156, -45.402305603027344, -44.06421661376953, -42.72612762451172, -41.388038635253906, -40.049949645996094, -38.71186065673828, -37.37377166748047, -36.035682678222656, -34.69759750366211, -33.35950469970703, -32.02141571044922, -30.683326721191406, -29.345237731933594, -28.007150650024414, -26.6690616607666, -25.33097267150879, -23.99288558959961, -22.654796600341797, -21.316707611083984, -19.978618621826172, -18.64052963256836, -17.30244255065918, -15.964353561401367, -14.626264572143555, -13.288176536560059, -11.950088500976562, -10.61199951171875, -9.273911476135254, -7.935822486877441, -6.597733974456787, -5.259645462036133, -3.9215564727783203, -2.583468437194824, -1.2453794479370117, 0.09270918369293213, 1.430797815322876, 2.7688865661621094, 4.106975078582764, 5.445063591003418, 6.7831525802612305, 8.121240615844727, 9.459329605102539, 10.797418594360352, 12.135506629943848, 13.47359561920166, 14.811683654785156, 16.14977264404297, 17.48786163330078, 18.825950622558594, 20.164039611816406, 21.50212860107422, 22.84021759033203, 24.178306579589844, 25.516393661499023, 26.854482650756836, 28.19257164001465, 29.530658721923828, 30.86874771118164]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 9.0, 9.0, 16.0, 26.0, 52.0, 61.0, 138.0, 204.0, 347.0, 609.0, 1236.0, 2533.0, 5862.0, 15779.0, 46153.0, 138796.0, 388171.0, 297527.0, 98109.0, 32701.0, 11543.0, 4418.0, 2087.0, 984.0, 497.0, 253.0, 143.0, 91.0, 77.0, 37.0, 22.0, 22.0, 11.0, 7.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.56640625, -6.34637451171875, -6.1263427734375, -5.90631103515625, -5.686279296875, -5.46624755859375, -5.2462158203125, -5.02618408203125, -4.80615234375, -4.58612060546875, -4.3660888671875, -4.14605712890625, -3.926025390625, -3.70599365234375, -3.4859619140625, -3.26593017578125, -3.0458984375, -2.82586669921875, -2.6058349609375, -2.38580322265625, -2.165771484375, -1.94573974609375, -1.7257080078125, -1.50567626953125, -1.28564453125, -1.06561279296875, -0.8455810546875, -0.62554931640625, -0.405517578125, -0.18548583984375, 0.0345458984375, 0.25457763671875, 0.474609375, 0.69464111328125, 0.9146728515625, 1.13470458984375, 1.354736328125, 1.57476806640625, 1.7947998046875, 2.01483154296875, 2.23486328125, 2.45489501953125, 2.6749267578125, 2.89495849609375, 3.114990234375, 3.33502197265625, 3.5550537109375, 3.77508544921875, 3.9951171875, 4.21514892578125, 4.4351806640625, 4.65521240234375, 4.875244140625, 5.09527587890625, 5.3153076171875, 5.53533935546875, 5.75537109375, 5.97540283203125, 6.1954345703125, 6.41546630859375, 6.635498046875, 6.85552978515625, 7.0755615234375, 7.29559326171875, 7.515625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 12.0, 11.0, 13.0, 18.0, 11.0, 21.0, 20.0, 28.0, 33.0, 34.0, 37.0, 39.0, 47.0, 41.0, 47.0, 61.0, 58.0, 42.0, 44.0, 47.0, 42.0, 40.0, 37.0, 34.0, 23.0, 25.0, 18.0, 23.0, 19.0, 13.0, 14.0, 9.0, 5.0, 8.0, 3.0, 6.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.310546875, -2.232391357421875, -2.15423583984375, -2.076080322265625, -1.9979248046875, -1.919769287109375, -1.84161376953125, -1.763458251953125, -1.685302734375, -1.607147216796875, -1.52899169921875, -1.450836181640625, -1.3726806640625, -1.294525146484375, -1.21636962890625, -1.138214111328125, -1.06005859375, -0.981903076171875, -0.90374755859375, -0.825592041015625, -0.7474365234375, -0.669281005859375, -0.59112548828125, -0.512969970703125, -0.434814453125, -0.356658935546875, -0.27850341796875, -0.200347900390625, -0.1221923828125, -0.044036865234375, 0.03411865234375, 0.112274169921875, 0.1904296875, 0.268585205078125, 0.34674072265625, 0.424896240234375, 0.5030517578125, 0.581207275390625, 0.65936279296875, 0.737518310546875, 0.815673828125, 0.893829345703125, 0.97198486328125, 1.050140380859375, 1.1282958984375, 1.206451416015625, 1.28460693359375, 1.362762451171875, 1.44091796875, 1.519073486328125, 1.59722900390625, 1.675384521484375, 1.7535400390625, 1.831695556640625, 1.90985107421875, 1.988006591796875, 2.066162109375, 2.144317626953125, 2.22247314453125, 2.300628662109375, 2.3787841796875, 2.456939697265625, 2.53509521484375, 2.613250732421875, 2.69140625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 7.0, 4.0, 5.0, 11.0, 20.0, 18.0, 31.0, 35.0, 43.0, 89.0, 116.0, 179.0, 276.0, 481.0, 942.0, 2212.0, 7619.0, 97878.0, 876056.0, 53119.0, 5631.0, 1778.0, 834.0, 435.0, 255.0, 136.0, 102.0, 64.0, 56.0, 35.0, 23.0, 16.0, 13.0, 8.0, 5.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.671875, -19.02490234375, -18.3779296875, -17.73095703125, -17.083984375, -16.43701171875, -15.7900390625, -15.14306640625, -14.49609375, -13.84912109375, -13.2021484375, -12.55517578125, -11.908203125, -11.26123046875, -10.6142578125, -9.96728515625, -9.3203125, -8.67333984375, -8.0263671875, -7.37939453125, -6.732421875, -6.08544921875, -5.4384765625, -4.79150390625, -4.14453125, -3.49755859375, -2.8505859375, -2.20361328125, -1.556640625, -0.90966796875, -0.2626953125, 0.38427734375, 1.03125, 1.67822265625, 2.3251953125, 2.97216796875, 3.619140625, 4.26611328125, 4.9130859375, 5.56005859375, 6.20703125, 6.85400390625, 7.5009765625, 8.14794921875, 8.794921875, 9.44189453125, 10.0888671875, 10.73583984375, 11.3828125, 12.02978515625, 12.6767578125, 13.32373046875, 13.970703125, 14.61767578125, 15.2646484375, 15.91162109375, 16.55859375, 17.20556640625, 17.8525390625, 18.49951171875, 19.146484375, 19.79345703125, 20.4404296875, 21.08740234375, 21.734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 2.0, 5.0, 6.0, 8.0, 5.0, 6.0, 8.0, 14.0, 17.0, 16.0, 17.0, 18.0, 26.0, 28.0, 27.0, 33.0, 32.0, 37.0, 38.0, 50.0, 52.0, 38.0, 47.0, 46.0, 46.0, 44.0, 35.0, 48.0, 35.0, 31.0, 33.0, 23.0, 22.0, 15.0, 21.0, 19.0, 10.0, 7.0, 7.0, 9.0, 2.0, 5.0, 3.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.6796875, -11.337158203125, -10.99462890625, -10.652099609375, -10.3095703125, -9.967041015625, -9.62451171875, -9.281982421875, -8.939453125, -8.596923828125, -8.25439453125, -7.911865234375, -7.5693359375, -7.226806640625, -6.88427734375, -6.541748046875, -6.19921875, -5.856689453125, -5.51416015625, -5.171630859375, -4.8291015625, -4.486572265625, -4.14404296875, -3.801513671875, -3.458984375, -3.116455078125, -2.77392578125, -2.431396484375, -2.0888671875, -1.746337890625, -1.40380859375, -1.061279296875, -0.71875, -0.376220703125, -0.03369140625, 0.308837890625, 0.6513671875, 0.993896484375, 1.33642578125, 1.678955078125, 2.021484375, 2.364013671875, 2.70654296875, 3.049072265625, 3.3916015625, 3.734130859375, 4.07666015625, 4.419189453125, 4.76171875, 5.104248046875, 5.44677734375, 5.789306640625, 6.1318359375, 6.474365234375, 6.81689453125, 7.159423828125, 7.501953125, 7.844482421875, 8.18701171875, 8.529541015625, 8.8720703125, 9.214599609375, 9.55712890625, 9.899658203125, 10.2421875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 8.0, 3.0, 6.0, 11.0, 12.0, 14.0, 22.0, 30.0, 60.0, 71.0, 169.0, 345.0, 768.0, 2171.0, 8678.0, 91603.0, 864385.0, 69318.0, 7481.0, 1951.0, 677.0, 325.0, 161.0, 79.0, 65.0, 33.0, 16.0, 16.0, 20.0, 11.0, 5.0, 7.0, 7.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-7.69140625, -7.46148681640625, -7.2315673828125, -7.00164794921875, -6.771728515625, -6.54180908203125, -6.3118896484375, -6.08197021484375, -5.85205078125, -5.62213134765625, -5.3922119140625, -5.16229248046875, -4.932373046875, -4.70245361328125, -4.4725341796875, -4.24261474609375, -4.0126953125, -3.78277587890625, -3.5528564453125, -3.32293701171875, -3.093017578125, -2.86309814453125, -2.6331787109375, -2.40325927734375, -2.17333984375, -1.94342041015625, -1.7135009765625, -1.48358154296875, -1.253662109375, -1.02374267578125, -0.7938232421875, -0.56390380859375, -0.333984375, -0.10406494140625, 0.1258544921875, 0.35577392578125, 0.585693359375, 0.81561279296875, 1.0455322265625, 1.27545166015625, 1.50537109375, 1.73529052734375, 1.9652099609375, 2.19512939453125, 2.425048828125, 2.65496826171875, 2.8848876953125, 3.11480712890625, 3.3447265625, 3.57464599609375, 3.8045654296875, 4.03448486328125, 4.264404296875, 4.49432373046875, 4.7242431640625, 4.95416259765625, 5.18408203125, 5.41400146484375, 5.6439208984375, 5.87384033203125, 6.103759765625, 6.33367919921875, 6.5635986328125, 6.79351806640625, 7.0234375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 4.0, 6.0, 10.0, 14.0, 10.0, 9.0, 28.0, 20.0, 29.0, 36.0, 49.0, 43.0, 69.0, 110.0, 141.0, 119.0, 55.0, 46.0, 27.0, 36.0, 27.0, 16.0, 19.0, 13.0, 14.0, 8.0, 7.0, 10.0, 5.0, 6.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0008974075317382812, -0.0008689090609550476, -0.000840410590171814, -0.0008119121193885803, -0.0007834136486053467, -0.000754915177822113, -0.0007264167070388794, -0.0006979182362556458, -0.0006694197654724121, -0.0006409212946891785, -0.0006124228239059448, -0.0005839243531227112, -0.0005554258823394775, -0.0005269274115562439, -0.0004984289407730103, -0.0004699304699897766, -0.00044143199920654297, -0.0004129335284233093, -0.0003844350576400757, -0.00035593658685684204, -0.0003274381160736084, -0.00029893964529037476, -0.0002704411745071411, -0.00024194270372390747, -0.00021344423294067383, -0.00018494576215744019, -0.00015644729137420654, -0.0001279488205909729, -9.945034980773926e-05, -7.095187902450562e-05, -4.245340824127197e-05, -1.395493745803833e-05, 1.4543533325195312e-05, 4.3042004108428955e-05, 7.15404748916626e-05, 0.00010003894567489624, 0.00012853741645812988, 0.00015703588724136353, 0.00018553435802459717, 0.0002140328288078308, 0.00024253129959106445, 0.0002710297703742981, 0.00029952824115753174, 0.0003280267119407654, 0.000356525182723999, 0.00038502365350723267, 0.0004135221242904663, 0.00044202059507369995, 0.0004705190658569336, 0.0004990175366401672, 0.0005275160074234009, 0.0005560144782066345, 0.0005845129489898682, 0.0006130114197731018, 0.0006415098905563354, 0.0006700083613395691, 0.0006985068321228027, 0.0007270053029060364, 0.00075550377368927, 0.0007840022444725037, 0.0008125007152557373, 0.000840999186038971, 0.0008694976568222046, 0.0008979961276054382, 0.0009264945983886719]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 9.0, 4.0, 8.0, 11.0, 12.0, 22.0, 17.0, 34.0, 51.0, 63.0, 83.0, 166.0, 257.0, 484.0, 1026.0, 2534.0, 8574.0, 55348.0, 828955.0, 131100.0, 13446.0, 3506.0, 1330.0, 614.0, 342.0, 222.0, 110.0, 64.0, 43.0, 33.0, 27.0, 13.0, 16.0, 10.0, 2.0, 5.0, 8.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.12890625, -5.928955078125, -5.72900390625, -5.529052734375, -5.3291015625, -5.129150390625, -4.92919921875, -4.729248046875, -4.529296875, -4.329345703125, -4.12939453125, -3.929443359375, -3.7294921875, -3.529541015625, -3.32958984375, -3.129638671875, -2.9296875, -2.729736328125, -2.52978515625, -2.329833984375, -2.1298828125, -1.929931640625, -1.72998046875, -1.530029296875, -1.330078125, -1.130126953125, -0.93017578125, -0.730224609375, -0.5302734375, -0.330322265625, -0.13037109375, 0.069580078125, 0.26953125, 0.469482421875, 0.66943359375, 0.869384765625, 1.0693359375, 1.269287109375, 1.46923828125, 1.669189453125, 1.869140625, 2.069091796875, 2.26904296875, 2.468994140625, 2.6689453125, 2.868896484375, 3.06884765625, 3.268798828125, 3.46875, 3.668701171875, 3.86865234375, 4.068603515625, 4.2685546875, 4.468505859375, 4.66845703125, 4.868408203125, 5.068359375, 5.268310546875, 5.46826171875, 5.668212890625, 5.8681640625, 6.068115234375, 6.26806640625, 6.468017578125, 6.66796875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 8.0, 8.0, 13.0, 13.0, 16.0, 28.0, 41.0, 68.0, 68.0, 96.0, 129.0, 106.0, 104.0, 67.0, 53.0, 48.0, 32.0, 22.0, 14.0, 19.0, 10.0, 5.0, 9.0, 1.0, 4.0, 0.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.25390625, -6.08905029296875, -5.9241943359375, -5.75933837890625, -5.594482421875, -5.42962646484375, -5.2647705078125, -5.09991455078125, -4.93505859375, -4.77020263671875, -4.6053466796875, -4.44049072265625, -4.275634765625, -4.11077880859375, -3.9459228515625, -3.78106689453125, -3.6162109375, -3.45135498046875, -3.2864990234375, -3.12164306640625, -2.956787109375, -2.79193115234375, -2.6270751953125, -2.46221923828125, -2.29736328125, -2.13250732421875, -1.9676513671875, -1.80279541015625, -1.637939453125, -1.47308349609375, -1.3082275390625, -1.14337158203125, -0.978515625, -0.81365966796875, -0.6488037109375, -0.48394775390625, -0.319091796875, -0.15423583984375, 0.0106201171875, 0.17547607421875, 0.34033203125, 0.50518798828125, 0.6700439453125, 0.83489990234375, 0.999755859375, 1.16461181640625, 1.3294677734375, 1.49432373046875, 1.6591796875, 1.82403564453125, 1.9888916015625, 2.15374755859375, 2.318603515625, 2.48345947265625, 2.6483154296875, 2.81317138671875, 2.97802734375, 3.14288330078125, 3.3077392578125, 3.47259521484375, 3.637451171875, 3.80230712890625, 3.9671630859375, 4.13201904296875, 4.296875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 6.0, 16.0, 43.0, 73.0, 160.0, 265.0, 235.0, 119.0, 44.0, 19.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.18270874023438, -170.46676635742188, -166.75083923339844, -163.03489685058594, -159.3189697265625, -155.60302734375, -151.8870849609375, -148.17115783691406, -144.45521545410156, -140.73927307128906, -137.02334594726562, -133.30740356445312, -129.5914764404297, -125.87553405761719, -122.15959930419922, -118.44366455078125, -114.72772216796875, -111.01178741455078, -107.29585266113281, -103.57991027832031, -99.86397552490234, -96.14804077148438, -92.4321060180664, -88.71617126464844, -85.00023651123047, -81.2843017578125, -77.56836700439453, -73.85242462158203, -70.13648986816406, -66.4205551147461, -62.704620361328125, -58.98868179321289, -55.27273941040039, -51.55680465698242, -47.84086608886719, -44.12493133544922, -40.408992767333984, -36.693058013916016, -32.97711944580078, -29.261184692382812, -25.54524803161621, -21.82931137084961, -18.113374710083008, -14.397439002990723, -10.681502342224121, -6.965566635131836, -3.2496299743652344, 0.4663066864013672, 4.182243347167969, 7.89818000793457, 11.614116668701172, 15.330052375793457, 19.045989990234375, 22.761924743652344, 26.477861404418945, 30.193798065185547, 33.90973663330078, 37.62567138671875, 41.341609954833984, 45.05754470825195, 48.77348327636719, 52.489418029785156, 56.205352783203125, 59.92129135131836, 63.63722610473633]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 8.0, 4.0, 3.0, 8.0, 8.0, 10.0, 8.0, 14.0, 15.0, 11.0, 11.0, 18.0, 22.0, 27.0, 46.0, 47.0, 41.0, 43.0, 53.0, 77.0, 81.0, 78.0, 53.0, 34.0, 43.0, 24.0, 34.0, 29.0, 25.0, 24.0, 13.0, 23.0, 9.0, 12.0, 13.0, 11.0, 4.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.00893783569336, -45.45629119873047, -43.90364074707031, -42.35099411010742, -40.798343658447266, -39.245697021484375, -37.69304656982422, -36.14039993286133, -34.58775329589844, -33.03510665893555, -31.48245620727539, -29.9298095703125, -28.377159118652344, -26.824512481689453, -25.27186393737793, -23.719215393066406, -22.16656494140625, -20.613916397094727, -19.061267852783203, -17.508621215820312, -15.955971717834473, -14.40332317352295, -12.850675582885742, -11.298027038574219, -9.745378494262695, -8.192729949951172, -6.640081882476807, -5.087433815002441, -3.534785270690918, -1.9821367263793945, -0.4294891357421875, 1.123159408569336, 2.675811767578125, 4.228460311889648, 5.781108379364014, 7.333756446838379, 8.886404991149902, 10.439053535461426, 11.991701126098633, 13.544349670410156, 15.09699821472168, 16.649646759033203, 18.202295303344727, 19.75494384765625, 21.30759048461914, 22.860240936279297, 24.412887573242188, 25.96553611755371, 27.518184661865234, 29.070833206176758, 30.62348175048828, 32.17612838745117, 33.72877883911133, 35.28142547607422, 36.834075927734375, 38.386722564697266, 39.939369201660156, 41.49201583862305, 43.0446662902832, 44.597312927246094, 46.14996337890625, 47.70261001586914, 49.25525665283203, 50.80790710449219, 52.360557556152344]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 7.0, 11.0, 16.0, 21.0, 34.0, 70.0, 95.0, 183.0, 348.0, 703.0, 1717.0, 4714.0, 17269.0, 88455.0, 1157674.0, 2689196.0, 191897.0, 29661.0, 7543.0, 2577.0, 1017.0, 525.0, 226.0, 129.0, 82.0, 44.0, 31.0, 11.0, 8.0, 7.0, 4.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7421875, -5.56378173828125, -5.3853759765625, -5.20697021484375, -5.028564453125, -4.85015869140625, -4.6717529296875, -4.49334716796875, -4.31494140625, -4.13653564453125, -3.9581298828125, -3.77972412109375, -3.601318359375, -3.42291259765625, -3.2445068359375, -3.06610107421875, -2.8876953125, -2.70928955078125, -2.5308837890625, -2.35247802734375, -2.174072265625, -1.99566650390625, -1.8172607421875, -1.63885498046875, -1.46044921875, -1.28204345703125, -1.1036376953125, -0.92523193359375, -0.746826171875, -0.56842041015625, -0.3900146484375, -0.21160888671875, -0.033203125, 0.14520263671875, 0.3236083984375, 0.50201416015625, 0.680419921875, 0.85882568359375, 1.0372314453125, 1.21563720703125, 1.39404296875, 1.57244873046875, 1.7508544921875, 1.92926025390625, 2.107666015625, 2.28607177734375, 2.4644775390625, 2.64288330078125, 2.8212890625, 2.99969482421875, 3.1781005859375, 3.35650634765625, 3.534912109375, 3.71331787109375, 3.8917236328125, 4.07012939453125, 4.24853515625, 4.42694091796875, 4.6053466796875, 4.78375244140625, 4.962158203125, 5.14056396484375, 5.3189697265625, 5.49737548828125, 5.67578125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 9.0, 7.0, 12.0, 15.0, 11.0, 21.0, 31.0, 31.0, 33.0, 41.0, 52.0, 47.0, 62.0, 52.0, 57.0, 54.0, 70.0, 48.0, 51.0, 33.0, 55.0, 41.0, 34.0, 25.0, 25.0, 22.0, 19.0, 8.0, 13.0, 8.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.76934814453125, -2.6715087890625, -2.57366943359375, -2.475830078125, -2.37799072265625, -2.2801513671875, -2.18231201171875, -2.08447265625, -1.98663330078125, -1.8887939453125, -1.79095458984375, -1.693115234375, -1.59527587890625, -1.4974365234375, -1.39959716796875, -1.3017578125, -1.20391845703125, -1.1060791015625, -1.00823974609375, -0.910400390625, -0.81256103515625, -0.7147216796875, -0.61688232421875, -0.51904296875, -0.42120361328125, -0.3233642578125, -0.22552490234375, -0.127685546875, -0.02984619140625, 0.0679931640625, 0.16583251953125, 0.263671875, 0.36151123046875, 0.4593505859375, 0.55718994140625, 0.655029296875, 0.75286865234375, 0.8507080078125, 0.94854736328125, 1.04638671875, 1.14422607421875, 1.2420654296875, 1.33990478515625, 1.437744140625, 1.53558349609375, 1.6334228515625, 1.73126220703125, 1.8291015625, 1.92694091796875, 2.0247802734375, 2.12261962890625, 2.220458984375, 2.31829833984375, 2.4161376953125, 2.51397705078125, 2.61181640625, 2.70965576171875, 2.8074951171875, 2.90533447265625, 3.003173828125, 3.10101318359375, 3.1988525390625, 3.29669189453125, 3.39453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 16.0, 14.0, 26.0, 51.0, 46.0, 88.0, 129.0, 225.0, 476.0, 1017.0, 3274.0, 20689.0, 497659.0, 3571612.0, 86116.0, 9273.0, 2033.0, 730.0, 332.0, 180.0, 93.0, 68.0, 42.0, 21.0, 29.0, 10.0, 6.0, 9.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.15625, -14.7796630859375, -14.403076171875, -14.0264892578125, -13.64990234375, -13.2733154296875, -12.896728515625, -12.5201416015625, -12.1435546875, -11.7669677734375, -11.390380859375, -11.0137939453125, -10.63720703125, -10.2606201171875, -9.884033203125, -9.5074462890625, -9.130859375, -8.7542724609375, -8.377685546875, -8.0010986328125, -7.62451171875, -7.2479248046875, -6.871337890625, -6.4947509765625, -6.1181640625, -5.7415771484375, -5.364990234375, -4.9884033203125, -4.61181640625, -4.2352294921875, -3.858642578125, -3.4820556640625, -3.10546875, -2.7288818359375, -2.352294921875, -1.9757080078125, -1.59912109375, -1.2225341796875, -0.845947265625, -0.4693603515625, -0.0927734375, 0.2838134765625, 0.660400390625, 1.0369873046875, 1.41357421875, 1.7901611328125, 2.166748046875, 2.5433349609375, 2.919921875, 3.2965087890625, 3.673095703125, 4.0496826171875, 4.42626953125, 4.8028564453125, 5.179443359375, 5.5560302734375, 5.9326171875, 6.3092041015625, 6.685791015625, 7.0623779296875, 7.43896484375, 7.8155517578125, 8.192138671875, 8.5687255859375, 8.9453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 10.0, 12.0, 15.0, 11.0, 20.0, 40.0, 46.0, 114.0, 167.0, 311.0, 556.0, 871.0, 761.0, 435.0, 245.0, 141.0, 95.0, 53.0, 44.0, 35.0, 22.0, 15.0, 14.0, 13.0, 7.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0234375, -7.7628173828125, -7.502197265625, -7.2415771484375, -6.98095703125, -6.7203369140625, -6.459716796875, -6.1990966796875, -5.9384765625, -5.6778564453125, -5.417236328125, -5.1566162109375, -4.89599609375, -4.6353759765625, -4.374755859375, -4.1141357421875, -3.853515625, -3.5928955078125, -3.332275390625, -3.0716552734375, -2.81103515625, -2.5504150390625, -2.289794921875, -2.0291748046875, -1.7685546875, -1.5079345703125, -1.247314453125, -0.9866943359375, -0.72607421875, -0.4654541015625, -0.204833984375, 0.0557861328125, 0.31640625, 0.5770263671875, 0.837646484375, 1.0982666015625, 1.35888671875, 1.6195068359375, 1.880126953125, 2.1407470703125, 2.4013671875, 2.6619873046875, 2.922607421875, 3.1832275390625, 3.44384765625, 3.7044677734375, 3.965087890625, 4.2257080078125, 4.486328125, 4.7469482421875, 5.007568359375, 5.2681884765625, 5.52880859375, 5.7894287109375, 6.050048828125, 6.3106689453125, 6.5712890625, 6.8319091796875, 7.092529296875, 7.3531494140625, 7.61376953125, 7.8743896484375, 8.135009765625, 8.3956298828125, 8.65625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 30.0, 78.0, 227.0, 348.0, 200.0, 64.0, 25.0, 6.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.24658966064453, -60.713897705078125, -56.18120574951172, -51.64851379394531, -47.115821838378906, -42.5831298828125, -38.05044174194336, -33.51774978637695, -28.985057830810547, -24.45236587524414, -19.919673919677734, -15.386983871459961, -10.854291915893555, -6.321599960327148, -1.788909912109375, 2.7437820434570312, 7.2764739990234375, 11.809165954589844, 16.34185791015625, 20.874547958374023, 25.40723991394043, 29.939931869506836, 34.47262191772461, 39.005313873291016, 43.53800582885742, 48.07069778442383, 52.603389739990234, 57.136077880859375, 61.66876983642578, 66.20146179199219, 70.7341537475586, 75.266845703125, 79.79954528808594, 84.33223724365234, 88.86492919921875, 93.39762115478516, 97.93031311035156, 102.46300506591797, 106.99569702148438, 111.52838134765625, 116.06108093261719, 120.5937728881836, 125.12646484375, 129.65914916992188, 134.1918487548828, 138.7245330810547, 143.25723266601562, 147.7899169921875, 152.32260131835938, 156.85528564453125, 161.3879852294922, 165.92066955566406, 170.453369140625, 174.98605346679688, 179.5187530517578, 184.0514373779297, 188.58413696289062, 193.1168212890625, 197.64952087402344, 202.1822052001953, 206.71490478515625, 211.24758911132812, 215.78028869628906, 220.31297302246094, 224.84567260742188]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 3.0, 5.0, 8.0, 6.0, 14.0, 9.0, 19.0, 26.0, 21.0, 25.0, 30.0, 40.0, 46.0, 50.0, 56.0, 51.0, 57.0, 75.0, 54.0, 54.0, 49.0, 43.0, 48.0, 38.0, 38.0, 29.0, 26.0, 19.0, 12.0, 16.0, 11.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.97605514526367, -34.665931701660156, -33.355804443359375, -32.04568099975586, -30.735557556152344, -29.425434112548828, -28.11530876159668, -26.80518341064453, -25.495059967041016, -24.1849365234375, -22.87481117248535, -21.564685821533203, -20.254562377929688, -18.944438934326172, -17.634313583374023, -16.324188232421875, -15.01406478881836, -13.703940391540527, -12.393815994262695, -11.083691596984863, -9.773567199707031, -8.4634428024292, -7.153318405151367, -5.843194007873535, -4.533069610595703, -3.222945213317871, -1.912820816040039, -0.602696418762207, 0.707427978515625, 2.017552375793457, 3.327676773071289, 4.637801170349121, 5.947929382324219, 7.258053779602051, 8.568178176879883, 9.878302574157715, 11.188426971435547, 12.498551368713379, 13.808675765991211, 15.118800163269043, 16.428924560546875, 17.73904800415039, 19.04917335510254, 20.359298706054688, 21.669422149658203, 22.97954559326172, 24.289670944213867, 25.599796295166016, 26.90991973876953, 28.220043182373047, 29.530168533325195, 30.840293884277344, 32.15041732788086, 33.460540771484375, 34.770668029785156, 36.08079147338867, 37.39091491699219, 38.7010383605957, 40.01116180419922, 41.3212890625, 42.631412506103516, 43.94153594970703, 45.25166320800781, 46.56178665161133, 47.871910095214844]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 8.0, 11.0, 19.0, 17.0, 39.0, 51.0, 86.0, 122.0, 239.0, 412.0, 870.0, 1781.0, 3842.0, 9402.0, 25101.0, 79635.0, 303053.0, 435641.0, 127588.0, 37541.0, 13001.0, 5342.0, 2335.0, 1135.0, 569.0, 298.0, 163.0, 100.0, 67.0, 36.0, 28.0, 14.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.796875, -6.56396484375, -6.3310546875, -6.09814453125, -5.865234375, -5.63232421875, -5.3994140625, -5.16650390625, -4.93359375, -4.70068359375, -4.4677734375, -4.23486328125, -4.001953125, -3.76904296875, -3.5361328125, -3.30322265625, -3.0703125, -2.83740234375, -2.6044921875, -2.37158203125, -2.138671875, -1.90576171875, -1.6728515625, -1.43994140625, -1.20703125, -0.97412109375, -0.7412109375, -0.50830078125, -0.275390625, -0.04248046875, 0.1904296875, 0.42333984375, 0.65625, 0.88916015625, 1.1220703125, 1.35498046875, 1.587890625, 1.82080078125, 2.0537109375, 2.28662109375, 2.51953125, 2.75244140625, 2.9853515625, 3.21826171875, 3.451171875, 3.68408203125, 3.9169921875, 4.14990234375, 4.3828125, 4.61572265625, 4.8486328125, 5.08154296875, 5.314453125, 5.54736328125, 5.7802734375, 6.01318359375, 6.24609375, 6.47900390625, 6.7119140625, 6.94482421875, 7.177734375, 7.41064453125, 7.6435546875, 7.87646484375, 8.109375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 10.0, 7.0, 5.0, 8.0, 15.0, 15.0, 12.0, 18.0, 20.0, 18.0, 16.0, 23.0, 33.0, 29.0, 31.0, 35.0, 34.0, 50.0, 49.0, 35.0, 38.0, 45.0, 40.0, 54.0, 33.0, 30.0, 31.0, 28.0, 24.0, 31.0, 31.0, 26.0, 23.0, 17.0, 18.0, 8.0, 11.0, 11.0, 8.0, 6.0, 4.0, 7.0, 6.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0], "bins": [-2.36328125, -2.289337158203125, -2.21539306640625, -2.141448974609375, -2.0675048828125, -1.993560791015625, -1.91961669921875, -1.845672607421875, -1.771728515625, -1.697784423828125, -1.62384033203125, -1.549896240234375, -1.4759521484375, -1.402008056640625, -1.32806396484375, -1.254119873046875, -1.18017578125, -1.106231689453125, -1.03228759765625, -0.958343505859375, -0.8843994140625, -0.810455322265625, -0.73651123046875, -0.662567138671875, -0.588623046875, -0.514678955078125, -0.44073486328125, -0.366790771484375, -0.2928466796875, -0.218902587890625, -0.14495849609375, -0.071014404296875, 0.0029296875, 0.076873779296875, 0.15081787109375, 0.224761962890625, 0.2987060546875, 0.372650146484375, 0.44659423828125, 0.520538330078125, 0.594482421875, 0.668426513671875, 0.74237060546875, 0.816314697265625, 0.8902587890625, 0.964202880859375, 1.03814697265625, 1.112091064453125, 1.18603515625, 1.259979248046875, 1.33392333984375, 1.407867431640625, 1.4818115234375, 1.555755615234375, 1.62969970703125, 1.703643798828125, 1.777587890625, 1.851531982421875, 1.92547607421875, 1.999420166015625, 2.0733642578125, 2.147308349609375, 2.22125244140625, 2.295196533203125, 2.369140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 6.0, 3.0, 4.0, 8.0, 9.0, 16.0, 26.0, 33.0, 47.0, 91.0, 155.0, 250.0, 497.0, 1030.0, 2760.0, 11814.0, 167894.0, 819683.0, 35681.0, 5285.0, 1709.0, 699.0, 348.0, 198.0, 127.0, 63.0, 41.0, 21.0, 19.0, 11.0, 4.0, 7.0, 2.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.46875, -17.81494140625, -17.1611328125, -16.50732421875, -15.853515625, -15.19970703125, -14.5458984375, -13.89208984375, -13.23828125, -12.58447265625, -11.9306640625, -11.27685546875, -10.623046875, -9.96923828125, -9.3154296875, -8.66162109375, -8.0078125, -7.35400390625, -6.7001953125, -6.04638671875, -5.392578125, -4.73876953125, -4.0849609375, -3.43115234375, -2.77734375, -2.12353515625, -1.4697265625, -0.81591796875, -0.162109375, 0.49169921875, 1.1455078125, 1.79931640625, 2.453125, 3.10693359375, 3.7607421875, 4.41455078125, 5.068359375, 5.72216796875, 6.3759765625, 7.02978515625, 7.68359375, 8.33740234375, 8.9912109375, 9.64501953125, 10.298828125, 10.95263671875, 11.6064453125, 12.26025390625, 12.9140625, 13.56787109375, 14.2216796875, 14.87548828125, 15.529296875, 16.18310546875, 16.8369140625, 17.49072265625, 18.14453125, 18.79833984375, 19.4521484375, 20.10595703125, 20.759765625, 21.41357421875, 22.0673828125, 22.72119140625, 23.375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 7.0, 8.0, 6.0, 5.0, 14.0, 12.0, 17.0, 18.0, 16.0, 17.0, 25.0, 30.0, 37.0, 32.0, 41.0, 41.0, 35.0, 56.0, 48.0, 35.0, 43.0, 43.0, 40.0, 40.0, 40.0, 30.0, 45.0, 31.0, 28.0, 22.0, 15.0, 16.0, 15.0, 23.0, 10.0, 6.0, 8.0, 8.0, 8.0, 5.0, 7.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-10.421875, -10.111328125, -9.80078125, -9.490234375, -9.1796875, -8.869140625, -8.55859375, -8.248046875, -7.9375, -7.626953125, -7.31640625, -7.005859375, -6.6953125, -6.384765625, -6.07421875, -5.763671875, -5.453125, -5.142578125, -4.83203125, -4.521484375, -4.2109375, -3.900390625, -3.58984375, -3.279296875, -2.96875, -2.658203125, -2.34765625, -2.037109375, -1.7265625, -1.416015625, -1.10546875, -0.794921875, -0.484375, -0.173828125, 0.13671875, 0.447265625, 0.7578125, 1.068359375, 1.37890625, 1.689453125, 2.0, 2.310546875, 2.62109375, 2.931640625, 3.2421875, 3.552734375, 3.86328125, 4.173828125, 4.484375, 4.794921875, 5.10546875, 5.416015625, 5.7265625, 6.037109375, 6.34765625, 6.658203125, 6.96875, 7.279296875, 7.58984375, 7.900390625, 8.2109375, 8.521484375, 8.83203125, 9.142578125, 9.453125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 9.0, 2.0, 11.0, 1.0, 6.0, 11.0, 13.0, 20.0, 26.0, 41.0, 81.0, 87.0, 155.0, 257.0, 447.0, 745.0, 1336.0, 2671.0, 5524.0, 13145.0, 40006.0, 341814.0, 571211.0, 44849.0, 13865.0, 5837.0, 2884.0, 1500.0, 826.0, 409.0, 267.0, 170.0, 125.0, 70.0, 38.0, 30.0, 17.0, 15.0, 13.0, 5.0, 2.0, 4.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.10546875, -5.9022216796875, -5.698974609375, -5.4957275390625, -5.29248046875, -5.0892333984375, -4.885986328125, -4.6827392578125, -4.4794921875, -4.2762451171875, -4.072998046875, -3.8697509765625, -3.66650390625, -3.4632568359375, -3.260009765625, -3.0567626953125, -2.853515625, -2.6502685546875, -2.447021484375, -2.2437744140625, -2.04052734375, -1.8372802734375, -1.634033203125, -1.4307861328125, -1.2275390625, -1.0242919921875, -0.821044921875, -0.6177978515625, -0.41455078125, -0.2113037109375, -0.008056640625, 0.1951904296875, 0.3984375, 0.6016845703125, 0.804931640625, 1.0081787109375, 1.21142578125, 1.4146728515625, 1.617919921875, 1.8211669921875, 2.0244140625, 2.2276611328125, 2.430908203125, 2.6341552734375, 2.83740234375, 3.0406494140625, 3.243896484375, 3.4471435546875, 3.650390625, 3.8536376953125, 4.056884765625, 4.2601318359375, 4.46337890625, 4.6666259765625, 4.869873046875, 5.0731201171875, 5.2763671875, 5.4796142578125, 5.682861328125, 5.8861083984375, 6.08935546875, 6.2926025390625, 6.495849609375, 6.6990966796875, 6.90234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 8.0, 14.0, 21.0, 35.0, 35.0, 74.0, 157.0, 274.0, 134.0, 67.0, 42.0, 34.0, 22.0, 17.0, 11.0, 6.0, 7.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0027599334716796875, -0.002688109874725342, -0.002616286277770996, -0.0025444626808166504, -0.0024726390838623047, -0.002400815486907959, -0.0023289918899536133, -0.0022571682929992676, -0.002185344696044922, -0.002113521099090576, -0.0020416975021362305, -0.0019698739051818848, -0.001898050308227539, -0.0018262267112731934, -0.0017544031143188477, -0.001682579517364502, -0.0016107559204101562, -0.0015389323234558105, -0.0014671087265014648, -0.0013952851295471191, -0.0013234615325927734, -0.0012516379356384277, -0.001179814338684082, -0.0011079907417297363, -0.0010361671447753906, -0.0009643435478210449, -0.0008925199508666992, -0.0008206963539123535, -0.0007488727569580078, -0.0006770491600036621, -0.0006052255630493164, -0.0005334019660949707, -0.000461578369140625, -0.0003897547721862793, -0.0003179311752319336, -0.0002461075782775879, -0.0001742839813232422, -0.00010246038436889648, -3.063678741455078e-05, 4.118680953979492e-05, 0.00011301040649414062, 0.00018483400344848633, 0.00025665760040283203, 0.00032848119735717773, 0.00040030479431152344, 0.00047212839126586914, 0.0005439519882202148, 0.0006157755851745605, 0.0006875991821289062, 0.000759422779083252, 0.0008312463760375977, 0.0009030699729919434, 0.0009748935699462891, 0.0010467171669006348, 0.0011185407638549805, 0.0011903643608093262, 0.0012621879577636719, 0.0013340115547180176, 0.0014058351516723633, 0.001477658748626709, 0.0015494823455810547, 0.0016213059425354004, 0.001693129539489746, 0.0017649531364440918, 0.0018367767333984375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 6.0, 9.0, 3.0, 9.0, 12.0, 7.0, 27.0, 36.0, 49.0, 70.0, 95.0, 150.0, 203.0, 316.0, 529.0, 883.0, 1630.0, 3021.0, 6047.0, 13238.0, 37292.0, 240036.0, 649567.0, 60866.0, 18306.0, 7498.0, 3788.0, 1936.0, 1094.0, 636.0, 407.0, 269.0, 152.0, 106.0, 74.0, 45.0, 49.0, 21.0, 24.0, 12.0, 8.0, 12.0, 3.0, 2.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-5.7109375, -5.55303955078125, -5.3951416015625, -5.23724365234375, -5.079345703125, -4.92144775390625, -4.7635498046875, -4.60565185546875, -4.44775390625, -4.28985595703125, -4.1319580078125, -3.97406005859375, -3.816162109375, -3.65826416015625, -3.5003662109375, -3.34246826171875, -3.1845703125, -3.02667236328125, -2.8687744140625, -2.71087646484375, -2.552978515625, -2.39508056640625, -2.2371826171875, -2.07928466796875, -1.92138671875, -1.76348876953125, -1.6055908203125, -1.44769287109375, -1.289794921875, -1.13189697265625, -0.9739990234375, -0.81610107421875, -0.658203125, -0.50030517578125, -0.3424072265625, -0.18450927734375, -0.026611328125, 0.13128662109375, 0.2891845703125, 0.44708251953125, 0.60498046875, 0.76287841796875, 0.9207763671875, 1.07867431640625, 1.236572265625, 1.39447021484375, 1.5523681640625, 1.71026611328125, 1.8681640625, 2.02606201171875, 2.1839599609375, 2.34185791015625, 2.499755859375, 2.65765380859375, 2.8155517578125, 2.97344970703125, 3.13134765625, 3.28924560546875, 3.4471435546875, 3.60504150390625, 3.762939453125, 3.92083740234375, 4.0787353515625, 4.23663330078125, 4.39453125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 8.0, 5.0, 10.0, 18.0, 10.0, 18.0, 21.0, 23.0, 29.0, 38.0, 42.0, 59.0, 96.0, 92.0, 122.0, 89.0, 45.0, 51.0, 40.0, 33.0, 25.0, 17.0, 15.0, 19.0, 7.0, 10.0, 8.0, 6.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.8828125, -3.76202392578125, -3.6412353515625, -3.52044677734375, -3.399658203125, -3.27886962890625, -3.1580810546875, -3.03729248046875, -2.91650390625, -2.79571533203125, -2.6749267578125, -2.55413818359375, -2.433349609375, -2.31256103515625, -2.1917724609375, -2.07098388671875, -1.9501953125, -1.82940673828125, -1.7086181640625, -1.58782958984375, -1.467041015625, -1.34625244140625, -1.2254638671875, -1.10467529296875, -0.98388671875, -0.86309814453125, -0.7423095703125, -0.62152099609375, -0.500732421875, -0.37994384765625, -0.2591552734375, -0.13836669921875, -0.017578125, 0.10321044921875, 0.2239990234375, 0.34478759765625, 0.465576171875, 0.58636474609375, 0.7071533203125, 0.82794189453125, 0.94873046875, 1.06951904296875, 1.1903076171875, 1.31109619140625, 1.431884765625, 1.55267333984375, 1.6734619140625, 1.79425048828125, 1.9150390625, 2.03582763671875, 2.1566162109375, 2.27740478515625, 2.398193359375, 2.51898193359375, 2.6397705078125, 2.76055908203125, 2.88134765625, 3.00213623046875, 3.1229248046875, 3.24371337890625, 3.364501953125, 3.48529052734375, 3.6060791015625, 3.72686767578125, 3.84765625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 10.0, 11.0, 15.0, 24.0, 48.0, 61.0, 99.0, 176.0, 247.0, 134.0, 67.0, 37.0, 21.0, 15.0, 8.0, 5.0, 1.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-128.41885375976562, -124.98292541503906, -121.5469970703125, -118.11106872558594, -114.6751480102539, -111.23921966552734, -107.80329132080078, -104.36736297607422, -100.93144226074219, -97.49551391601562, -94.05958557128906, -90.6236572265625, -87.18773651123047, -83.7518081665039, -80.31587982177734, -76.87995147705078, -73.44402313232422, -70.00809478759766, -66.5721664428711, -63.1362419128418, -59.7003173828125, -56.26438903808594, -52.828460693359375, -49.39253234863281, -45.956607818603516, -42.52067947387695, -39.084754943847656, -35.648826599121094, -32.21289825439453, -28.776973724365234, -25.341045379638672, -21.905118942260742, -18.469192504882812, -15.033266067504883, -11.597338676452637, -8.16141128540039, -4.725484848022461, -1.2895584106445312, 2.1463699340820312, 5.582296371459961, 9.01822280883789, 12.45414924621582, 15.890076637268066, 19.326004028320312, 22.761930465698242, 26.197856903076172, 29.633785247802734, 33.06970977783203, 36.505638122558594, 39.941566467285156, 43.37749099731445, 46.813419342041016, 50.24934387207031, 53.685272216796875, 57.12120056152344, 60.55712890625, 63.9930534362793, 67.4289779663086, 70.86490631103516, 74.30083465576172, 77.73676300048828, 81.17268371582031, 84.60861206054688, 88.04454040527344, 91.48046875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 6.0, 5.0, 5.0, 4.0, 7.0, 14.0, 19.0, 15.0, 7.0, 14.0, 15.0, 21.0, 33.0, 26.0, 29.0, 26.0, 28.0, 45.0, 59.0, 68.0, 53.0, 69.0, 60.0, 49.0, 33.0, 35.0, 31.0, 35.0, 28.0, 24.0, 16.0, 16.0, 13.0, 15.0, 8.0, 12.0, 12.0, 10.0, 9.0, 8.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.85874557495117, -37.50409698486328, -36.149444580078125, -34.794795989990234, -33.44014358520508, -32.08549499511719, -30.730844497680664, -29.37619400024414, -28.021543502807617, -26.666893005371094, -25.31224250793457, -23.957592010498047, -22.602943420410156, -21.248291015625, -19.89364242553711, -18.538991928100586, -17.184341430664062, -15.829690933227539, -14.475040435791016, -13.120390892028809, -11.765740394592285, -10.411089897155762, -9.056440353393555, -7.701789855957031, -6.347139358520508, -4.992488861083984, -3.637838840484619, -2.283188819885254, -0.9285383224487305, 0.42611217498779297, 1.78076171875, 3.1354122161865234, 4.4900665283203125, 5.844717025756836, 7.199367046356201, 8.554017066955566, 9.90866756439209, 11.263318061828613, 12.61796760559082, 13.972618103027344, 15.327268600463867, 16.68191909790039, 18.036569595336914, 19.391220092773438, 20.745868682861328, 22.100521087646484, 23.455169677734375, 24.8098201751709, 26.164470672607422, 27.519121170043945, 28.87377166748047, 30.22842025756836, 31.583072662353516, 32.937721252441406, 34.29237365722656, 35.64702224731445, 37.001670837402344, 38.356319427490234, 39.71097183227539, 41.06562042236328, 42.42027282714844, 43.77492141723633, 45.12957000732422, 46.484222412109375, 47.83887481689453]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 6.0, 21.0, 15.0, 17.0, 33.0, 54.0, 87.0, 143.0, 324.0, 762.0, 2350.0, 10810.0, 156071.0, 3866026.0, 142854.0, 10752.0, 2361.0, 789.0, 364.0, 158.0, 95.0, 53.0, 37.0, 28.0, 15.0, 12.0, 10.0, 9.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1484375, -10.8052978515625, -10.462158203125, -10.1190185546875, -9.77587890625, -9.4327392578125, -9.089599609375, -8.7464599609375, -8.4033203125, -8.0601806640625, -7.717041015625, -7.3739013671875, -7.03076171875, -6.6876220703125, -6.344482421875, -6.0013427734375, -5.658203125, -5.3150634765625, -4.971923828125, -4.6287841796875, -4.28564453125, -3.9425048828125, -3.599365234375, -3.2562255859375, -2.9130859375, -2.5699462890625, -2.226806640625, -1.8836669921875, -1.54052734375, -1.1973876953125, -0.854248046875, -0.5111083984375, -0.16796875, 0.1751708984375, 0.518310546875, 0.8614501953125, 1.20458984375, 1.5477294921875, 1.890869140625, 2.2340087890625, 2.5771484375, 2.9202880859375, 3.263427734375, 3.6065673828125, 3.94970703125, 4.2928466796875, 4.635986328125, 4.9791259765625, 5.322265625, 5.6654052734375, 6.008544921875, 6.3516845703125, 6.69482421875, 7.0379638671875, 7.381103515625, 7.7242431640625, 8.0673828125, 8.4105224609375, 8.753662109375, 9.0968017578125, 9.43994140625, 9.7830810546875, 10.126220703125, 10.4693603515625, 10.8125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 10.0, 5.0, 17.0, 12.0, 25.0, 26.0, 30.0, 32.0, 35.0, 41.0, 49.0, 52.0, 62.0, 57.0, 57.0, 53.0, 49.0, 49.0, 51.0, 48.0, 48.0, 35.0, 40.0, 27.0, 21.0, 18.0, 3.0, 11.0, 10.0, 3.0, 5.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.736328125, -3.6343994140625, -3.532470703125, -3.4305419921875, -3.32861328125, -3.2266845703125, -3.124755859375, -3.0228271484375, -2.9208984375, -2.8189697265625, -2.717041015625, -2.6151123046875, -2.51318359375, -2.4112548828125, -2.309326171875, -2.2073974609375, -2.10546875, -2.0035400390625, -1.901611328125, -1.7996826171875, -1.69775390625, -1.5958251953125, -1.493896484375, -1.3919677734375, -1.2900390625, -1.1881103515625, -1.086181640625, -0.9842529296875, -0.88232421875, -0.7803955078125, -0.678466796875, -0.5765380859375, -0.474609375, -0.3726806640625, -0.270751953125, -0.1688232421875, -0.06689453125, 0.0350341796875, 0.136962890625, 0.2388916015625, 0.3408203125, 0.4427490234375, 0.544677734375, 0.6466064453125, 0.74853515625, 0.8504638671875, 0.952392578125, 1.0543212890625, 1.15625, 1.2581787109375, 1.360107421875, 1.4620361328125, 1.56396484375, 1.6658935546875, 1.767822265625, 1.8697509765625, 1.9716796875, 2.0736083984375, 2.175537109375, 2.2774658203125, 2.37939453125, 2.4813232421875, 2.583251953125, 2.6851806640625, 2.787109375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 24.0, 21.0, 42.0, 77.0, 124.0, 206.0, 393.0, 1052.0, 4769.0, 141823.0, 4024308.0, 18276.0, 2005.0, 590.0, 250.0, 149.0, 73.0, 42.0, 19.0, 11.0, 3.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.78125, -22.968505859375, -22.15576171875, -21.343017578125, -20.5302734375, -19.717529296875, -18.90478515625, -18.092041015625, -17.279296875, -16.466552734375, -15.65380859375, -14.841064453125, -14.0283203125, -13.215576171875, -12.40283203125, -11.590087890625, -10.77734375, -9.964599609375, -9.15185546875, -8.339111328125, -7.5263671875, -6.713623046875, -5.90087890625, -5.088134765625, -4.275390625, -3.462646484375, -2.64990234375, -1.837158203125, -1.0244140625, -0.211669921875, 0.60107421875, 1.413818359375, 2.2265625, 3.039306640625, 3.85205078125, 4.664794921875, 5.4775390625, 6.290283203125, 7.10302734375, 7.915771484375, 8.728515625, 9.541259765625, 10.35400390625, 11.166748046875, 11.9794921875, 12.792236328125, 13.60498046875, 14.417724609375, 15.23046875, 16.043212890625, 16.85595703125, 17.668701171875, 18.4814453125, 19.294189453125, 20.10693359375, 20.919677734375, 21.732421875, 22.545166015625, 23.35791015625, 24.170654296875, 24.9833984375, 25.796142578125, 26.60888671875, 27.421630859375, 28.234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 7.0, 7.0, 14.0, 39.0, 75.0, 257.0, 1119.0, 1802.0, 492.0, 133.0, 59.0, 29.0, 19.0, 9.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.734375, -24.1197509765625, -23.505126953125, -22.8905029296875, -22.27587890625, -21.6612548828125, -21.046630859375, -20.4320068359375, -19.8173828125, -19.2027587890625, -18.588134765625, -17.9735107421875, -17.35888671875, -16.7442626953125, -16.129638671875, -15.5150146484375, -14.900390625, -14.2857666015625, -13.671142578125, -13.0565185546875, -12.44189453125, -11.8272705078125, -11.212646484375, -10.5980224609375, -9.9833984375, -9.3687744140625, -8.754150390625, -8.1395263671875, -7.52490234375, -6.9102783203125, -6.295654296875, -5.6810302734375, -5.06640625, -4.4517822265625, -3.837158203125, -3.2225341796875, -2.60791015625, -1.9932861328125, -1.378662109375, -0.7640380859375, -0.1494140625, 0.4652099609375, 1.079833984375, 1.6944580078125, 2.30908203125, 2.9237060546875, 3.538330078125, 4.1529541015625, 4.767578125, 5.3822021484375, 5.996826171875, 6.6114501953125, 7.22607421875, 7.8406982421875, 8.455322265625, 9.0699462890625, 9.6845703125, 10.2991943359375, 10.913818359375, 11.5284423828125, 12.14306640625, 12.7576904296875, 13.372314453125, 13.9869384765625, 14.6015625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 12.0, 17.0, 40.0, 182.0, 428.0, 233.0, 56.0, 19.0, 6.0, 5.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-342.37353515625, -335.4742736816406, -328.5749816894531, -321.67572021484375, -314.7764587402344, -307.8771667480469, -300.9779052734375, -294.0786437988281, -287.1793518066406, -280.28009033203125, -273.38079833984375, -266.4815368652344, -259.582275390625, -252.68299865722656, -245.78372192382812, -238.88446044921875, -231.98519897460938, -225.08592224121094, -218.18666076660156, -211.28738403320312, -204.3881072998047, -197.4888458251953, -190.58956909179688, -183.6903076171875, -176.791015625, -169.89173889160156, -162.9924774169922, -156.09320068359375, -149.1939239501953, -142.29466247558594, -135.3953857421875, -128.49612426757812, -121.59684753417969, -114.69757843017578, -107.79830169677734, -100.89903259277344, -93.99976348876953, -87.10049438476562, -80.20121765136719, -73.30194854736328, -66.40267944335938, -59.5034065246582, -52.6041374206543, -45.704864501953125, -38.80559539794922, -31.906322479248047, -25.007049560546875, -18.10778045654297, -11.208503723144531, -4.309232234954834, 2.5900392532348633, 9.489311218261719, 16.388582229614258, 23.287853240966797, 30.18712615966797, 37.086395263671875, 43.98566818237305, 50.88494110107422, 57.784210205078125, 64.68348693847656, 71.58275604248047, 78.48202514648438, 85.38130187988281, 92.28056335449219, 99.17984008789062]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 9.0, 6.0, 12.0, 29.0, 25.0, 32.0, 50.0, 55.0, 91.0, 100.0, 81.0, 104.0, 79.0, 83.0, 63.0, 51.0, 34.0, 24.0, 19.0, 19.0, 12.0, 3.0, 7.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.29466247558594, -62.9083137512207, -60.52196502685547, -58.13561248779297, -55.749263763427734, -53.3629150390625, -50.976566314697266, -48.59021759033203, -46.20386505126953, -43.8175163269043, -41.43116760253906, -39.04481506347656, -36.65846633911133, -34.272117614746094, -31.88576889038086, -29.499418258666992, -27.11307144165039, -24.726722717285156, -22.34037208557129, -19.954023361206055, -17.567672729492188, -15.181324005126953, -12.794975280761719, -10.408624649047852, -8.022275924682617, -5.635926246643066, -3.249577045440674, -0.8632278442382812, 1.5231218338012695, 3.9094715118408203, 6.295820236206055, 8.682170867919922, 11.068519592285156, 13.454869270324707, 15.841218948364258, 18.227567672729492, 20.61391830444336, 23.000267028808594, 25.386615753173828, 27.772966384887695, 30.15931510925293, 32.5456657409668, 34.93201446533203, 37.318363189697266, 39.7047119140625, 42.091064453125, 44.47740936279297, 46.86376190185547, 49.2501106262207, 51.63645935058594, 54.02280807495117, 56.409156799316406, 58.795509338378906, 61.18185806274414, 63.568206787109375, 65.95455932617188, 68.34090423583984, 70.72725677490234, 73.11360168457031, 75.49995422363281, 77.88629913330078, 80.27265167236328, 82.65899658203125, 85.04534912109375, 87.43170166015625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 0.0, 6.0, 2.0, 9.0, 17.0, 27.0, 50.0, 65.0, 150.0, 252.0, 626.0, 1575.0, 4573.0, 15747.0, 73804.0, 361716.0, 453379.0, 105767.0, 21451.0, 5897.0, 1976.0, 819.0, 324.0, 150.0, 77.0, 33.0, 27.0, 15.0, 9.0, 8.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.265625, -6.025634765625, -5.78564453125, -5.545654296875, -5.3056640625, -5.065673828125, -4.82568359375, -4.585693359375, -4.345703125, -4.105712890625, -3.86572265625, -3.625732421875, -3.3857421875, -3.145751953125, -2.90576171875, -2.665771484375, -2.42578125, -2.185791015625, -1.94580078125, -1.705810546875, -1.4658203125, -1.225830078125, -0.98583984375, -0.745849609375, -0.505859375, -0.265869140625, -0.02587890625, 0.214111328125, 0.4541015625, 0.694091796875, 0.93408203125, 1.174072265625, 1.4140625, 1.654052734375, 1.89404296875, 2.134033203125, 2.3740234375, 2.614013671875, 2.85400390625, 3.093994140625, 3.333984375, 3.573974609375, 3.81396484375, 4.053955078125, 4.2939453125, 4.533935546875, 4.77392578125, 5.013916015625, 5.25390625, 5.493896484375, 5.73388671875, 5.973876953125, 6.2138671875, 6.453857421875, 6.69384765625, 6.933837890625, 7.173828125, 7.413818359375, 7.65380859375, 7.893798828125, 8.1337890625, 8.373779296875, 8.61376953125, 8.853759765625, 9.09375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 5.0, 10.0, 9.0, 15.0, 22.0, 23.0, 28.0, 30.0, 45.0, 54.0, 54.0, 76.0, 74.0, 68.0, 81.0, 61.0, 69.0, 56.0, 46.0, 48.0, 33.0, 25.0, 24.0, 16.0, 9.0, 9.0, 6.0, 2.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.48046875, -3.334716796875, -3.18896484375, -3.043212890625, -2.8974609375, -2.751708984375, -2.60595703125, -2.460205078125, -2.314453125, -2.168701171875, -2.02294921875, -1.877197265625, -1.7314453125, -1.585693359375, -1.43994140625, -1.294189453125, -1.1484375, -1.002685546875, -0.85693359375, -0.711181640625, -0.5654296875, -0.419677734375, -0.27392578125, -0.128173828125, 0.017578125, 0.163330078125, 0.30908203125, 0.454833984375, 0.6005859375, 0.746337890625, 0.89208984375, 1.037841796875, 1.18359375, 1.329345703125, 1.47509765625, 1.620849609375, 1.7666015625, 1.912353515625, 2.05810546875, 2.203857421875, 2.349609375, 2.495361328125, 2.64111328125, 2.786865234375, 2.9326171875, 3.078369140625, 3.22412109375, 3.369873046875, 3.515625, 3.661376953125, 3.80712890625, 3.952880859375, 4.0986328125, 4.244384765625, 4.39013671875, 4.535888671875, 4.681640625, 4.827392578125, 4.97314453125, 5.118896484375, 5.2646484375, 5.410400390625, 5.55615234375, 5.701904296875, 5.84765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 4.0, 6.0, 4.0, 6.0, 12.0, 9.0, 19.0, 33.0, 38.0, 52.0, 87.0, 153.0, 246.0, 521.0, 1001.0, 2619.0, 7526.0, 33484.0, 213308.0, 654861.0, 107166.0, 18867.0, 4987.0, 1812.0, 805.0, 370.0, 203.0, 118.0, 60.0, 63.0, 27.0, 22.0, 17.0, 16.0, 11.0, 4.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.8515625, -9.5467529296875, -9.241943359375, -8.9371337890625, -8.63232421875, -8.3275146484375, -8.022705078125, -7.7178955078125, -7.4130859375, -7.1082763671875, -6.803466796875, -6.4986572265625, -6.19384765625, -5.8890380859375, -5.584228515625, -5.2794189453125, -4.974609375, -4.6697998046875, -4.364990234375, -4.0601806640625, -3.75537109375, -3.4505615234375, -3.145751953125, -2.8409423828125, -2.5361328125, -2.2313232421875, -1.926513671875, -1.6217041015625, -1.31689453125, -1.0120849609375, -0.707275390625, -0.4024658203125, -0.09765625, 0.2071533203125, 0.511962890625, 0.8167724609375, 1.12158203125, 1.4263916015625, 1.731201171875, 2.0360107421875, 2.3408203125, 2.6456298828125, 2.950439453125, 3.2552490234375, 3.56005859375, 3.8648681640625, 4.169677734375, 4.4744873046875, 4.779296875, 5.0841064453125, 5.388916015625, 5.6937255859375, 5.99853515625, 6.3033447265625, 6.608154296875, 6.9129638671875, 7.2177734375, 7.5225830078125, 7.827392578125, 8.1322021484375, 8.43701171875, 8.7418212890625, 9.046630859375, 9.3514404296875, 9.65625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 4.0, 2.0, 8.0, 13.0, 7.0, 11.0, 21.0, 24.0, 23.0, 44.0, 23.0, 43.0, 44.0, 56.0, 57.0, 61.0, 49.0, 65.0, 57.0, 47.0, 46.0, 51.0, 33.0, 55.0, 32.0, 28.0, 21.0, 22.0, 11.0, 17.0, 7.0, 9.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.484375, -14.016357421875, -13.54833984375, -13.080322265625, -12.6123046875, -12.144287109375, -11.67626953125, -11.208251953125, -10.740234375, -10.272216796875, -9.80419921875, -9.336181640625, -8.8681640625, -8.400146484375, -7.93212890625, -7.464111328125, -6.99609375, -6.528076171875, -6.06005859375, -5.592041015625, -5.1240234375, -4.656005859375, -4.18798828125, -3.719970703125, -3.251953125, -2.783935546875, -2.31591796875, -1.847900390625, -1.3798828125, -0.911865234375, -0.44384765625, 0.024169921875, 0.4921875, 0.960205078125, 1.42822265625, 1.896240234375, 2.3642578125, 2.832275390625, 3.30029296875, 3.768310546875, 4.236328125, 4.704345703125, 5.17236328125, 5.640380859375, 6.1083984375, 6.576416015625, 7.04443359375, 7.512451171875, 7.98046875, 8.448486328125, 8.91650390625, 9.384521484375, 9.8525390625, 10.320556640625, 10.78857421875, 11.256591796875, 11.724609375, 12.192626953125, 12.66064453125, 13.128662109375, 13.5966796875, 14.064697265625, 14.53271484375, 15.000732421875, 15.46875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 3.0, 9.0, 5.0, 9.0, 12.0, 24.0, 24.0, 58.0, 68.0, 102.0, 139.0, 247.0, 361.0, 586.0, 1068.0, 1879.0, 3518.0, 7019.0, 16125.0, 47420.0, 232192.0, 610915.0, 82617.0, 24015.0, 9742.0, 4570.0, 2395.0, 1340.0, 788.0, 454.0, 322.0, 185.0, 118.0, 62.0, 51.0, 37.0, 33.0, 16.0, 10.0, 10.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.744140625, -3.64349365234375, -3.5428466796875, -3.44219970703125, -3.341552734375, -3.24090576171875, -3.1402587890625, -3.03961181640625, -2.93896484375, -2.83831787109375, -2.7376708984375, -2.63702392578125, -2.536376953125, -2.43572998046875, -2.3350830078125, -2.23443603515625, -2.1337890625, -2.03314208984375, -1.9324951171875, -1.83184814453125, -1.731201171875, -1.63055419921875, -1.5299072265625, -1.42926025390625, -1.32861328125, -1.22796630859375, -1.1273193359375, -1.02667236328125, -0.926025390625, -0.82537841796875, -0.7247314453125, -0.62408447265625, -0.5234375, -0.42279052734375, -0.3221435546875, -0.22149658203125, -0.120849609375, -0.02020263671875, 0.0804443359375, 0.18109130859375, 0.28173828125, 0.38238525390625, 0.4830322265625, 0.58367919921875, 0.684326171875, 0.78497314453125, 0.8856201171875, 0.98626708984375, 1.0869140625, 1.18756103515625, 1.2882080078125, 1.38885498046875, 1.489501953125, 1.59014892578125, 1.6907958984375, 1.79144287109375, 1.89208984375, 1.99273681640625, 2.0933837890625, 2.19403076171875, 2.294677734375, 2.39532470703125, 2.4959716796875, 2.59661865234375, 2.697265625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 5.0, 11.0, 37.0, 66.0, 206.0, 401.0, 148.0, 46.0, 20.0, 16.0, 8.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00295257568359375, -0.0028793662786483765, -0.002806156873703003, -0.0027329474687576294, -0.002659738063812256, -0.0025865286588668823, -0.002513319253921509, -0.0024401098489761353, -0.0023669004440307617, -0.002293691039085388, -0.0022204816341400146, -0.002147272229194641, -0.0020740628242492676, -0.002000853419303894, -0.0019276440143585205, -0.001854434609413147, -0.0017812252044677734, -0.0017080157995224, -0.0016348063945770264, -0.0015615969896316528, -0.0014883875846862793, -0.0014151781797409058, -0.0013419687747955322, -0.0012687593698501587, -0.0011955499649047852, -0.0011223405599594116, -0.001049131155014038, -0.0009759217500686646, -0.000902712345123291, -0.0008295029401779175, -0.0007562935352325439, -0.0006830841302871704, -0.0006098747253417969, -0.0005366653203964233, -0.0004634559154510498, -0.00039024651050567627, -0.00031703710556030273, -0.0002438277006149292, -0.00017061829566955566, -9.740889072418213e-05, -2.4199485778808594e-05, 4.900991916656494e-05, 0.00012221932411193848, 0.000195428729057312, 0.00026863813400268555, 0.0003418475389480591, 0.0004150569438934326, 0.00048826634883880615, 0.0005614757537841797, 0.0006346851587295532, 0.0007078945636749268, 0.0007811039686203003, 0.0008543133735656738, 0.0009275227785110474, 0.001000732183456421, 0.0010739415884017944, 0.001147150993347168, 0.0012203603982925415, 0.001293569803237915, 0.0013667792081832886, 0.0014399886131286621, 0.0015131980180740356, 0.0015864074230194092, 0.0016596168279647827, 0.0017328262329101562]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 9.0, 14.0, 12.0, 24.0, 26.0, 58.0, 66.0, 90.0, 164.0, 289.0, 526.0, 1105.0, 2181.0, 4938.0, 12212.0, 35859.0, 158578.0, 660466.0, 122740.0, 30300.0, 10507.0, 4245.0, 1960.0, 962.0, 483.0, 277.0, 154.0, 103.0, 60.0, 35.0, 25.0, 13.0, 8.0, 13.0, 8.0, 9.0, 5.0, 5.0, 2.0, 2.0, 0.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.13671875, -3.030120849609375, -2.92352294921875, -2.816925048828125, -2.7103271484375, -2.603729248046875, -2.49713134765625, -2.390533447265625, -2.283935546875, -2.177337646484375, -2.07073974609375, -1.964141845703125, -1.8575439453125, -1.750946044921875, -1.64434814453125, -1.537750244140625, -1.43115234375, -1.324554443359375, -1.21795654296875, -1.111358642578125, -1.0047607421875, -0.898162841796875, -0.79156494140625, -0.684967041015625, -0.578369140625, -0.471771240234375, -0.36517333984375, -0.258575439453125, -0.1519775390625, -0.045379638671875, 0.06121826171875, 0.167816162109375, 0.2744140625, 0.381011962890625, 0.48760986328125, 0.594207763671875, 0.7008056640625, 0.807403564453125, 0.91400146484375, 1.020599365234375, 1.127197265625, 1.233795166015625, 1.34039306640625, 1.446990966796875, 1.5535888671875, 1.660186767578125, 1.76678466796875, 1.873382568359375, 1.97998046875, 2.086578369140625, 2.19317626953125, 2.299774169921875, 2.4063720703125, 2.512969970703125, 2.61956787109375, 2.726165771484375, 2.832763671875, 2.939361572265625, 3.04595947265625, 3.152557373046875, 3.2591552734375, 3.365753173828125, 3.47235107421875, 3.578948974609375, 3.685546875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 7.0, 7.0, 18.0, 21.0, 19.0, 26.0, 37.0, 49.0, 60.0, 83.0, 98.0, 98.0, 103.0, 87.0, 67.0, 46.0, 46.0, 24.0, 18.0, 11.0, 14.0, 12.0, 6.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.109375, -3.993896484375, -3.87841796875, -3.762939453125, -3.6474609375, -3.531982421875, -3.41650390625, -3.301025390625, -3.185546875, -3.070068359375, -2.95458984375, -2.839111328125, -2.7236328125, -2.608154296875, -2.49267578125, -2.377197265625, -2.26171875, -2.146240234375, -2.03076171875, -1.915283203125, -1.7998046875, -1.684326171875, -1.56884765625, -1.453369140625, -1.337890625, -1.222412109375, -1.10693359375, -0.991455078125, -0.8759765625, -0.760498046875, -0.64501953125, -0.529541015625, -0.4140625, -0.298583984375, -0.18310546875, -0.067626953125, 0.0478515625, 0.163330078125, 0.27880859375, 0.394287109375, 0.509765625, 0.625244140625, 0.74072265625, 0.856201171875, 0.9716796875, 1.087158203125, 1.20263671875, 1.318115234375, 1.43359375, 1.549072265625, 1.66455078125, 1.780029296875, 1.8955078125, 2.010986328125, 2.12646484375, 2.241943359375, 2.357421875, 2.472900390625, 2.58837890625, 2.703857421875, 2.8193359375, 2.934814453125, 3.05029296875, 3.165771484375, 3.28125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 9.0, 24.0, 42.0, 85.0, 184.0, 277.0, 166.0, 85.0, 61.0, 25.0, 16.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.4755859375, -59.53202819824219, -56.588470458984375, -53.64491271972656, -50.70135498046875, -47.75779724121094, -44.81423568725586, -41.87067794799805, -38.927120208740234, -35.98356246948242, -33.04000473022461, -30.096445083618164, -27.15288734436035, -24.20932960510254, -21.265769958496094, -18.32221221923828, -15.378654479980469, -12.435096740722656, -9.491538047790527, -6.547979354858398, -3.604421615600586, -0.6608638763427734, 2.282695770263672, 5.226253509521484, 8.169811248779297, 11.11336898803711, 14.056927680969238, 17.000486373901367, 19.94404411315918, 22.887601852416992, 25.831161499023438, 28.77471923828125, 31.71826934814453, 34.661827087402344, 37.605384826660156, 40.54894256591797, 43.49250030517578, 46.436058044433594, 49.37961959838867, 52.323177337646484, 55.2667350769043, 58.21029281616211, 61.15385055541992, 64.097412109375, 67.04096984863281, 69.98452758789062, 72.92808532714844, 75.87164306640625, 78.81520080566406, 81.75875854492188, 84.70231628417969, 87.6458740234375, 90.58943176269531, 93.53298950195312, 96.47654724121094, 99.42010498046875, 102.36366271972656, 105.30722045898438, 108.25077819824219, 111.1943359375, 114.13789367675781, 117.08145141601562, 120.02500915527344, 122.96856689453125, 125.9121322631836]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 8.0, 5.0, 8.0, 7.0, 11.0, 14.0, 14.0, 11.0, 6.0, 25.0, 27.0, 35.0, 38.0, 38.0, 44.0, 65.0, 73.0, 95.0, 104.0, 50.0, 55.0, 29.0, 40.0, 35.0, 29.0, 22.0, 21.0, 11.0, 18.0, 11.0, 10.0, 9.0, 8.0, 5.0, 5.0, 4.0, 3.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-60.09502410888672, -58.31275939941406, -56.530494689941406, -54.74822998046875, -52.96596908569336, -51.1837043762207, -49.40143966674805, -47.61917495727539, -45.8369140625, -44.054649353027344, -42.27238464355469, -40.49011993408203, -38.70785903930664, -36.925594329833984, -35.14332962036133, -33.36106491088867, -31.578800201416016, -29.79653549194336, -28.014272689819336, -26.23200798034668, -24.449745178222656, -22.66748046875, -20.885215759277344, -19.102951049804688, -17.320688247680664, -15.538424491882324, -13.756160736083984, -11.973896026611328, -10.191632270812988, -8.409368515014648, -6.627103805541992, -4.844840049743652, -3.062572479248047, -1.280308485031128, 0.501955509185791, 2.284219741821289, 4.066483497619629, 5.848747253417969, 7.631011962890625, 9.413275718688965, 11.195539474487305, 12.977803230285645, 14.760066986083984, 16.54233169555664, 18.324596405029297, 20.10685920715332, 21.889123916625977, 23.67138671875, 25.453651428222656, 27.235916137695312, 29.018178939819336, 30.800443649291992, 32.582706451416016, 34.36497116088867, 36.14723587036133, 37.929500579833984, 39.711761474609375, 41.49402618408203, 43.27629089355469, 45.058555603027344, 46.840816497802734, 48.62308120727539, 50.40534591674805, 52.1876106262207, 53.96987533569336]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 11.0, 19.0, 17.0, 38.0, 50.0, 85.0, 138.0, 237.0, 469.0, 894.0, 1932.0, 5856.0, 25745.0, 301410.0, 3163251.0, 638962.0, 42279.0, 7871.0, 2579.0, 1157.0, 548.0, 302.0, 172.0, 95.0, 67.0, 38.0, 24.0, 17.0, 4.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.4146728515625, -4.227783203125, -4.0408935546875, -3.85400390625, -3.6671142578125, -3.480224609375, -3.2933349609375, -3.1064453125, -2.9195556640625, -2.732666015625, -2.5457763671875, -2.35888671875, -2.1719970703125, -1.985107421875, -1.7982177734375, -1.611328125, -1.4244384765625, -1.237548828125, -1.0506591796875, -0.86376953125, -0.6768798828125, -0.489990234375, -0.3031005859375, -0.1162109375, 0.0706787109375, 0.257568359375, 0.4444580078125, 0.63134765625, 0.8182373046875, 1.005126953125, 1.1920166015625, 1.37890625, 1.5657958984375, 1.752685546875, 1.9395751953125, 2.12646484375, 2.3133544921875, 2.500244140625, 2.6871337890625, 2.8740234375, 3.0609130859375, 3.247802734375, 3.4346923828125, 3.62158203125, 3.8084716796875, 3.995361328125, 4.1822509765625, 4.369140625, 4.5560302734375, 4.742919921875, 4.9298095703125, 5.11669921875, 5.3035888671875, 5.490478515625, 5.6773681640625, 5.8642578125, 6.0511474609375, 6.238037109375, 6.4249267578125, 6.61181640625, 6.7987060546875, 6.985595703125, 7.1724853515625, 7.359375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 0.0, 2.0, 6.0, 8.0, 8.0, 8.0, 6.0, 5.0, 17.0, 10.0, 21.0, 18.0, 27.0, 20.0, 40.0, 43.0, 36.0, 35.0, 56.0, 60.0, 52.0, 49.0, 59.0, 42.0, 41.0, 48.0, 31.0, 41.0, 24.0, 30.0, 24.0, 25.0, 16.0, 15.0, 18.0, 14.0, 8.0, 7.0, 10.0, 3.0, 8.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.427734375, -3.328765869140625, -3.22979736328125, -3.130828857421875, -3.0318603515625, -2.932891845703125, -2.83392333984375, -2.734954833984375, -2.635986328125, -2.537017822265625, -2.43804931640625, -2.339080810546875, -2.2401123046875, -2.141143798828125, -2.04217529296875, -1.943206787109375, -1.84423828125, -1.745269775390625, -1.64630126953125, -1.547332763671875, -1.4483642578125, -1.349395751953125, -1.25042724609375, -1.151458740234375, -1.052490234375, -0.953521728515625, -0.85455322265625, -0.755584716796875, -0.6566162109375, -0.557647705078125, -0.45867919921875, -0.359710693359375, -0.2607421875, -0.161773681640625, -0.06280517578125, 0.036163330078125, 0.1351318359375, 0.234100341796875, 0.33306884765625, 0.432037353515625, 0.531005859375, 0.629974365234375, 0.72894287109375, 0.827911376953125, 0.9268798828125, 1.025848388671875, 1.12481689453125, 1.223785400390625, 1.32275390625, 1.421722412109375, 1.52069091796875, 1.619659423828125, 1.7186279296875, 1.817596435546875, 1.91656494140625, 2.015533447265625, 2.114501953125, 2.213470458984375, 2.31243896484375, 2.411407470703125, 2.5103759765625, 2.609344482421875, 2.70831298828125, 2.807281494140625, 2.90625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 10.0, 11.0, 37.0, 37.0, 76.0, 104.0, 250.0, 517.0, 1535.0, 13374.0, 3686654.0, 483704.0, 6049.0, 1004.0, 446.0, 205.0, 97.0, 67.0, 41.0, 25.0, 16.0, 8.0, 5.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.625, -21.97607421875, -21.3271484375, -20.67822265625, -20.029296875, -19.38037109375, -18.7314453125, -18.08251953125, -17.43359375, -16.78466796875, -16.1357421875, -15.48681640625, -14.837890625, -14.18896484375, -13.5400390625, -12.89111328125, -12.2421875, -11.59326171875, -10.9443359375, -10.29541015625, -9.646484375, -8.99755859375, -8.3486328125, -7.69970703125, -7.05078125, -6.40185546875, -5.7529296875, -5.10400390625, -4.455078125, -3.80615234375, -3.1572265625, -2.50830078125, -1.859375, -1.21044921875, -0.5615234375, 0.08740234375, 0.736328125, 1.38525390625, 2.0341796875, 2.68310546875, 3.33203125, 3.98095703125, 4.6298828125, 5.27880859375, 5.927734375, 6.57666015625, 7.2255859375, 7.87451171875, 8.5234375, 9.17236328125, 9.8212890625, 10.47021484375, 11.119140625, 11.76806640625, 12.4169921875, 13.06591796875, 13.71484375, 14.36376953125, 15.0126953125, 15.66162109375, 16.310546875, 16.95947265625, 17.6083984375, 18.25732421875, 18.90625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 10.0, 15.0, 13.0, 26.0, 45.0, 78.0, 233.0, 620.0, 1390.0, 1001.0, 380.0, 132.0, 51.0, 37.0, 18.0, 8.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8125, -11.41552734375, -11.0185546875, -10.62158203125, -10.224609375, -9.82763671875, -9.4306640625, -9.03369140625, -8.63671875, -8.23974609375, -7.8427734375, -7.44580078125, -7.048828125, -6.65185546875, -6.2548828125, -5.85791015625, -5.4609375, -5.06396484375, -4.6669921875, -4.27001953125, -3.873046875, -3.47607421875, -3.0791015625, -2.68212890625, -2.28515625, -1.88818359375, -1.4912109375, -1.09423828125, -0.697265625, -0.30029296875, 0.0966796875, 0.49365234375, 0.890625, 1.28759765625, 1.6845703125, 2.08154296875, 2.478515625, 2.87548828125, 3.2724609375, 3.66943359375, 4.06640625, 4.46337890625, 4.8603515625, 5.25732421875, 5.654296875, 6.05126953125, 6.4482421875, 6.84521484375, 7.2421875, 7.63916015625, 8.0361328125, 8.43310546875, 8.830078125, 9.22705078125, 9.6240234375, 10.02099609375, 10.41796875, 10.81494140625, 11.2119140625, 11.60888671875, 12.005859375, 12.40283203125, 12.7998046875, 13.19677734375, 13.59375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 9.0, 29.0, 35.0, 55.0, 101.0, 148.0, 195.0, 146.0, 116.0, 62.0, 43.0, 20.0, 10.0, 9.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-93.1906509399414, -91.10945129394531, -89.02825927734375, -86.94705963134766, -84.86585998535156, -82.78466796875, -80.7034683227539, -78.62227630615234, -76.54107666015625, -74.45987701416016, -72.3786849975586, -70.2974853515625, -68.21629333496094, -66.13509368896484, -64.05389404296875, -61.97269821166992, -59.891502380371094, -57.810306549072266, -55.72911071777344, -53.647911071777344, -51.566715240478516, -49.48551940917969, -47.404319763183594, -45.323123931884766, -43.24192810058594, -41.16073226928711, -39.07953643798828, -36.99833679199219, -34.91714096069336, -32.83594512939453, -30.75474739074707, -28.67354965209961, -26.592361450195312, -24.511165618896484, -22.429967880249023, -20.348770141601562, -18.267574310302734, -16.186378479003906, -14.105180740356445, -12.0239839553833, -9.942787170410156, -7.861590385437012, -5.780393600463867, -3.6991968154907227, -1.6180000305175781, 0.4631967544555664, 2.544393539428711, 4.6255903244018555, 6.706787109375, 8.787983894348145, 10.869180679321289, 12.950377464294434, 15.031574249267578, 17.112770080566406, 19.193967819213867, 21.275165557861328, 23.356361389160156, 25.437557220458984, 27.518754959106445, 29.599952697753906, 31.681148529052734, 33.76234436035156, 35.843544006347656, 37.924739837646484, 40.00593566894531]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 5.0, 7.0, 8.0, 11.0, 9.0, 20.0, 19.0, 31.0, 20.0, 34.0, 40.0, 37.0, 39.0, 33.0, 39.0, 46.0, 59.0, 44.0, 47.0, 43.0, 52.0, 38.0, 41.0, 42.0, 40.0, 33.0, 31.0, 27.0, 22.0, 19.0, 7.0, 11.0, 7.0, 7.0, 7.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-34.533119201660156, -33.586387634277344, -32.6396598815918, -31.692928314208984, -30.746196746826172, -29.799467086791992, -28.852737426757812, -27.906005859375, -26.95927619934082, -26.01254653930664, -25.065814971923828, -24.11908531188965, -23.17235565185547, -22.225624084472656, -21.278894424438477, -20.332164764404297, -19.385433197021484, -18.438703536987305, -17.491971969604492, -16.545242309570312, -15.598511695861816, -14.65178108215332, -13.70505142211914, -12.758320808410645, -11.811590194702148, -10.864859580993652, -9.918128967285156, -8.971399307250977, -8.02466869354248, -7.077938079833984, -6.1312079429626465, -5.184477806091309, -4.2377471923828125, -3.2910168170928955, -2.3442864418029785, -1.3975560665130615, -0.45082569122314453, 0.49590492248535156, 1.4426350593566895, 2.3893651962280273, 3.3360958099365234, 4.2828264236450195, 5.229556560516357, 6.176286697387695, 7.123017311096191, 8.069747924804688, 9.016477584838867, 9.963208198547363, 10.90993881225586, 11.856669425964355, 12.803400039672852, 13.750129699707031, 14.696860313415527, 15.643590927124023, 16.590320587158203, 17.537052154541016, 18.483781814575195, 19.430511474609375, 20.377243041992188, 21.323972702026367, 22.270702362060547, 23.21743392944336, 24.16416358947754, 25.11089324951172, 26.05762481689453]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 5.0, 2.0, 17.0, 15.0, 48.0, 64.0, 97.0, 160.0, 278.0, 552.0, 1193.0, 2513.0, 5763.0, 14742.0, 42189.0, 135846.0, 377062.0, 313678.0, 101533.0, 32254.0, 11627.0, 4663.0, 2149.0, 970.0, 499.0, 279.0, 124.0, 80.0, 62.0, 35.0, 24.0, 12.0, 10.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.453125, -4.29339599609375, -4.1336669921875, -3.97393798828125, -3.814208984375, -3.65447998046875, -3.4947509765625, -3.33502197265625, -3.17529296875, -3.01556396484375, -2.8558349609375, -2.69610595703125, -2.536376953125, -2.37664794921875, -2.2169189453125, -2.05718994140625, -1.8974609375, -1.73773193359375, -1.5780029296875, -1.41827392578125, -1.258544921875, -1.09881591796875, -0.9390869140625, -0.77935791015625, -0.61962890625, -0.45989990234375, -0.3001708984375, -0.14044189453125, 0.019287109375, 0.17901611328125, 0.3387451171875, 0.49847412109375, 0.658203125, 0.81793212890625, 0.9776611328125, 1.13739013671875, 1.297119140625, 1.45684814453125, 1.6165771484375, 1.77630615234375, 1.93603515625, 2.09576416015625, 2.2554931640625, 2.41522216796875, 2.574951171875, 2.73468017578125, 2.8944091796875, 3.05413818359375, 3.2138671875, 3.37359619140625, 3.5333251953125, 3.69305419921875, 3.852783203125, 4.01251220703125, 4.1722412109375, 4.33197021484375, 4.49169921875, 4.65142822265625, 4.8111572265625, 4.97088623046875, 5.130615234375, 5.29034423828125, 5.4500732421875, 5.60980224609375, 5.76953125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 4.0, 7.0, 7.0, 4.0, 9.0, 14.0, 11.0, 13.0, 12.0, 20.0, 24.0, 23.0, 46.0, 35.0, 41.0, 46.0, 44.0, 54.0, 57.0, 61.0, 59.0, 41.0, 46.0, 45.0, 35.0, 36.0, 29.0, 22.0, 32.0, 29.0, 17.0, 19.0, 10.0, 7.0, 12.0, 7.0, 11.0, 3.0, 5.0, 0.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.494140625, -3.38336181640625, -3.2725830078125, -3.16180419921875, -3.051025390625, -2.94024658203125, -2.8294677734375, -2.71868896484375, -2.60791015625, -2.49713134765625, -2.3863525390625, -2.27557373046875, -2.164794921875, -2.05401611328125, -1.9432373046875, -1.83245849609375, -1.7216796875, -1.61090087890625, -1.5001220703125, -1.38934326171875, -1.278564453125, -1.16778564453125, -1.0570068359375, -0.94622802734375, -0.83544921875, -0.72467041015625, -0.6138916015625, -0.50311279296875, -0.392333984375, -0.28155517578125, -0.1707763671875, -0.05999755859375, 0.05078125, 0.16156005859375, 0.2723388671875, 0.38311767578125, 0.493896484375, 0.60467529296875, 0.7154541015625, 0.82623291015625, 0.93701171875, 1.04779052734375, 1.1585693359375, 1.26934814453125, 1.380126953125, 1.49090576171875, 1.6016845703125, 1.71246337890625, 1.8232421875, 1.93402099609375, 2.0447998046875, 2.15557861328125, 2.266357421875, 2.37713623046875, 2.4879150390625, 2.59869384765625, 2.70947265625, 2.82025146484375, 2.9310302734375, 3.04180908203125, 3.152587890625, 3.26336669921875, 3.3741455078125, 3.48492431640625, 3.595703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 5.0, 18.0, 18.0, 21.0, 24.0, 36.0, 50.0, 82.0, 91.0, 153.0, 234.0, 372.0, 717.0, 1457.0, 3888.0, 15240.0, 91688.0, 728362.0, 171968.0, 24266.0, 5625.0, 1956.0, 923.0, 481.0, 279.0, 177.0, 133.0, 68.0, 61.0, 44.0, 33.0, 23.0, 10.0, 17.0, 10.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.25, -9.93603515625, -9.6220703125, -9.30810546875, -8.994140625, -8.68017578125, -8.3662109375, -8.05224609375, -7.73828125, -7.42431640625, -7.1103515625, -6.79638671875, -6.482421875, -6.16845703125, -5.8544921875, -5.54052734375, -5.2265625, -4.91259765625, -4.5986328125, -4.28466796875, -3.970703125, -3.65673828125, -3.3427734375, -3.02880859375, -2.71484375, -2.40087890625, -2.0869140625, -1.77294921875, -1.458984375, -1.14501953125, -0.8310546875, -0.51708984375, -0.203125, 0.11083984375, 0.4248046875, 0.73876953125, 1.052734375, 1.36669921875, 1.6806640625, 1.99462890625, 2.30859375, 2.62255859375, 2.9365234375, 3.25048828125, 3.564453125, 3.87841796875, 4.1923828125, 4.50634765625, 4.8203125, 5.13427734375, 5.4482421875, 5.76220703125, 6.076171875, 6.39013671875, 6.7041015625, 7.01806640625, 7.33203125, 7.64599609375, 7.9599609375, 8.27392578125, 8.587890625, 8.90185546875, 9.2158203125, 9.52978515625, 9.84375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 6.0, 7.0, 13.0, 12.0, 18.0, 28.0, 25.0, 39.0, 26.0, 39.0, 64.0, 58.0, 59.0, 50.0, 53.0, 80.0, 50.0, 55.0, 46.0, 43.0, 42.0, 22.0, 37.0, 21.0, 27.0, 12.0, 12.0, 13.0, 8.0, 8.0, 6.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.734375, -15.27783203125, -14.8212890625, -14.36474609375, -13.908203125, -13.45166015625, -12.9951171875, -12.53857421875, -12.08203125, -11.62548828125, -11.1689453125, -10.71240234375, -10.255859375, -9.79931640625, -9.3427734375, -8.88623046875, -8.4296875, -7.97314453125, -7.5166015625, -7.06005859375, -6.603515625, -6.14697265625, -5.6904296875, -5.23388671875, -4.77734375, -4.32080078125, -3.8642578125, -3.40771484375, -2.951171875, -2.49462890625, -2.0380859375, -1.58154296875, -1.125, -0.66845703125, -0.2119140625, 0.24462890625, 0.701171875, 1.15771484375, 1.6142578125, 2.07080078125, 2.52734375, 2.98388671875, 3.4404296875, 3.89697265625, 4.353515625, 4.81005859375, 5.2666015625, 5.72314453125, 6.1796875, 6.63623046875, 7.0927734375, 7.54931640625, 8.005859375, 8.46240234375, 8.9189453125, 9.37548828125, 9.83203125, 10.28857421875, 10.7451171875, 11.20166015625, 11.658203125, 12.11474609375, 12.5712890625, 13.02783203125, 13.484375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 10.0, 21.0, 22.0, 43.0, 56.0, 108.0, 186.0, 322.0, 608.0, 1217.0, 2637.0, 6521.0, 18532.0, 74848.0, 759821.0, 140047.0, 27937.0, 8861.0, 3453.0, 1580.0, 759.0, 408.0, 208.0, 131.0, 73.0, 44.0, 36.0, 16.0, 12.0, 9.0, 4.0, 8.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.505859375, -3.398529052734375, -3.29119873046875, -3.183868408203125, -3.0765380859375, -2.969207763671875, -2.86187744140625, -2.754547119140625, -2.647216796875, -2.539886474609375, -2.43255615234375, -2.325225830078125, -2.2178955078125, -2.110565185546875, -2.00323486328125, -1.895904541015625, -1.78857421875, -1.681243896484375, -1.57391357421875, -1.466583251953125, -1.3592529296875, -1.251922607421875, -1.14459228515625, -1.037261962890625, -0.929931640625, -0.822601318359375, -0.71527099609375, -0.607940673828125, -0.5006103515625, -0.393280029296875, -0.28594970703125, -0.178619384765625, -0.0712890625, 0.036041259765625, 0.14337158203125, 0.250701904296875, 0.3580322265625, 0.465362548828125, 0.57269287109375, 0.680023193359375, 0.787353515625, 0.894683837890625, 1.00201416015625, 1.109344482421875, 1.2166748046875, 1.324005126953125, 1.43133544921875, 1.538665771484375, 1.64599609375, 1.753326416015625, 1.86065673828125, 1.967987060546875, 2.0753173828125, 2.182647705078125, 2.28997802734375, 2.397308349609375, 2.504638671875, 2.611968994140625, 2.71929931640625, 2.826629638671875, 2.9339599609375, 3.041290283203125, 3.14862060546875, 3.255950927734375, 3.36328125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 0.0, 6.0, 13.0, 17.0, 16.0, 36.0, 54.0, 95.0, 179.0, 285.0, 120.0, 50.0, 36.0, 32.0, 18.0, 6.0, 8.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010776519775390625, -0.0010408610105514526, -0.0010040700435638428, -0.0009672790765762329, -0.000930488109588623, -0.0008936971426010132, -0.0008569061756134033, -0.0008201152086257935, -0.0007833242416381836, -0.0007465332746505737, -0.0007097423076629639, -0.000672951340675354, -0.0006361603736877441, -0.0005993694067001343, -0.0005625784397125244, -0.0005257874727249146, -0.0004889965057373047, -0.0004522055387496948, -0.00041541457176208496, -0.0003786236047744751, -0.00034183263778686523, -0.00030504167079925537, -0.0002682507038116455, -0.00023145973682403564, -0.00019466876983642578, -0.00015787780284881592, -0.00012108683586120605, -8.429586887359619e-05, -4.750490188598633e-05, -1.0713934898376465e-05, 2.60770320892334e-05, 6.286799907684326e-05, 9.965896606445312e-05, 0.000136449933052063, 0.00017324090003967285, 0.00021003186702728271, 0.0002468228340148926, 0.00028361380100250244, 0.0003204047679901123, 0.00035719573497772217, 0.00039398670196533203, 0.0004307776689529419, 0.00046756863594055176, 0.0005043596029281616, 0.0005411505699157715, 0.0005779415369033813, 0.0006147325038909912, 0.0006515234708786011, 0.0006883144378662109, 0.0007251054048538208, 0.0007618963718414307, 0.0007986873388290405, 0.0008354783058166504, 0.0008722692728042603, 0.0009090602397918701, 0.00094585120677948, 0.0009826421737670898, 0.0010194331407546997, 0.0010562241077423096, 0.0010930150747299194, 0.0011298060417175293, 0.0011665970087051392, 0.001203387975692749, 0.0012401789426803589, 0.0012769699096679688]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 8.0, 20.0, 27.0, 34.0, 65.0, 124.0, 279.0, 684.0, 1735.0, 5351.0, 24953.0, 316848.0, 659040.0, 29851.0, 6120.0, 1953.0, 720.0, 346.0, 172.0, 96.0, 45.0, 24.0, 16.0, 14.0, 6.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2421875, -5.0733642578125, -4.904541015625, -4.7357177734375, -4.56689453125, -4.3980712890625, -4.229248046875, -4.0604248046875, -3.8916015625, -3.7227783203125, -3.553955078125, -3.3851318359375, -3.21630859375, -3.0474853515625, -2.878662109375, -2.7098388671875, -2.541015625, -2.3721923828125, -2.203369140625, -2.0345458984375, -1.86572265625, -1.6968994140625, -1.528076171875, -1.3592529296875, -1.1904296875, -1.0216064453125, -0.852783203125, -0.6839599609375, -0.51513671875, -0.3463134765625, -0.177490234375, -0.0086669921875, 0.16015625, 0.3289794921875, 0.497802734375, 0.6666259765625, 0.83544921875, 1.0042724609375, 1.173095703125, 1.3419189453125, 1.5107421875, 1.6795654296875, 1.848388671875, 2.0172119140625, 2.18603515625, 2.3548583984375, 2.523681640625, 2.6925048828125, 2.861328125, 3.0301513671875, 3.198974609375, 3.3677978515625, 3.53662109375, 3.7054443359375, 3.874267578125, 4.0430908203125, 4.2119140625, 4.3807373046875, 4.549560546875, 4.7183837890625, 4.88720703125, 5.0560302734375, 5.224853515625, 5.3936767578125, 5.5625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 6.0, 18.0, 13.0, 22.0, 37.0, 63.0, 89.0, 163.0, 176.0, 138.0, 85.0, 64.0, 31.0, 31.0, 17.0, 15.0, 9.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.60546875, -4.4544677734375, -4.303466796875, -4.1524658203125, -4.00146484375, -3.8504638671875, -3.699462890625, -3.5484619140625, -3.3974609375, -3.2464599609375, -3.095458984375, -2.9444580078125, -2.79345703125, -2.6424560546875, -2.491455078125, -2.3404541015625, -2.189453125, -2.0384521484375, -1.887451171875, -1.7364501953125, -1.58544921875, -1.4344482421875, -1.283447265625, -1.1324462890625, -0.9814453125, -0.8304443359375, -0.679443359375, -0.5284423828125, -0.37744140625, -0.2264404296875, -0.075439453125, 0.0755615234375, 0.2265625, 0.3775634765625, 0.528564453125, 0.6795654296875, 0.83056640625, 0.9815673828125, 1.132568359375, 1.2835693359375, 1.4345703125, 1.5855712890625, 1.736572265625, 1.8875732421875, 2.03857421875, 2.1895751953125, 2.340576171875, 2.4915771484375, 2.642578125, 2.7935791015625, 2.944580078125, 3.0955810546875, 3.24658203125, 3.3975830078125, 3.548583984375, 3.6995849609375, 3.8505859375, 4.0015869140625, 4.152587890625, 4.3035888671875, 4.45458984375, 4.6055908203125, 4.756591796875, 4.9075927734375, 5.05859375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 9.0, 23.0, 44.0, 125.0, 367.0, 250.0, 112.0, 37.0, 17.0, 10.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-140.16384887695312, -136.2601318359375, -132.3563995361328, -128.4526824951172, -124.54895782470703, -120.64523315429688, -116.74151611328125, -112.8377914428711, -108.93406677246094, -105.03034210205078, -101.12662506103516, -97.222900390625, -93.31917572021484, -89.41545104980469, -85.51173400878906, -81.6080093383789, -77.70428466796875, -73.8005599975586, -69.89684295654297, -65.99311828613281, -62.089393615722656, -58.185672760009766, -54.281951904296875, -50.37822723388672, -46.474510192871094, -42.5707893371582, -38.66706466674805, -34.763343811035156, -30.859619140625, -26.95589828491211, -23.052175521850586, -19.148452758789062, -15.244728088378906, -11.341005325317383, -7.437283039093018, -3.5335607528686523, 0.3701620101928711, 4.273883819580078, 8.177606582641602, 12.081329345703125, 15.985052108764648, 19.888774871826172, 23.792497634887695, 27.69622039794922, 31.59994125366211, 35.503662109375, 39.407386779785156, 43.31111145019531, 47.2148323059082, 51.118553161621094, 55.02227783203125, 58.92599868774414, 62.8297233581543, 66.73344421386719, 70.63716888427734, 74.5408935546875, 78.44461059570312, 82.34833526611328, 86.2520523071289, 90.15577697753906, 94.05950164794922, 97.96322631835938, 101.866943359375, 105.77066802978516, 109.67439270019531]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 8.0, 3.0, 9.0, 6.0, 6.0, 11.0, 5.0, 10.0, 8.0, 13.0, 24.0, 20.0, 17.0, 24.0, 26.0, 39.0, 35.0, 31.0, 36.0, 53.0, 77.0, 104.0, 84.0, 37.0, 46.0, 29.0, 19.0, 24.0, 23.0, 17.0, 27.0, 21.0, 20.0, 9.0, 15.0, 9.0, 5.0, 11.0, 6.0, 8.0, 5.0, 9.0, 3.0, 3.0, 3.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.3431396484375, -37.967628479003906, -36.59211730957031, -35.21660232543945, -33.84109115600586, -32.465579986572266, -31.090068817138672, -29.714555740356445, -28.33904266357422, -26.963531494140625, -25.5880184173584, -24.212507247924805, -22.836994171142578, -21.461483001708984, -20.08597183227539, -18.710458755493164, -17.33494758605957, -15.95943546295166, -14.58392333984375, -13.208412170410156, -11.83289909362793, -10.457387924194336, -9.081875801086426, -7.706363677978516, -6.3308515548706055, -4.955339431762695, -3.5798275470733643, -2.204315662384033, -0.828803539276123, 0.5467085838317871, 1.922220230102539, 3.297732353210449, 4.673244476318359, 6.0487565994262695, 7.42426872253418, 8.799779891967773, 10.17529296875, 11.550804138183594, 12.926316261291504, 14.301828384399414, 15.677340507507324, 17.052852630615234, 18.428363800048828, 19.803876876831055, 21.17938804626465, 22.554901123046875, 23.93041229248047, 25.305923461914062, 26.68143653869629, 28.056947708129883, 29.43246078491211, 30.807971954345703, 32.1834831237793, 33.558998107910156, 34.93450927734375, 36.310020446777344, 37.68553161621094, 39.06104278564453, 40.436553955078125, 41.812068939208984, 43.18758010864258, 44.56309127807617, 45.938602447509766, 47.314117431640625, 48.68962860107422]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 14.0, 10.0, 15.0, 22.0, 23.0, 50.0, 57.0, 80.0, 144.0, 206.0, 318.0, 608.0, 1130.0, 2336.0, 5147.0, 14899.0, 65149.0, 508961.0, 2612558.0, 850565.0, 99557.0, 20184.0, 6456.0, 2672.0, 1268.0, 692.0, 407.0, 257.0, 159.0, 97.0, 62.0, 44.0, 28.0, 35.0, 20.0, 16.0, 8.0, 10.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.97265625, -4.81536865234375, -4.6580810546875, -4.50079345703125, -4.343505859375, -4.18621826171875, -4.0289306640625, -3.87164306640625, -3.71435546875, -3.55706787109375, -3.3997802734375, -3.24249267578125, -3.085205078125, -2.92791748046875, -2.7706298828125, -2.61334228515625, -2.4560546875, -2.29876708984375, -2.1414794921875, -1.98419189453125, -1.826904296875, -1.66961669921875, -1.5123291015625, -1.35504150390625, -1.19775390625, -1.04046630859375, -0.8831787109375, -0.72589111328125, -0.568603515625, -0.41131591796875, -0.2540283203125, -0.09674072265625, 0.060546875, 0.21783447265625, 0.3751220703125, 0.53240966796875, 0.689697265625, 0.84698486328125, 1.0042724609375, 1.16156005859375, 1.31884765625, 1.47613525390625, 1.6334228515625, 1.79071044921875, 1.947998046875, 2.10528564453125, 2.2625732421875, 2.41986083984375, 2.5771484375, 2.73443603515625, 2.8917236328125, 3.04901123046875, 3.206298828125, 3.36358642578125, 3.5208740234375, 3.67816162109375, 3.83544921875, 3.99273681640625, 4.1500244140625, 4.30731201171875, 4.464599609375, 4.62188720703125, 4.7791748046875, 4.93646240234375, 5.09375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 1.0, 2.0, 6.0, 6.0, 7.0, 6.0, 14.0, 12.0, 15.0, 17.0, 18.0, 17.0, 21.0, 21.0, 37.0, 38.0, 39.0, 35.0, 34.0, 46.0, 54.0, 37.0, 44.0, 46.0, 42.0, 47.0, 39.0, 33.0, 32.0, 35.0, 27.0, 24.0, 20.0, 22.0, 19.0, 15.0, 13.0, 10.0, 7.0, 11.0, 7.0, 12.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.775909423828125, -2.68463134765625, -2.593353271484375, -2.5020751953125, -2.410797119140625, -2.31951904296875, -2.228240966796875, -2.136962890625, -2.045684814453125, -1.95440673828125, -1.863128662109375, -1.7718505859375, -1.680572509765625, -1.58929443359375, -1.498016357421875, -1.40673828125, -1.315460205078125, -1.22418212890625, -1.132904052734375, -1.0416259765625, -0.950347900390625, -0.85906982421875, -0.767791748046875, -0.676513671875, -0.585235595703125, -0.49395751953125, -0.402679443359375, -0.3114013671875, -0.220123291015625, -0.12884521484375, -0.037567138671875, 0.0537109375, 0.144989013671875, 0.23626708984375, 0.327545166015625, 0.4188232421875, 0.510101318359375, 0.60137939453125, 0.692657470703125, 0.783935546875, 0.875213623046875, 0.96649169921875, 1.057769775390625, 1.1490478515625, 1.240325927734375, 1.33160400390625, 1.422882080078125, 1.51416015625, 1.605438232421875, 1.69671630859375, 1.787994384765625, 1.8792724609375, 1.970550537109375, 2.06182861328125, 2.153106689453125, 2.244384765625, 2.335662841796875, 2.42694091796875, 2.518218994140625, 2.6094970703125, 2.700775146484375, 2.79205322265625, 2.883331298828125, 2.974609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 14.0, 19.0, 22.0, 36.0, 59.0, 93.0, 149.0, 295.0, 1210.0, 11293.0, 3010223.0, 1160799.0, 8378.0, 1018.0, 330.0, 142.0, 74.0, 41.0, 32.0, 19.0, 10.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.171875, -20.4404296875, -19.708984375, -18.9775390625, -18.24609375, -17.5146484375, -16.783203125, -16.0517578125, -15.3203125, -14.5888671875, -13.857421875, -13.1259765625, -12.39453125, -11.6630859375, -10.931640625, -10.2001953125, -9.46875, -8.7373046875, -8.005859375, -7.2744140625, -6.54296875, -5.8115234375, -5.080078125, -4.3486328125, -3.6171875, -2.8857421875, -2.154296875, -1.4228515625, -0.69140625, 0.0400390625, 0.771484375, 1.5029296875, 2.234375, 2.9658203125, 3.697265625, 4.4287109375, 5.16015625, 5.8916015625, 6.623046875, 7.3544921875, 8.0859375, 8.8173828125, 9.548828125, 10.2802734375, 11.01171875, 11.7431640625, 12.474609375, 13.2060546875, 13.9375, 14.6689453125, 15.400390625, 16.1318359375, 16.86328125, 17.5947265625, 18.326171875, 19.0576171875, 19.7890625, 20.5205078125, 21.251953125, 21.9833984375, 22.71484375, 23.4462890625, 24.177734375, 24.9091796875, 25.640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 8.0, 9.0, 35.0, 38.0, 57.0, 118.0, 213.0, 419.0, 854.0, 1059.0, 633.0, 288.0, 140.0, 69.0, 45.0, 29.0, 21.0, 12.0, 10.0, 5.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-17.390625, -17.006591796875, -16.62255859375, -16.238525390625, -15.8544921875, -15.470458984375, -15.08642578125, -14.702392578125, -14.318359375, -13.934326171875, -13.55029296875, -13.166259765625, -12.7822265625, -12.398193359375, -12.01416015625, -11.630126953125, -11.24609375, -10.862060546875, -10.47802734375, -10.093994140625, -9.7099609375, -9.325927734375, -8.94189453125, -8.557861328125, -8.173828125, -7.789794921875, -7.40576171875, -7.021728515625, -6.6376953125, -6.253662109375, -5.86962890625, -5.485595703125, -5.1015625, -4.717529296875, -4.33349609375, -3.949462890625, -3.5654296875, -3.181396484375, -2.79736328125, -2.413330078125, -2.029296875, -1.645263671875, -1.26123046875, -0.877197265625, -0.4931640625, -0.109130859375, 0.27490234375, 0.658935546875, 1.04296875, 1.427001953125, 1.81103515625, 2.195068359375, 2.5791015625, 2.963134765625, 3.34716796875, 3.731201171875, 4.115234375, 4.499267578125, 4.88330078125, 5.267333984375, 5.6513671875, 6.035400390625, 6.41943359375, 6.803466796875, 7.1875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 0.0, 3.0, 4.0, 10.0, 24.0, 33.0, 56.0, 63.0, 97.0, 121.0, 137.0, 161.0, 91.0, 66.0, 28.0, 38.0, 19.0, 9.0, 7.0, 5.0, 7.0, 7.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.34293746948242, -47.481319427490234, -45.61970520019531, -43.758087158203125, -41.89646911621094, -40.03485107421875, -38.17323684692383, -36.31161880493164, -34.45000457763672, -32.58838653564453, -30.726770401000977, -28.865154266357422, -27.003536224365234, -25.14192008972168, -23.280303955078125, -21.418685913085938, -19.55706787109375, -17.695451736450195, -15.833833694458008, -13.972217559814453, -12.110600471496582, -10.248983383178711, -8.387367248535156, -6.525750160217285, -4.664133071899414, -2.802516222000122, -0.9408993721008301, 0.9207172393798828, 2.782334327697754, 4.643951416015625, 6.50556755065918, 8.36718463897705, 10.228797912597656, 12.090415000915527, 13.952032089233398, 15.813648223876953, 17.67526626586914, 19.536882400512695, 21.39849853515625, 23.260116577148438, 25.121732711791992, 26.983348846435547, 28.844966888427734, 30.70658302307129, 32.568199157714844, 34.42981719970703, 36.29143524169922, 38.15304946899414, 40.01466751098633, 41.876285552978516, 43.73789978027344, 45.599517822265625, 47.46113586425781, 49.32275390625, 51.18436813354492, 53.04598617553711, 54.90760040283203, 56.76921844482422, 58.63083267211914, 60.49245071411133, 62.354068756103516, 64.21568298339844, 66.07730102539062, 67.93891906738281, 69.800537109375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 6.0, 6.0, 8.0, 7.0, 11.0, 13.0, 20.0, 20.0, 23.0, 35.0, 40.0, 48.0, 47.0, 48.0, 51.0, 60.0, 62.0, 56.0, 69.0, 59.0, 41.0, 44.0, 36.0, 39.0, 39.0, 23.0, 12.0, 19.0, 15.0, 10.0, 13.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.907562255859375, -37.520904541015625, -36.13424301147461, -34.74758529663086, -33.360923767089844, -31.974266052246094, -30.58760643005371, -29.200946807861328, -27.814289093017578, -26.427629470825195, -25.040969848632812, -23.654312133789062, -22.26765251159668, -20.880992889404297, -19.494333267211914, -18.10767364501953, -16.72101402282715, -15.334354400634766, -13.9476957321167, -12.561036109924316, -11.17437744140625, -9.787717819213867, -8.401058197021484, -7.014399528503418, -5.627739906311035, -4.2410807609558105, -2.854421377182007, -1.4677619934082031, -0.08110284805297852, 1.305556297302246, 2.692215919494629, 4.078874588012695, 5.465534210205078, 6.852193355560303, 8.238852500915527, 9.62551212310791, 11.012170791625977, 12.39883041381836, 13.785490036010742, 15.172148704528809, 16.558807373046875, 17.945466995239258, 19.33212661743164, 20.71878433227539, 22.105443954467773, 23.492103576660156, 24.87876319885254, 26.265422821044922, 27.652082443237305, 29.038742065429688, 30.42540168762207, 31.812061309814453, 33.1987190246582, 34.58538055419922, 35.97203826904297, 37.35869598388672, 38.745357513427734, 40.132015228271484, 41.5186767578125, 42.90533447265625, 44.291996002197266, 45.678653717041016, 47.06531524658203, 48.45197296142578, 49.83863067626953]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 5.0, 7.0, 10.0, 11.0, 29.0, 54.0, 96.0, 162.0, 322.0, 577.0, 1142.0, 2283.0, 4807.0, 10552.0, 25984.0, 68747.0, 192895.0, 394685.0, 218155.0, 76849.0, 29092.0, 11852.0, 5241.0, 2474.0, 1195.0, 570.0, 330.0, 175.0, 99.0, 61.0, 34.0, 34.0, 11.0, 8.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.59375, -5.431884765625, -5.27001953125, -5.108154296875, -4.9462890625, -4.784423828125, -4.62255859375, -4.460693359375, -4.298828125, -4.136962890625, -3.97509765625, -3.813232421875, -3.6513671875, -3.489501953125, -3.32763671875, -3.165771484375, -3.00390625, -2.842041015625, -2.68017578125, -2.518310546875, -2.3564453125, -2.194580078125, -2.03271484375, -1.870849609375, -1.708984375, -1.547119140625, -1.38525390625, -1.223388671875, -1.0615234375, -0.899658203125, -0.73779296875, -0.575927734375, -0.4140625, -0.252197265625, -0.09033203125, 0.071533203125, 0.2333984375, 0.395263671875, 0.55712890625, 0.718994140625, 0.880859375, 1.042724609375, 1.20458984375, 1.366455078125, 1.5283203125, 1.690185546875, 1.85205078125, 2.013916015625, 2.17578125, 2.337646484375, 2.49951171875, 2.661376953125, 2.8232421875, 2.985107421875, 3.14697265625, 3.308837890625, 3.470703125, 3.632568359375, 3.79443359375, 3.956298828125, 4.1181640625, 4.280029296875, 4.44189453125, 4.603759765625, 4.765625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 0.0, 0.0, 3.0, 9.0, 5.0, 15.0, 10.0, 11.0, 14.0, 12.0, 21.0, 28.0, 26.0, 31.0, 25.0, 40.0, 37.0, 31.0, 33.0, 37.0, 42.0, 46.0, 42.0, 27.0, 40.0, 36.0, 40.0, 38.0, 39.0, 32.0, 29.0, 32.0, 26.0, 26.0, 19.0, 15.0, 11.0, 8.0, 14.0, 8.0, 11.0, 7.0, 11.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.951171875, -2.858123779296875, -2.76507568359375, -2.672027587890625, -2.5789794921875, -2.485931396484375, -2.39288330078125, -2.299835205078125, -2.206787109375, -2.113739013671875, -2.02069091796875, -1.927642822265625, -1.8345947265625, -1.741546630859375, -1.64849853515625, -1.555450439453125, -1.46240234375, -1.369354248046875, -1.27630615234375, -1.183258056640625, -1.0902099609375, -0.997161865234375, -0.90411376953125, -0.811065673828125, -0.718017578125, -0.624969482421875, -0.53192138671875, -0.438873291015625, -0.3458251953125, -0.252777099609375, -0.15972900390625, -0.066680908203125, 0.0263671875, 0.119415283203125, 0.21246337890625, 0.305511474609375, 0.3985595703125, 0.491607666015625, 0.58465576171875, 0.677703857421875, 0.770751953125, 0.863800048828125, 0.95684814453125, 1.049896240234375, 1.1429443359375, 1.235992431640625, 1.32904052734375, 1.422088623046875, 1.51513671875, 1.608184814453125, 1.70123291015625, 1.794281005859375, 1.8873291015625, 1.980377197265625, 2.07342529296875, 2.166473388671875, 2.259521484375, 2.352569580078125, 2.44561767578125, 2.538665771484375, 2.6317138671875, 2.724761962890625, 2.81781005859375, 2.910858154296875, 3.00390625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 11.0, 7.0, 18.0, 14.0, 24.0, 24.0, 40.0, 69.0, 89.0, 110.0, 194.0, 272.0, 381.0, 625.0, 1024.0, 1899.0, 5051.0, 20485.0, 156625.0, 767096.0, 74843.0, 12098.0, 3524.0, 1549.0, 888.0, 534.0, 311.0, 207.0, 154.0, 110.0, 78.0, 42.0, 50.0, 26.0, 18.0, 20.0, 11.0, 10.0, 10.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.875, -11.5389404296875, -11.202880859375, -10.8668212890625, -10.53076171875, -10.1947021484375, -9.858642578125, -9.5225830078125, -9.1865234375, -8.8504638671875, -8.514404296875, -8.1783447265625, -7.84228515625, -7.5062255859375, -7.170166015625, -6.8341064453125, -6.498046875, -6.1619873046875, -5.825927734375, -5.4898681640625, -5.15380859375, -4.8177490234375, -4.481689453125, -4.1456298828125, -3.8095703125, -3.4735107421875, -3.137451171875, -2.8013916015625, -2.46533203125, -2.1292724609375, -1.793212890625, -1.4571533203125, -1.12109375, -0.7850341796875, -0.448974609375, -0.1129150390625, 0.22314453125, 0.5592041015625, 0.895263671875, 1.2313232421875, 1.5673828125, 1.9034423828125, 2.239501953125, 2.5755615234375, 2.91162109375, 3.2476806640625, 3.583740234375, 3.9197998046875, 4.255859375, 4.5919189453125, 4.927978515625, 5.2640380859375, 5.60009765625, 5.9361572265625, 6.272216796875, 6.6082763671875, 6.9443359375, 7.2803955078125, 7.616455078125, 7.9525146484375, 8.28857421875, 8.6246337890625, 8.960693359375, 9.2967529296875, 9.6328125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 8.0, 10.0, 11.0, 9.0, 18.0, 19.0, 23.0, 31.0, 53.0, 48.0, 50.0, 82.0, 64.0, 58.0, 67.0, 78.0, 70.0, 52.0, 43.0, 44.0, 39.0, 34.0, 26.0, 15.0, 12.0, 14.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.515625, -20.9686279296875, -20.421630859375, -19.8746337890625, -19.32763671875, -18.7806396484375, -18.233642578125, -17.6866455078125, -17.1396484375, -16.5926513671875, -16.045654296875, -15.4986572265625, -14.95166015625, -14.4046630859375, -13.857666015625, -13.3106689453125, -12.763671875, -12.2166748046875, -11.669677734375, -11.1226806640625, -10.57568359375, -10.0286865234375, -9.481689453125, -8.9346923828125, -8.3876953125, -7.8406982421875, -7.293701171875, -6.7467041015625, -6.19970703125, -5.6527099609375, -5.105712890625, -4.5587158203125, -4.01171875, -3.4647216796875, -2.917724609375, -2.3707275390625, -1.82373046875, -1.2767333984375, -0.729736328125, -0.1827392578125, 0.3642578125, 0.9112548828125, 1.458251953125, 2.0052490234375, 2.55224609375, 3.0992431640625, 3.646240234375, 4.1932373046875, 4.740234375, 5.2872314453125, 5.834228515625, 6.3812255859375, 6.92822265625, 7.4752197265625, 8.022216796875, 8.5692138671875, 9.1162109375, 9.6632080078125, 10.210205078125, 10.7572021484375, 11.30419921875, 11.8511962890625, 12.398193359375, 12.9451904296875, 13.4921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 11.0, 7.0, 9.0, 10.0, 16.0, 26.0, 55.0, 67.0, 102.0, 239.0, 555.0, 1593.0, 6985.0, 66482.0, 924843.0, 40169.0, 5130.0, 1273.0, 408.0, 218.0, 113.0, 58.0, 48.0, 31.0, 24.0, 20.0, 5.0, 12.0, 5.0, 4.0, 6.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.4609375, -5.30224609375, -5.1435546875, -4.98486328125, -4.826171875, -4.66748046875, -4.5087890625, -4.35009765625, -4.19140625, -4.03271484375, -3.8740234375, -3.71533203125, -3.556640625, -3.39794921875, -3.2392578125, -3.08056640625, -2.921875, -2.76318359375, -2.6044921875, -2.44580078125, -2.287109375, -2.12841796875, -1.9697265625, -1.81103515625, -1.65234375, -1.49365234375, -1.3349609375, -1.17626953125, -1.017578125, -0.85888671875, -0.7001953125, -0.54150390625, -0.3828125, -0.22412109375, -0.0654296875, 0.09326171875, 0.251953125, 0.41064453125, 0.5693359375, 0.72802734375, 0.88671875, 1.04541015625, 1.2041015625, 1.36279296875, 1.521484375, 1.68017578125, 1.8388671875, 1.99755859375, 2.15625, 2.31494140625, 2.4736328125, 2.63232421875, 2.791015625, 2.94970703125, 3.1083984375, 3.26708984375, 3.42578125, 3.58447265625, 3.7431640625, 3.90185546875, 4.060546875, 4.21923828125, 4.3779296875, 4.53662109375, 4.6953125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 10.0, 8.0, 16.0, 13.0, 17.0, 14.0, 30.0, 30.0, 37.0, 90.0, 155.0, 213.0, 109.0, 59.0, 50.0, 25.0, 15.0, 22.0, 22.0, 7.0, 9.0, 2.0, 8.0, 7.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0007781982421875, -0.0007507205009460449, -0.0007232427597045898, -0.0006957650184631348, -0.0006682872772216797, -0.0006408095359802246, -0.0006133317947387695, -0.0005858540534973145, -0.0005583763122558594, -0.0005308985710144043, -0.0005034208297729492, -0.00047594308853149414, -0.00044846534729003906, -0.000420987606048584, -0.0003935098648071289, -0.00036603212356567383, -0.00033855438232421875, -0.00031107664108276367, -0.0002835988998413086, -0.0002561211585998535, -0.00022864341735839844, -0.00020116567611694336, -0.00017368793487548828, -0.0001462101936340332, -0.00011873245239257812, -9.125471115112305e-05, -6.377696990966797e-05, -3.629922866821289e-05, -8.821487426757812e-06, 1.8656253814697266e-05, 4.6133995056152344e-05, 7.361173629760742e-05, 0.0001010894775390625, 0.00012856721878051758, 0.00015604496002197266, 0.00018352270126342773, 0.0002110004425048828, 0.0002384781837463379, 0.00026595592498779297, 0.00029343366622924805, 0.0003209114074707031, 0.0003483891487121582, 0.0003758668899536133, 0.00040334463119506836, 0.00043082237243652344, 0.0004583001136779785, 0.0004857778549194336, 0.0005132555961608887, 0.0005407333374023438, 0.0005682110786437988, 0.0005956888198852539, 0.000623166561126709, 0.0006506443023681641, 0.0006781220436096191, 0.0007055997848510742, 0.0007330775260925293, 0.0007605552673339844, 0.0007880330085754395, 0.0008155107498168945, 0.0008429884910583496, 0.0008704662322998047, 0.0008979439735412598, 0.0009254217147827148, 0.0009528994560241699, 0.000980377197265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 9.0, 6.0, 9.0, 20.0, 37.0, 36.0, 57.0, 92.0, 117.0, 198.0, 334.0, 567.0, 1194.0, 2630.0, 6710.0, 22599.0, 116138.0, 765448.0, 100745.0, 20355.0, 6145.0, 2428.0, 1154.0, 591.0, 299.0, 201.0, 134.0, 76.0, 61.0, 38.0, 42.0, 13.0, 14.0, 7.0, 10.0, 13.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.85546875, -2.772613525390625, -2.68975830078125, -2.606903076171875, -2.5240478515625, -2.441192626953125, -2.35833740234375, -2.275482177734375, -2.192626953125, -2.109771728515625, -2.02691650390625, -1.944061279296875, -1.8612060546875, -1.778350830078125, -1.69549560546875, -1.612640380859375, -1.52978515625, -1.446929931640625, -1.36407470703125, -1.281219482421875, -1.1983642578125, -1.115509033203125, -1.03265380859375, -0.949798583984375, -0.866943359375, -0.784088134765625, -0.70123291015625, -0.618377685546875, -0.5355224609375, -0.452667236328125, -0.36981201171875, -0.286956787109375, -0.2041015625, -0.121246337890625, -0.03839111328125, 0.044464111328125, 0.1273193359375, 0.210174560546875, 0.29302978515625, 0.375885009765625, 0.458740234375, 0.541595458984375, 0.62445068359375, 0.707305908203125, 0.7901611328125, 0.873016357421875, 0.95587158203125, 1.038726806640625, 1.12158203125, 1.204437255859375, 1.28729248046875, 1.370147705078125, 1.4530029296875, 1.535858154296875, 1.61871337890625, 1.701568603515625, 1.784423828125, 1.867279052734375, 1.95013427734375, 2.032989501953125, 2.1158447265625, 2.198699951171875, 2.28155517578125, 2.364410400390625, 2.447265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 13.0, 11.0, 15.0, 21.0, 35.0, 47.0, 76.0, 108.0, 126.0, 151.0, 105.0, 71.0, 60.0, 38.0, 23.0, 22.0, 19.0, 15.0, 10.0, 6.0, 6.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.953125, -2.8582763671875, -2.763427734375, -2.6685791015625, -2.57373046875, -2.4788818359375, -2.384033203125, -2.2891845703125, -2.1943359375, -2.0994873046875, -2.004638671875, -1.9097900390625, -1.81494140625, -1.7200927734375, -1.625244140625, -1.5303955078125, -1.435546875, -1.3406982421875, -1.245849609375, -1.1510009765625, -1.05615234375, -0.9613037109375, -0.866455078125, -0.7716064453125, -0.6767578125, -0.5819091796875, -0.487060546875, -0.3922119140625, -0.29736328125, -0.2025146484375, -0.107666015625, -0.0128173828125, 0.08203125, 0.1768798828125, 0.271728515625, 0.3665771484375, 0.46142578125, 0.5562744140625, 0.651123046875, 0.7459716796875, 0.8408203125, 0.9356689453125, 1.030517578125, 1.1253662109375, 1.22021484375, 1.3150634765625, 1.409912109375, 1.5047607421875, 1.599609375, 1.6944580078125, 1.789306640625, 1.8841552734375, 1.97900390625, 2.0738525390625, 2.168701171875, 2.2635498046875, 2.3583984375, 2.4532470703125, 2.548095703125, 2.6429443359375, 2.73779296875, 2.8326416015625, 2.927490234375, 3.0223388671875, 3.1171875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 7.0, 13.0, 33.0, 116.0, 491.0, 236.0, 70.0, 18.0, 7.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.6720962524414, -114.6357650756836, -109.59943389892578, -104.56310272216797, -99.52677154541016, -94.49044036865234, -89.45410919189453, -84.41777801513672, -79.3814468383789, -74.3451156616211, -69.30878448486328, -64.27245330810547, -59.236122131347656, -54.199790954589844, -49.16345977783203, -44.12712860107422, -39.090797424316406, -34.054466247558594, -29.01813507080078, -23.98180389404297, -18.945472717285156, -13.909141540527344, -8.872810363769531, -3.8364791870117188, 1.1998519897460938, 6.236183166503906, 11.272514343261719, 16.30884552001953, 21.345176696777344, 26.381507873535156, 31.41783905029297, 36.45417022705078, 41.490509033203125, 46.52684020996094, 51.56317138671875, 56.59950256347656, 61.635833740234375, 66.67216491699219, 71.70849609375, 76.74482727050781, 81.78115844726562, 86.81748962402344, 91.85382080078125, 96.89015197753906, 101.92648315429688, 106.96281433105469, 111.9991455078125, 117.03547668457031, 122.07180786132812, 127.10813903808594, 132.14447021484375, 137.18080139160156, 142.21713256835938, 147.2534637451172, 152.289794921875, 157.3261260986328, 162.36245727539062, 167.39878845214844, 172.43511962890625, 177.47145080566406, 182.50778198242188, 187.5441131591797, 192.5804443359375, 197.6167755126953, 202.65310668945312]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 2.0, 7.0, 7.0, 4.0, 9.0, 10.0, 14.0, 13.0, 11.0, 16.0, 19.0, 21.0, 27.0, 37.0, 30.0, 24.0, 36.0, 52.0, 128.0, 154.0, 70.0, 40.0, 35.0, 23.0, 28.0, 23.0, 24.0, 27.0, 18.0, 14.0, 12.0, 12.0, 9.0, 8.0, 5.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-56.93780517578125, -55.3607177734375, -53.783626556396484, -52.206539154052734, -50.62944793701172, -49.05236053466797, -47.47527313232422, -45.89818572998047, -44.32109451293945, -42.7440071105957, -41.16691589355469, -39.58982849121094, -38.01274108886719, -36.43564987182617, -34.85856246948242, -33.281471252441406, -31.704383850097656, -30.127294540405273, -28.55020523071289, -26.97311782836914, -25.396028518676758, -23.818939208984375, -22.241851806640625, -20.664762496948242, -19.08767318725586, -17.510583877563477, -15.93349552154541, -14.356407165527344, -12.779317855834961, -11.202228546142578, -9.625140190124512, -8.048051834106445, -6.4709625244140625, -4.893873691558838, -3.3167848587036133, -1.7396960258483887, -0.16260719299316406, 1.4144816398620605, 2.991570472717285, 4.568658828735352, 6.145748138427734, 7.722836971282959, 9.299925804138184, 10.87701416015625, 12.454103469848633, 14.031192779541016, 15.608281135559082, 17.18536949157715, 18.76245880126953, 20.339548110961914, 21.916637420654297, 23.493724822998047, 25.07081413269043, 26.647903442382812, 28.224990844726562, 29.802080154418945, 31.379169464111328, 32.95625686645508, 34.533348083496094, 36.110435485839844, 37.687522888183594, 39.26461410522461, 40.84170150756836, 42.418792724609375, 43.995880126953125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 5.0, 12.0, 7.0, 7.0, 19.0, 20.0, 28.0, 44.0, 70.0, 97.0, 142.0, 245.0, 368.0, 607.0, 1024.0, 1928.0, 3849.0, 8776.0, 24282.0, 99219.0, 646034.0, 2308881.0, 912529.0, 136179.0, 29837.0, 10402.0, 4372.0, 2192.0, 1254.0, 673.0, 399.0, 269.0, 172.0, 98.0, 73.0, 52.0, 33.0, 32.0, 17.0, 13.0, 12.0, 4.0, 2.0, 4.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.5234375, -5.3428955078125, -5.162353515625, -4.9818115234375, -4.80126953125, -4.6207275390625, -4.440185546875, -4.2596435546875, -4.0791015625, -3.8985595703125, -3.718017578125, -3.5374755859375, -3.35693359375, -3.1763916015625, -2.995849609375, -2.8153076171875, -2.634765625, -2.4542236328125, -2.273681640625, -2.0931396484375, -1.91259765625, -1.7320556640625, -1.551513671875, -1.3709716796875, -1.1904296875, -1.0098876953125, -0.829345703125, -0.6488037109375, -0.46826171875, -0.2877197265625, -0.107177734375, 0.0733642578125, 0.25390625, 0.4344482421875, 0.614990234375, 0.7955322265625, 0.97607421875, 1.1566162109375, 1.337158203125, 1.5177001953125, 1.6982421875, 1.8787841796875, 2.059326171875, 2.2398681640625, 2.42041015625, 2.6009521484375, 2.781494140625, 2.9620361328125, 3.142578125, 3.3231201171875, 3.503662109375, 3.6842041015625, 3.86474609375, 4.0452880859375, 4.225830078125, 4.4063720703125, 4.5869140625, 4.7674560546875, 4.947998046875, 5.1285400390625, 5.30908203125, 5.4896240234375, 5.670166015625, 5.8507080078125, 6.03125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 8.0, 13.0, 5.0, 13.0, 14.0, 16.0, 16.0, 35.0, 21.0, 24.0, 36.0, 38.0, 25.0, 33.0, 41.0, 45.0, 46.0, 40.0, 39.0, 42.0, 53.0, 33.0, 41.0, 36.0, 35.0, 28.0, 37.0, 25.0, 22.0, 28.0, 11.0, 16.0, 9.0, 4.0, 7.0, 7.0, 5.0, 10.0, 7.0, 5.0, 5.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.65234375, -2.567138671875, -2.48193359375, -2.396728515625, -2.3115234375, -2.226318359375, -2.14111328125, -2.055908203125, -1.970703125, -1.885498046875, -1.80029296875, -1.715087890625, -1.6298828125, -1.544677734375, -1.45947265625, -1.374267578125, -1.2890625, -1.203857421875, -1.11865234375, -1.033447265625, -0.9482421875, -0.863037109375, -0.77783203125, -0.692626953125, -0.607421875, -0.522216796875, -0.43701171875, -0.351806640625, -0.2666015625, -0.181396484375, -0.09619140625, -0.010986328125, 0.07421875, 0.159423828125, 0.24462890625, 0.329833984375, 0.4150390625, 0.500244140625, 0.58544921875, 0.670654296875, 0.755859375, 0.841064453125, 0.92626953125, 1.011474609375, 1.0966796875, 1.181884765625, 1.26708984375, 1.352294921875, 1.4375, 1.522705078125, 1.60791015625, 1.693115234375, 1.7783203125, 1.863525390625, 1.94873046875, 2.033935546875, 2.119140625, 2.204345703125, 2.28955078125, 2.374755859375, 2.4599609375, 2.545166015625, 2.63037109375, 2.715576171875, 2.80078125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 8.0, 9.0, 10.0, 31.0, 26.0, 48.0, 70.0, 131.0, 216.0, 372.0, 826.0, 2411.0, 20429.0, 4044546.0, 117929.0, 4775.0, 1250.0, 509.0, 264.0, 150.0, 91.0, 56.0, 33.0, 23.0, 15.0, 10.0, 7.0, 9.0, 1.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.9375, -28.89453125, -27.8515625, -26.80859375, -25.765625, -24.72265625, -23.6796875, -22.63671875, -21.59375, -20.55078125, -19.5078125, -18.46484375, -17.421875, -16.37890625, -15.3359375, -14.29296875, -13.25, -12.20703125, -11.1640625, -10.12109375, -9.078125, -8.03515625, -6.9921875, -5.94921875, -4.90625, -3.86328125, -2.8203125, -1.77734375, -0.734375, 0.30859375, 1.3515625, 2.39453125, 3.4375, 4.48046875, 5.5234375, 6.56640625, 7.609375, 8.65234375, 9.6953125, 10.73828125, 11.78125, 12.82421875, 13.8671875, 14.91015625, 15.953125, 16.99609375, 18.0390625, 19.08203125, 20.125, 21.16796875, 22.2109375, 23.25390625, 24.296875, 25.33984375, 26.3828125, 27.42578125, 28.46875, 29.51171875, 30.5546875, 31.59765625, 32.640625, 33.68359375, 34.7265625, 35.76953125, 36.8125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 20.0, 22.0, 21.0, 53.0, 88.0, 177.0, 368.0, 1002.0, 1276.0, 582.0, 230.0, 107.0, 60.0, 31.0, 9.0, 13.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.515625, -19.812744140625, -19.10986328125, -18.406982421875, -17.7041015625, -17.001220703125, -16.29833984375, -15.595458984375, -14.892578125, -14.189697265625, -13.48681640625, -12.783935546875, -12.0810546875, -11.378173828125, -10.67529296875, -9.972412109375, -9.26953125, -8.566650390625, -7.86376953125, -7.160888671875, -6.4580078125, -5.755126953125, -5.05224609375, -4.349365234375, -3.646484375, -2.943603515625, -2.24072265625, -1.537841796875, -0.8349609375, -0.132080078125, 0.57080078125, 1.273681640625, 1.9765625, 2.679443359375, 3.38232421875, 4.085205078125, 4.7880859375, 5.490966796875, 6.19384765625, 6.896728515625, 7.599609375, 8.302490234375, 9.00537109375, 9.708251953125, 10.4111328125, 11.114013671875, 11.81689453125, 12.519775390625, 13.22265625, 13.925537109375, 14.62841796875, 15.331298828125, 16.0341796875, 16.737060546875, 17.43994140625, 18.142822265625, 18.845703125, 19.548583984375, 20.25146484375, 20.954345703125, 21.6572265625, 22.360107421875, 23.06298828125, 23.765869140625, 24.46875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 7.0, 4.0, 7.0, 12.0, 25.0, 34.0, 45.0, 117.0, 226.0, 241.0, 144.0, 73.0, 28.0, 10.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.3430938720703, -158.51947021484375, -152.6958465576172, -146.87222290039062, -141.04859924316406, -135.2249755859375, -129.4013671875, -123.5777359008789, -117.75411224365234, -111.93048858642578, -106.10686492919922, -100.28324890136719, -94.45962524414062, -88.63600158691406, -82.8123779296875, -76.98875427246094, -71.16513061523438, -65.34150695800781, -59.51788330078125, -53.69426345825195, -47.87063980102539, -42.04701614379883, -36.22339630126953, -30.39977264404297, -24.576148986816406, -18.752525329589844, -12.928903579711914, -7.105281829833984, -1.2816581726074219, 4.541965484619141, 10.365585327148438, 16.189208984375, 22.012847900390625, 27.836471557617188, 33.66009521484375, 39.48371505737305, 45.30733871459961, 51.13096237182617, 56.95458221435547, 62.77820587158203, 68.6018295288086, 74.42545318603516, 80.24907684326172, 86.07269287109375, 91.89631652832031, 97.71994018554688, 103.54356384277344, 109.3671875, 115.19081115722656, 121.01443481445312, 126.83805847167969, 132.66168212890625, 138.4853057861328, 144.30892944335938, 150.13253784179688, 155.9561767578125, 161.77978515625, 167.60340881347656, 173.42703247070312, 179.2506561279297, 185.07427978515625, 190.8979034423828, 196.72152709960938, 202.54513549804688, 208.3687744140625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 10.0, 9.0, 5.0, 11.0, 20.0, 34.0, 38.0, 58.0, 61.0, 73.0, 71.0, 85.0, 83.0, 91.0, 61.0, 58.0, 51.0, 36.0, 29.0, 29.0, 25.0, 16.0, 13.0, 7.0, 5.0, 6.0, 2.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.46734619140625, -96.44294738769531, -93.41854858398438, -90.39414978027344, -87.3697509765625, -84.34534454345703, -81.3209457397461, -78.29654693603516, -75.27214813232422, -72.24774932861328, -69.22335052490234, -66.1989517211914, -63.1745491027832, -60.150150299072266, -57.12574768066406, -54.101348876953125, -51.07695007324219, -48.05255126953125, -45.02815246582031, -42.00374984741211, -38.97935104370117, -35.954952239990234, -32.93054962158203, -29.906150817871094, -26.881752014160156, -23.85735321044922, -20.83295249938965, -17.808551788330078, -14.78415298461914, -11.759753227233887, -8.735353469848633, -5.7109527587890625, -2.6865615844726562, 0.33783817291259766, 3.3622379302978516, 6.3866376876831055, 9.41103744506836, 12.435437202453613, 15.459836959838867, 18.484237670898438, 21.508636474609375, 24.533035278320312, 27.557435989379883, 30.581836700439453, 33.60623550415039, 36.63063430786133, 39.65503692626953, 42.67943572998047, 45.703834533691406, 48.728233337402344, 51.75263214111328, 54.777034759521484, 57.80143356323242, 60.82583236694336, 63.85023498535156, 66.8746337890625, 69.89903259277344, 72.92343139648438, 75.94783020019531, 78.97222900390625, 81.99662780761719, 85.02103424072266, 88.0454330444336, 91.06983184814453, 94.09423065185547]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 7.0, 10.0, 25.0, 23.0, 37.0, 45.0, 57.0, 66.0, 114.0, 182.0, 234.0, 372.0, 580.0, 842.0, 1289.0, 2007.0, 3529.0, 5958.0, 10996.0, 21867.0, 48110.0, 120887.0, 354096.0, 291513.0, 101111.0, 41497.0, 19227.0, 9805.0, 5401.0, 3125.0, 1924.0, 1234.0, 767.0, 493.0, 349.0, 237.0, 146.0, 120.0, 86.0, 57.0, 42.0, 23.0, 14.0, 11.0, 10.0, 6.0, 3.0, 5.0, 6.0, 3.0, 3.0, 2.0], "bins": [-4.51171875, -4.382476806640625, -4.25323486328125, -4.123992919921875, -3.9947509765625, -3.865509033203125, -3.73626708984375, -3.607025146484375, -3.477783203125, -3.348541259765625, -3.21929931640625, -3.090057373046875, -2.9608154296875, -2.831573486328125, -2.70233154296875, -2.573089599609375, -2.44384765625, -2.314605712890625, -2.18536376953125, -2.056121826171875, -1.9268798828125, -1.797637939453125, -1.66839599609375, -1.539154052734375, -1.409912109375, -1.280670166015625, -1.15142822265625, -1.022186279296875, -0.8929443359375, -0.763702392578125, -0.63446044921875, -0.505218505859375, -0.3759765625, -0.246734619140625, -0.11749267578125, 0.011749267578125, 0.1409912109375, 0.270233154296875, 0.39947509765625, 0.528717041015625, 0.657958984375, 0.787200927734375, 0.91644287109375, 1.045684814453125, 1.1749267578125, 1.304168701171875, 1.43341064453125, 1.562652587890625, 1.69189453125, 1.821136474609375, 1.95037841796875, 2.079620361328125, 2.2088623046875, 2.338104248046875, 2.46734619140625, 2.596588134765625, 2.725830078125, 2.855072021484375, 2.98431396484375, 3.113555908203125, 3.2427978515625, 3.372039794921875, 3.50128173828125, 3.630523681640625, 3.759765625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 11.0, 19.0, 18.0, 13.0, 27.0, 39.0, 37.0, 32.0, 51.0, 52.0, 43.0, 45.0, 51.0, 60.0, 48.0, 55.0, 46.0, 61.0, 41.0, 42.0, 38.0, 34.0, 27.0, 22.0, 17.0, 14.0, 12.0, 5.0, 5.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.27734375, -4.1414794921875, -4.005615234375, -3.8697509765625, -3.73388671875, -3.5980224609375, -3.462158203125, -3.3262939453125, -3.1904296875, -3.0545654296875, -2.918701171875, -2.7828369140625, -2.64697265625, -2.5111083984375, -2.375244140625, -2.2393798828125, -2.103515625, -1.9676513671875, -1.831787109375, -1.6959228515625, -1.56005859375, -1.4241943359375, -1.288330078125, -1.1524658203125, -1.0166015625, -0.8807373046875, -0.744873046875, -0.6090087890625, -0.47314453125, -0.3372802734375, -0.201416015625, -0.0655517578125, 0.0703125, 0.2061767578125, 0.342041015625, 0.4779052734375, 0.61376953125, 0.7496337890625, 0.885498046875, 1.0213623046875, 1.1572265625, 1.2930908203125, 1.428955078125, 1.5648193359375, 1.70068359375, 1.8365478515625, 1.972412109375, 2.1082763671875, 2.244140625, 2.3800048828125, 2.515869140625, 2.6517333984375, 2.78759765625, 2.9234619140625, 3.059326171875, 3.1951904296875, 3.3310546875, 3.4669189453125, 3.602783203125, 3.7386474609375, 3.87451171875, 4.0103759765625, 4.146240234375, 4.2821044921875, 4.41796875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 4.0, 5.0, 8.0, 8.0, 9.0, 6.0, 16.0, 22.0, 22.0, 41.0, 54.0, 56.0, 73.0, 97.0, 168.0, 269.0, 383.0, 810.0, 1812.0, 5321.0, 23781.0, 234301.0, 721511.0, 46078.0, 8614.0, 2480.0, 1050.0, 502.0, 315.0, 217.0, 125.0, 95.0, 64.0, 50.0, 41.0, 28.0, 23.0, 20.0, 16.0, 15.0, 11.0, 12.0, 7.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.38671875, -7.15716552734375, -6.9276123046875, -6.69805908203125, -6.468505859375, -6.23895263671875, -6.0093994140625, -5.77984619140625, -5.55029296875, -5.32073974609375, -5.0911865234375, -4.86163330078125, -4.632080078125, -4.40252685546875, -4.1729736328125, -3.94342041015625, -3.7138671875, -3.48431396484375, -3.2547607421875, -3.02520751953125, -2.795654296875, -2.56610107421875, -2.3365478515625, -2.10699462890625, -1.87744140625, -1.64788818359375, -1.4183349609375, -1.18878173828125, -0.959228515625, -0.72967529296875, -0.5001220703125, -0.27056884765625, -0.041015625, 0.18853759765625, 0.4180908203125, 0.64764404296875, 0.877197265625, 1.10675048828125, 1.3363037109375, 1.56585693359375, 1.79541015625, 2.02496337890625, 2.2545166015625, 2.48406982421875, 2.713623046875, 2.94317626953125, 3.1727294921875, 3.40228271484375, 3.6318359375, 3.86138916015625, 4.0909423828125, 4.32049560546875, 4.550048828125, 4.77960205078125, 5.0091552734375, 5.23870849609375, 5.46826171875, 5.69781494140625, 5.9273681640625, 6.15692138671875, 6.386474609375, 6.61602783203125, 6.8455810546875, 7.07513427734375, 7.3046875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 6.0, 12.0, 8.0, 8.0, 9.0, 13.0, 17.0, 25.0, 14.0, 29.0, 26.0, 26.0, 41.0, 52.0, 64.0, 69.0, 81.0, 74.0, 76.0, 52.0, 51.0, 39.0, 33.0, 16.0, 24.0, 22.0, 13.0, 15.0, 13.0, 11.0, 15.0, 8.0, 8.0, 4.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7578125, -15.2735595703125, -14.789306640625, -14.3050537109375, -13.82080078125, -13.3365478515625, -12.852294921875, -12.3680419921875, -11.8837890625, -11.3995361328125, -10.915283203125, -10.4310302734375, -9.94677734375, -9.4625244140625, -8.978271484375, -8.4940185546875, -8.009765625, -7.5255126953125, -7.041259765625, -6.5570068359375, -6.07275390625, -5.5885009765625, -5.104248046875, -4.6199951171875, -4.1357421875, -3.6514892578125, -3.167236328125, -2.6829833984375, -2.19873046875, -1.7144775390625, -1.230224609375, -0.7459716796875, -0.26171875, 0.2225341796875, 0.706787109375, 1.1910400390625, 1.67529296875, 2.1595458984375, 2.643798828125, 3.1280517578125, 3.6123046875, 4.0965576171875, 4.580810546875, 5.0650634765625, 5.54931640625, 6.0335693359375, 6.517822265625, 7.0020751953125, 7.486328125, 7.9705810546875, 8.454833984375, 8.9390869140625, 9.42333984375, 9.9075927734375, 10.391845703125, 10.8760986328125, 11.3603515625, 11.8446044921875, 12.328857421875, 12.8131103515625, 13.29736328125, 13.7816162109375, 14.265869140625, 14.7501220703125, 15.234375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 7.0, 6.0, 12.0, 18.0, 27.0, 30.0, 65.0, 102.0, 135.0, 273.0, 520.0, 1041.0, 2476.0, 7462.0, 32240.0, 800992.0, 173478.0, 20453.0, 5510.0, 1919.0, 773.0, 417.0, 208.0, 122.0, 82.0, 52.0, 39.0, 28.0, 16.0, 9.0, 13.0, 7.0, 7.0, 2.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2294921875, -1.1896514892578125, -1.149810791015625, -1.1099700927734375, -1.07012939453125, -1.0302886962890625, -0.990447998046875, -0.9506072998046875, -0.9107666015625, -0.8709259033203125, -0.831085205078125, -0.7912445068359375, -0.75140380859375, -0.7115631103515625, -0.671722412109375, -0.6318817138671875, -0.592041015625, -0.5522003173828125, -0.512359619140625, -0.4725189208984375, -0.43267822265625, -0.3928375244140625, -0.352996826171875, -0.3131561279296875, -0.2733154296875, -0.2334747314453125, -0.193634033203125, -0.1537933349609375, -0.11395263671875, -0.0741119384765625, -0.034271240234375, 0.0055694580078125, 0.04541015625, 0.0852508544921875, 0.125091552734375, 0.1649322509765625, 0.20477294921875, 0.2446136474609375, 0.284454345703125, 0.3242950439453125, 0.3641357421875, 0.4039764404296875, 0.443817138671875, 0.4836578369140625, 0.52349853515625, 0.5633392333984375, 0.603179931640625, 0.6430206298828125, 0.682861328125, 0.7227020263671875, 0.762542724609375, 0.8023834228515625, 0.84222412109375, 0.8820648193359375, 0.921905517578125, 0.9617462158203125, 1.0015869140625, 1.0414276123046875, 1.081268310546875, 1.1211090087890625, 1.16094970703125, 1.2007904052734375, 1.240631103515625, 1.2804718017578125, 1.3203125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 7.0, 5.0, 15.0, 12.0, 9.0, 24.0, 28.0, 30.0, 42.0, 81.0, 91.0, 126.0, 165.0, 111.0, 68.0, 45.0, 29.0, 24.0, 14.0, 14.0, 12.0, 8.0, 7.0, 4.0, 9.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003459453582763672, -0.0003336705267429352, -0.0003213956952095032, -0.00030912086367607117, -0.00029684603214263916, -0.00028457120060920715, -0.00027229636907577515, -0.00026002153754234314, -0.00024774670600891113, -0.00023547187447547913, -0.00022319704294204712, -0.0002109222114086151, -0.0001986473798751831, -0.0001863725483417511, -0.0001740977168083191, -0.00016182288527488708, -0.00014954805374145508, -0.00013727322220802307, -0.00012499839067459106, -0.00011272355914115906, -0.00010044872760772705, -8.817389607429504e-05, -7.589906454086304e-05, -6.362423300743103e-05, -5.1349401473999023e-05, -3.9074569940567017e-05, -2.679973840713501e-05, -1.4524906873703003e-05, -2.250075340270996e-06, 1.002475619316101e-05, 2.2299587726593018e-05, 3.4574419260025024e-05, 4.684925079345703e-05, 5.912408232688904e-05, 7.139891386032104e-05, 8.367374539375305e-05, 9.594857692718506e-05, 0.00010822340846061707, 0.00012049823999404907, 0.00013277307152748108, 0.00014504790306091309, 0.0001573227345943451, 0.0001695975661277771, 0.0001818723976612091, 0.0001941472291946411, 0.00020642206072807312, 0.00021869689226150513, 0.00023097172379493713, 0.00024324655532836914, 0.00025552138686180115, 0.00026779621839523315, 0.00028007104992866516, 0.00029234588146209717, 0.0003046207129955292, 0.0003168955445289612, 0.0003291703760623932, 0.0003414452075958252, 0.0003537200391292572, 0.0003659948706626892, 0.0003782697021961212, 0.0003905445337295532, 0.00040281936526298523, 0.00041509419679641724, 0.00042736902832984924, 0.00043964385986328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 1.0, 6.0, 11.0, 13.0, 11.0, 28.0, 23.0, 39.0, 49.0, 76.0, 136.0, 232.0, 387.0, 698.0, 1355.0, 2651.0, 5584.0, 13678.0, 39809.0, 268637.0, 637377.0, 48883.0, 16115.0, 6568.0, 2900.0, 1445.0, 773.0, 399.0, 271.0, 136.0, 95.0, 50.0, 43.0, 26.0, 9.0, 14.0, 9.0, 3.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96728515625, -0.9351272583007812, -0.9029693603515625, -0.8708114624023438, -0.838653564453125, -0.8064956665039062, -0.7743377685546875, -0.7421798706054688, -0.71002197265625, -0.6778640747070312, -0.6457061767578125, -0.6135482788085938, -0.581390380859375, -0.5492324829101562, -0.5170745849609375, -0.48491668701171875, -0.4527587890625, -0.42060089111328125, -0.3884429931640625, -0.35628509521484375, -0.324127197265625, -0.29196929931640625, -0.2598114013671875, -0.22765350341796875, -0.19549560546875, -0.16333770751953125, -0.1311798095703125, -0.09902191162109375, -0.066864013671875, -0.03470611572265625, -0.0025482177734375, 0.02960968017578125, 0.061767578125, 0.09392547607421875, 0.1260833740234375, 0.15824127197265625, 0.190399169921875, 0.22255706787109375, 0.2547149658203125, 0.28687286376953125, 0.31903076171875, 0.35118865966796875, 0.3833465576171875, 0.41550445556640625, 0.447662353515625, 0.47982025146484375, 0.5119781494140625, 0.5441360473632812, 0.5762939453125, 0.6084518432617188, 0.6406097412109375, 0.6727676391601562, 0.704925537109375, 0.7370834350585938, 0.7692413330078125, 0.8013992309570312, 0.83355712890625, 0.8657150268554688, 0.8978729248046875, 0.9300308227539062, 0.962188720703125, 0.9943466186523438, 1.0265045166015625, 1.0586624145507812, 1.0908203125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 5.0, 9.0, 5.0, 10.0, 6.0, 13.0, 17.0, 17.0, 25.0, 69.0, 82.0, 110.0, 144.0, 141.0, 107.0, 77.0, 37.0, 33.0, 16.0, 10.0, 16.0, 11.0, 5.0, 4.0, 4.0, 5.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.7490234375, -1.702728271484375, -1.65643310546875, -1.610137939453125, -1.5638427734375, -1.517547607421875, -1.47125244140625, -1.424957275390625, -1.378662109375, -1.332366943359375, -1.28607177734375, -1.239776611328125, -1.1934814453125, -1.147186279296875, -1.10089111328125, -1.054595947265625, -1.00830078125, -0.962005615234375, -0.91571044921875, -0.869415283203125, -0.8231201171875, -0.776824951171875, -0.73052978515625, -0.684234619140625, -0.637939453125, -0.591644287109375, -0.54534912109375, -0.499053955078125, -0.4527587890625, -0.406463623046875, -0.36016845703125, -0.313873291015625, -0.267578125, -0.221282958984375, -0.17498779296875, -0.128692626953125, -0.0823974609375, -0.036102294921875, 0.01019287109375, 0.056488037109375, 0.102783203125, 0.149078369140625, 0.19537353515625, 0.241668701171875, 0.2879638671875, 0.334259033203125, 0.38055419921875, 0.426849365234375, 0.47314453125, 0.519439697265625, 0.56573486328125, 0.612030029296875, 0.6583251953125, 0.704620361328125, 0.75091552734375, 0.797210693359375, 0.843505859375, 0.889801025390625, 0.93609619140625, 0.982391357421875, 1.0286865234375, 1.074981689453125, 1.12127685546875, 1.167572021484375, 1.2138671875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 12.0, 52.0, 96.0, 531.0, 192.0, 80.0, 23.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.45187377929688, -104.05889129638672, -100.66590881347656, -97.2729263305664, -93.87994384765625, -90.48696899414062, -87.09397888183594, -83.70100402832031, -80.30802154541016, -76.9150390625, -73.52205657958984, -70.12907409667969, -66.73609161376953, -63.34311294555664, -59.950130462646484, -56.557151794433594, -53.16416549682617, -49.771183013916016, -46.37820053100586, -42.98522186279297, -39.59223937988281, -36.199256896972656, -32.8062744140625, -29.413293838500977, -26.02031135559082, -22.627328872680664, -19.23434829711914, -15.841365814208984, -12.448384284973145, -9.055402755737305, -5.662420272827148, -2.269439697265625, 1.1235427856445312, 4.516524314880371, 7.909506320953369, 11.302488327026367, 14.695469856262207, 18.088451385498047, 21.481433868408203, 24.874414443969727, 28.267396926879883, 31.66037940979004, 35.05335998535156, 38.44634246826172, 41.839324951171875, 45.23230743408203, 48.62528991699219, 52.01826858520508, 55.411251068115234, 58.80423355102539, 62.19721603393555, 65.59019470214844, 68.9831771850586, 72.37615966796875, 75.7691421508789, 79.16212463378906, 82.55510711669922, 85.94808959960938, 89.34107208251953, 92.73405456542969, 96.12703704833984, 99.52001953125, 102.91299438476562, 106.30597686767578, 109.69895935058594]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 9.0, 7.0, 11.0, 11.0, 13.0, 11.0, 14.0, 25.0, 22.0, 21.0, 17.0, 34.0, 22.0, 129.0, 134.0, 48.0, 68.0, 139.0, 48.0, 35.0, 20.0, 16.0, 18.0, 15.0, 17.0, 13.0, 10.0, 12.0, 7.0, 6.0, 8.0, 4.0, 7.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-50.79786682128906, -49.41446304321289, -48.031063079833984, -46.64765930175781, -45.264259338378906, -43.880855560302734, -42.49745178222656, -41.114051818847656, -39.730648040771484, -38.34724426269531, -36.963844299316406, -35.580440521240234, -34.19704055786133, -32.813636779785156, -31.430234909057617, -30.046833038330078, -28.66343116760254, -27.280029296875, -25.89662742614746, -24.513225555419922, -23.12982177734375, -21.74641990661621, -20.363018035888672, -18.9796142578125, -17.596214294433594, -16.212812423706055, -14.8294095993042, -13.44600772857666, -12.062604904174805, -10.679203033447266, -9.295801162719727, -7.912398338317871, -6.528995513916016, -5.145593166351318, -3.7621910572052, -2.378788948059082, -0.9953866004943848, 0.3880157470703125, 1.7714176177978516, 3.154820442199707, 4.538222312927246, 5.921624660491943, 7.305027008056641, 8.68842887878418, 10.071830749511719, 11.455233573913574, 12.838635444641113, 14.222038269042969, 15.605440139770508, 16.988842010498047, 18.372243881225586, 19.755645751953125, 21.139049530029297, 22.522451400756836, 23.905853271484375, 25.289257049560547, 26.672657012939453, 28.056058883666992, 29.43946075439453, 30.822864532470703, 32.20626449584961, 33.58966827392578, 34.97306823730469, 36.35647201538086, 37.73987579345703]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 17.0, 9.0, 15.0, 20.0, 34.0, 52.0, 37.0, 54.0, 111.0, 344.0, 79.0, 62.0, 40.0, 34.0, 34.0, 19.0, 16.0, 2.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.3515625, -9.1136474609375, -8.875732421875, -8.6378173828125, -8.39990234375, -8.1619873046875, -7.924072265625, -7.6861572265625, -7.4482421875, -7.2103271484375, -6.972412109375, -6.7344970703125, -6.49658203125, -6.2586669921875, -6.020751953125, -5.7828369140625, -5.544921875, -5.3070068359375, -5.069091796875, -4.8311767578125, -4.59326171875, -4.3553466796875, -4.117431640625, -3.8795166015625, -3.6416015625, -3.4036865234375, -3.165771484375, -2.9278564453125, -2.68994140625, -2.4520263671875, -2.214111328125, -1.9761962890625, -1.73828125, -1.5003662109375, -1.262451171875, -1.0245361328125, -0.78662109375, -0.5487060546875, -0.310791015625, -0.0728759765625, 0.1650390625, 0.4029541015625, 0.640869140625, 0.8787841796875, 1.11669921875, 1.3546142578125, 1.592529296875, 1.8304443359375, 2.068359375, 2.3062744140625, 2.544189453125, 2.7821044921875, 3.02001953125, 3.2579345703125, 3.495849609375, 3.7337646484375, 3.9716796875, 4.2095947265625, 4.447509765625, 4.6854248046875, 4.92333984375, 5.1612548828125, 5.399169921875, 5.6370849609375, 5.875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 9.0, 11.0, 19.0, 16.0, 8.0, 13.0, 23.0, 32.0, 75.0, 84.0, 129.0, 243.0, 410.0, 868.0, 2506.0, 10594.0, 8305511.0, 59722.0, 5268.0, 1558.0, 626.0, 271.0, 208.0, 120.0, 81.0, 45.0, 35.0, 23.0, 19.0, 17.0, 7.0, 7.0, 7.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-54.406837463378906, -52.967220306396484, -51.52760696411133, -50.087989807128906, -48.64837646484375, -47.20875930786133, -45.769142150878906, -44.32952880859375, -42.88991165161133, -41.450294494628906, -40.01068115234375, -38.57106399536133, -37.131446838378906, -35.69183349609375, -34.25221633911133, -32.812599182128906, -31.37298583984375, -29.93337059020996, -28.493755340576172, -27.05413818359375, -25.61452293395996, -24.174907684326172, -22.73529052734375, -21.29567527770996, -19.856060028076172, -18.416444778442383, -16.976829528808594, -15.537212371826172, -14.097597122192383, -12.657981872558594, -11.218365669250488, -9.778749465942383, -8.339130401611328, -6.899514675140381, -5.459898948669434, -4.020283222198486, -2.580667495727539, -1.1410517692565918, 0.29856395721435547, 1.738180160522461, 3.17779541015625, 4.617411136627197, 6.0570268630981445, 7.496642589569092, 8.936258316040039, 10.375873565673828, 11.815489768981934, 13.255105972290039, 14.694721221923828, 16.134336471557617, 17.573951721191406, 19.013568878173828, 20.453184127807617, 21.892799377441406, 23.332416534423828, 24.772031784057617, 26.211647033691406, 27.651262283325195, 29.090877532958984, 30.530494689941406, 31.970109939575195, 33.409725189208984, 34.849342346191406, 36.28895568847656, 37.728572845458984]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 0.0, 1.0, 5.0, 4.0, 4.0, 5.0, 1.0, 6.0, 4.0, 4.0, 1.0, 10.0, 4.0, 5.0, 5.0, 4.0, 5.0, 5.0, 6.0, 4.0, 3.0, 4.0, 0.0, 5.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.792640686035156, -45.144046783447266, -42.495452880859375, -39.84686279296875, -37.19826889038086, -34.54967498779297, -31.90108299255371, -29.252490997314453, -26.603897094726562, -23.955303192138672, -21.306711196899414, -18.658119201660156, -16.009525299072266, -13.360932350158691, -10.712339401245117, -8.06374740600586, -5.415153503417969, -2.7665605545043945, -0.11796760559082031, 2.530625343322754, 5.179218292236328, 7.827811241149902, 10.476404190063477, 13.124996185302734, 15.773590087890625, 18.422183990478516, 21.070775985717773, 23.71936798095703, 26.367961883544922, 29.016555786132812, 31.66514778137207, 34.31373977661133, 36.96234130859375, 39.61093521118164, 42.25952911376953, 44.908119201660156, 47.55671310424805, 50.20530700683594, 52.85389709472656, 55.50249099731445, 58.151084899902344, 60.799678802490234, 63.448272705078125, 66.09686279296875, 68.74545288085938, 71.39405059814453, 74.04264068603516, 76.69123840332031, 79.33982849121094, 81.98841857910156, 84.63701629638672, 87.28560638427734, 89.9342041015625, 92.58279418945312, 95.23138427734375, 97.87997436523438, 100.52857208251953, 103.17716217041016, 105.82575988769531, 108.47434997558594, 111.12294006347656, 113.77153778076172, 116.42012786865234, 119.0687255859375, 121.71731567382812]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 6.0, 1.0, 4.0, 4.0, 4.0, 4.0, 8.0, 10.0, 13.0, 9.0, 17.0, 23.0, 26.0, 35.0, 36.0, 52.0, 71.0, 109.0, 147.0, 202.0, 280.0, 464.0, 703.0, 1184.0, 1978.0, 3248.0, 5947.0, 11949.0, 24309.0, 51950.0, 108293.0, 144897.0, 86700.0, 39839.0, 19073.0, 9605.0, 5069.0, 2924.0, 1693.0, 1109.0, 649.0, 517.0, 320.0, 207.0, 158.0, 125.0, 78.0, 60.0, 41.0, 39.0, 31.0, 21.0, 8.0, 5.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0], "bins": [-28.15625, -27.359375, -26.5625, -25.765625, -24.96875, -24.171875, -23.375, -22.578125, -21.78125, -20.984375, -20.1875, -19.390625, -18.59375, -17.796875, -17.0, -16.203125, -15.40625, -14.609375, -13.8125, -13.015625, -12.21875, -11.421875, -10.625, -9.828125, -9.03125, -8.234375, -7.4375, -6.640625, -5.84375, -5.046875, -4.25, -3.453125, -2.65625, -1.859375, -1.0625, -0.265625, 0.53125, 1.328125, 2.125, 2.921875, 3.71875, 4.515625, 5.3125, 6.109375, 6.90625, 7.703125, 8.5, 9.296875, 10.09375, 10.890625, 11.6875, 12.484375, 13.28125, 14.078125, 14.875, 15.671875, 16.46875, 17.265625, 18.0625, 18.859375, 19.65625, 20.453125, 21.25, 22.046875, 22.84375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 1.0, 6.0, 8.0, 10.0, 16.0, 16.0, 17.0, 21.0, 28.0, 54.0, 51.0, 71.0, 90.0, 71.0, 73.0, 80.0, 62.0, 59.0, 62.0, 49.0, 30.0, 35.0, 19.0, 20.0, 12.0, 8.0, 13.0, 5.0, 6.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.667236328125, -4.48291015625, -4.298583984375, -4.1142578125, -3.929931640625, -3.74560546875, -3.561279296875, -3.376953125, -3.192626953125, -3.00830078125, -2.823974609375, -2.6396484375, -2.455322265625, -2.27099609375, -2.086669921875, -1.90234375, -1.718017578125, -1.53369140625, -1.349365234375, -1.1650390625, -0.980712890625, -0.79638671875, -0.612060546875, -0.427734375, -0.243408203125, -0.05908203125, 0.125244140625, 0.3095703125, 0.493896484375, 0.67822265625, 0.862548828125, 1.046875, 1.231201171875, 1.41552734375, 1.599853515625, 1.7841796875, 1.968505859375, 2.15283203125, 2.337158203125, 2.521484375, 2.705810546875, 2.89013671875, 3.074462890625, 3.2587890625, 3.443115234375, 3.62744140625, 3.811767578125, 3.99609375, 4.180419921875, 4.36474609375, 4.549072265625, 4.7333984375, 4.917724609375, 5.10205078125, 5.286376953125, 5.470703125, 5.655029296875, 5.83935546875, 6.023681640625, 6.2080078125, 6.392333984375, 6.57666015625, 6.760986328125, 6.9453125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 3.0, 10.0, 19.0, 24.0, 65.0, 97.0, 116.0, 65.0, 32.0, 20.0, 9.0, 7.0, 8.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-73.39955139160156, -71.52816772460938, -69.65678405761719, -67.78539276123047, -65.91400909423828, -64.0426254272461, -62.171241760253906, -60.29985427856445, -58.428466796875, -56.55708312988281, -54.68569564819336, -52.81431198120117, -50.94292449951172, -49.07154083251953, -47.200157165527344, -45.32876968383789, -43.4573860168457, -41.586002349853516, -39.71461486816406, -37.843231201171875, -35.97184371948242, -34.100460052490234, -32.22907257080078, -30.357688903808594, -28.486303329467773, -26.614917755126953, -24.743532180786133, -22.872146606445312, -21.000762939453125, -19.129375457763672, -17.257991790771484, -15.386606216430664, -13.515220642089844, -11.643835067749023, -9.772449493408203, -7.901064872741699, -6.029679298400879, -4.158293724060059, -2.2869091033935547, -0.4155235290527344, 1.455862045288086, 3.327247381210327, 5.198632717132568, 7.0700178146362305, 8.94140338897705, 10.812788963317871, 12.684173583984375, 14.555559158325195, 16.426944732666016, 18.298330307006836, 20.169715881347656, 22.041099548339844, 23.912487030029297, 25.783870697021484, 27.655256271362305, 29.526641845703125, 31.398027420043945, 33.269412994384766, 35.14079666137695, 37.012184143066406, 38.883567810058594, 40.75495529174805, 42.626338958740234, 44.49772644042969, 46.369110107421875]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 3.0, 12.0, 7.0, 4.0, 14.0, 21.0, 15.0, 30.0, 42.0, 47.0, 51.0, 48.0, 32.0, 28.0, 20.0, 31.0, 19.0, 8.0, 6.0, 5.0, 5.0, 3.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.70725440979004, -21.948942184448242, -21.190629959106445, -20.43231773376465, -19.67400550842285, -18.915693283081055, -18.157379150390625, -17.399066925048828, -16.64075469970703, -15.882442474365234, -15.124130249023438, -14.36581802368164, -13.607505798339844, -12.849193572998047, -12.090880393981934, -11.332568168640137, -10.574256896972656, -9.81594467163086, -9.057632446289062, -8.299320220947266, -7.5410075187683105, -6.782695293426514, -6.024382591247559, -5.266070365905762, -4.507758140563965, -3.749445915222168, -2.991133451461792, -2.232820987701416, -1.4745087623596191, -0.7161965370178223, 0.04211616516113281, 0.8004283905029297, 1.5587406158447266, 2.3170528411865234, 3.0753653049468994, 3.8336777687072754, 4.591989994049072, 5.350302219390869, 6.108614921569824, 6.866927146911621, 7.625239372253418, 8.383551597595215, 9.141863822937012, 9.900177001953125, 10.658489227294922, 11.416801452636719, 12.175113677978516, 12.933425903320312, 13.69173812866211, 14.450050354003906, 15.208362579345703, 15.9666748046875, 16.724987030029297, 17.483299255371094, 18.24161148071289, 18.999923706054688, 19.758235931396484, 20.51654815673828, 21.274860382080078, 22.033172607421875, 22.791484832763672, 23.54979705810547, 24.308109283447266, 25.066421508789062, 25.824735641479492]}, "eval/loss": 1.837830901145935, "eval/wer": 0.2812177707259024, "eval/runtime": 833.3263, "eval/samples_per_second": 3.17, "eval/steps_per_second": 0.397} \ No newline at end of file +{"train/loss": 0.1162, "train/learning_rate": 2.396080760095012e-06, "train/epoch": 18.5, "train/global_step": 16500, "_runtime": 100541, "_timestamp": 1647475083, "_step": 16510, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 5.0, 7.0, 13.0, 13.0, 14.0, 16.0, 24.0, 18.0, 27.0, 22.0, 32.0, 34.0, 39.0, 42.0, 38.0, 50.0, 41.0, 35.0, 45.0, 52.0, 49.0, 63.0, 53.0, 49.0, 31.0, 29.0, 28.0, 28.0, 19.0, 22.0, 11.0, 13.0, 7.0, 10.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.658233642578125, -22.21038818359375, -21.762540817260742, -21.314695358276367, -20.86684799194336, -20.419002532958984, -19.971155166625977, -19.5233097076416, -19.075462341308594, -18.62761688232422, -18.17976951599121, -17.731924057006836, -17.284076690673828, -16.836231231689453, -16.388383865356445, -15.940537452697754, -15.492691040039062, -15.044844627380371, -14.59699821472168, -14.149151802062988, -13.701305389404297, -13.253458976745605, -12.805612564086914, -12.357766151428223, -11.909920692443848, -11.462074279785156, -11.014227867126465, -10.566381454467773, -10.118535041809082, -9.67068862915039, -9.2228422164917, -8.774995803833008, -8.3271484375, -7.879302024841309, -7.431455612182617, -6.983609199523926, -6.535762786865234, -6.087916374206543, -5.640069961547852, -5.19222354888916, -4.744378089904785, -4.296531677246094, -3.8486852645874023, -3.400838851928711, -2.9529924392700195, -2.5051462650299072, -2.057299852371216, -1.6094534397125244, -1.161606788635254, -0.7137603759765625, -0.26591402292251587, 0.18193233013153076, 0.6297787427902222, 1.077625036239624, 1.5254714488983154, 1.9733178615570068, 2.4211642742156982, 2.8690106868743896, 3.316857099533081, 3.7647032737731934, 4.212549686431885, 4.660396099090576, 5.108242511749268, 5.556088924407959, 6.00393533706665]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 7.0, 7.0, 12.0, 8.0, 7.0, 10.0, 10.0, 20.0, 22.0, 27.0, 22.0, 36.0, 28.0, 40.0, 23.0, 43.0, 36.0, 40.0, 39.0, 40.0, 48.0, 36.0, 49.0, 35.0, 33.0, 41.0, 34.0, 25.0, 38.0, 39.0, 23.0, 17.0, 28.0, 7.0, 15.0, 11.0, 10.0, 9.0, 12.0, 3.0, 4.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.937238693237305, -10.542332649230957, -10.147427558898926, -9.752521514892578, -9.357616424560547, -8.9627103805542, -8.567804336547852, -8.17289924621582, -7.777993202209473, -7.383087635040283, -6.988182067871094, -6.593276023864746, -6.198370456695557, -5.803464889526367, -5.4085588455200195, -5.01365327835083, -4.618747711181641, -4.223842144012451, -3.8289363384246826, -3.434030532836914, -3.0391249656677246, -2.644219398498535, -2.2493135929107666, -1.854407787322998, -1.4595022201538086, -1.0645965337753296, -0.6696908473968506, -0.2747851610183716, 0.12012052536010742, 0.5150262117385864, 0.9099318981170654, 1.304837703704834, 1.699742317199707, 2.0946478843688965, 2.489553689956665, 2.8844594955444336, 3.279365062713623, 3.6742706298828125, 4.06917667388916, 4.46408224105835, 4.858987808227539, 5.2538933753967285, 5.648798942565918, 6.043704986572266, 6.438610553741455, 6.8335161209106445, 7.228422164916992, 7.623327732086182, 8.018233299255371, 8.413139343261719, 8.80804443359375, 9.202950477600098, 9.597856521606445, 9.992761611938477, 10.387667655944824, 10.782573699951172, 11.177478790283203, 11.57238483428955, 11.967289924621582, 12.36219596862793, 12.757101058959961, 13.152007102966309, 13.546913146972656, 13.941818237304688, 14.336724281311035]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 16.0, 27.0, 40.0, 75.0, 105.0, 241.0, 342.0, 591.0, 1024.0, 1733.0, 2988.0, 4942.0, 8143.0, 13582.0, 22324.0, 37715.0, 63581.0, 108695.0, 185973.0, 320843.0, 535980.0, 767567.0, 776799.0, 548884.0, 328997.0, 190928.0, 111553.0, 65327.0, 38960.0, 23011.0, 13550.0, 8066.0, 4879.0, 2877.0, 1628.0, 953.0, 583.0, 347.0, 172.0, 108.0, 65.0, 35.0, 16.0, 8.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.03125, -26.212646484375, -25.39404296875, -24.575439453125, -23.7568359375, -22.938232421875, -22.11962890625, -21.301025390625, -20.482421875, -19.663818359375, -18.84521484375, -18.026611328125, -17.2080078125, -16.389404296875, -15.57080078125, -14.752197265625, -13.93359375, -13.114990234375, -12.29638671875, -11.477783203125, -10.6591796875, -9.840576171875, -9.02197265625, -8.203369140625, -7.384765625, -6.566162109375, -5.74755859375, -4.928955078125, -4.1103515625, -3.291748046875, -2.47314453125, -1.654541015625, -0.8359375, -0.017333984375, 0.80126953125, 1.619873046875, 2.4384765625, 3.257080078125, 4.07568359375, 4.894287109375, 5.712890625, 6.531494140625, 7.35009765625, 8.168701171875, 8.9873046875, 9.805908203125, 10.62451171875, 11.443115234375, 12.26171875, 13.080322265625, 13.89892578125, 14.717529296875, 15.5361328125, 16.354736328125, 17.17333984375, 17.991943359375, 18.810546875, 19.629150390625, 20.44775390625, 21.266357421875, 22.0849609375, 22.903564453125, 23.72216796875, 24.540771484375, 25.359375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 10.0, 9.0, 5.0, 13.0, 13.0, 14.0, 25.0, 18.0, 20.0, 29.0, 26.0, 34.0, 26.0, 36.0, 31.0, 35.0, 55.0, 31.0, 37.0, 41.0, 42.0, 39.0, 41.0, 30.0, 38.0, 34.0, 32.0, 29.0, 32.0, 30.0, 29.0, 21.0, 27.0, 13.0, 11.0, 10.0, 8.0, 9.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.9453125, -13.50341796875, -13.0615234375, -12.61962890625, -12.177734375, -11.73583984375, -11.2939453125, -10.85205078125, -10.41015625, -9.96826171875, -9.5263671875, -9.08447265625, -8.642578125, -8.20068359375, -7.7587890625, -7.31689453125, -6.875, -6.43310546875, -5.9912109375, -5.54931640625, -5.107421875, -4.66552734375, -4.2236328125, -3.78173828125, -3.33984375, -2.89794921875, -2.4560546875, -2.01416015625, -1.572265625, -1.13037109375, -0.6884765625, -0.24658203125, 0.1953125, 0.63720703125, 1.0791015625, 1.52099609375, 1.962890625, 2.40478515625, 2.8466796875, 3.28857421875, 3.73046875, 4.17236328125, 4.6142578125, 5.05615234375, 5.498046875, 5.93994140625, 6.3818359375, 6.82373046875, 7.265625, 7.70751953125, 8.1494140625, 8.59130859375, 9.033203125, 9.47509765625, 9.9169921875, 10.35888671875, 10.80078125, 11.24267578125, 11.6845703125, 12.12646484375, 12.568359375, 13.01025390625, 13.4521484375, 13.89404296875, 14.3359375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 18.0, 19.0, 34.0, 44.0, 62.0, 103.0, 178.0, 257.0, 453.0, 740.0, 1197.0, 1903.0, 3084.0, 5115.0, 8553.0, 13968.0, 23589.0, 39481.0, 65885.0, 110372.0, 183649.0, 295675.0, 451137.0, 617613.0, 685910.0, 585661.0, 417225.0, 268178.0, 165987.0, 99795.0, 59373.0, 35570.0, 21445.0, 12669.0, 7592.0, 4454.0, 2816.0, 1727.0, 1038.0, 632.0, 412.0, 227.0, 171.0, 91.0, 66.0, 40.0, 21.0, 24.0, 10.0, 8.0, 7.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-20.390625, -19.76123046875, -19.1318359375, -18.50244140625, -17.873046875, -17.24365234375, -16.6142578125, -15.98486328125, -15.35546875, -14.72607421875, -14.0966796875, -13.46728515625, -12.837890625, -12.20849609375, -11.5791015625, -10.94970703125, -10.3203125, -9.69091796875, -9.0615234375, -8.43212890625, -7.802734375, -7.17333984375, -6.5439453125, -5.91455078125, -5.28515625, -4.65576171875, -4.0263671875, -3.39697265625, -2.767578125, -2.13818359375, -1.5087890625, -0.87939453125, -0.25, 0.37939453125, 1.0087890625, 1.63818359375, 2.267578125, 2.89697265625, 3.5263671875, 4.15576171875, 4.78515625, 5.41455078125, 6.0439453125, 6.67333984375, 7.302734375, 7.93212890625, 8.5615234375, 9.19091796875, 9.8203125, 10.44970703125, 11.0791015625, 11.70849609375, 12.337890625, 12.96728515625, 13.5966796875, 14.22607421875, 14.85546875, 15.48486328125, 16.1142578125, 16.74365234375, 17.373046875, 18.00244140625, 18.6318359375, 19.26123046875, 19.890625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 10.0, 6.0, 2.0, 10.0, 13.0, 16.0, 17.0, 24.0, 33.0, 37.0, 55.0, 60.0, 68.0, 77.0, 102.0, 92.0, 135.0, 159.0, 152.0, 156.0, 184.0, 223.0, 237.0, 213.0, 245.0, 223.0, 227.0, 198.0, 161.0, 126.0, 119.0, 121.0, 90.0, 72.0, 75.0, 74.0, 53.0, 49.0, 44.0, 26.0, 20.0, 16.0, 16.0, 13.0, 7.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.68359375, -7.44696044921875, -7.2103271484375, -6.97369384765625, -6.737060546875, -6.50042724609375, -6.2637939453125, -6.02716064453125, -5.79052734375, -5.55389404296875, -5.3172607421875, -5.08062744140625, -4.843994140625, -4.60736083984375, -4.3707275390625, -4.13409423828125, -3.8974609375, -3.66082763671875, -3.4241943359375, -3.18756103515625, -2.950927734375, -2.71429443359375, -2.4776611328125, -2.24102783203125, -2.00439453125, -1.76776123046875, -1.5311279296875, -1.29449462890625, -1.057861328125, -0.82122802734375, -0.5845947265625, -0.34796142578125, -0.111328125, 0.12530517578125, 0.3619384765625, 0.59857177734375, 0.835205078125, 1.07183837890625, 1.3084716796875, 1.54510498046875, 1.78173828125, 2.01837158203125, 2.2550048828125, 2.49163818359375, 2.728271484375, 2.96490478515625, 3.2015380859375, 3.43817138671875, 3.6748046875, 3.91143798828125, 4.1480712890625, 4.38470458984375, 4.621337890625, 4.85797119140625, 5.0946044921875, 5.33123779296875, 5.56787109375, 5.80450439453125, 6.0411376953125, 6.27777099609375, 6.514404296875, 6.75103759765625, 6.9876708984375, 7.22430419921875, 7.4609375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 3.0, 11.0, 16.0, 10.0, 17.0, 14.0, 11.0, 17.0, 22.0, 33.0, 24.0, 40.0, 42.0, 52.0, 48.0, 45.0, 48.0, 56.0, 48.0, 58.0, 40.0, 54.0, 42.0, 32.0, 38.0, 30.0, 23.0, 24.0, 18.0, 13.0, 11.0, 13.0, 15.0, 2.0, 10.0, 6.0, 1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0], "bins": [-21.853532791137695, -21.262256622314453, -20.67098045349121, -20.07970428466797, -19.488426208496094, -18.89715003967285, -18.30587387084961, -17.714597702026367, -17.123321533203125, -16.532045364379883, -15.94076919555664, -15.349492073059082, -14.75821590423584, -14.166939735412598, -13.575662612915039, -12.984386444091797, -12.393110275268555, -11.801834106445312, -11.21055793762207, -10.619280815124512, -10.02800464630127, -9.436728477478027, -8.845451354980469, -8.254175186157227, -7.662899017333984, -7.071622848510742, -6.480346202850342, -5.889069557189941, -5.297793388366699, -4.706517219543457, -4.115240573883057, -3.5239639282226562, -2.9326858520507812, -2.34140944480896, -1.7501330375671387, -1.1588566303253174, -0.5675802230834961, 0.023696184158325195, 0.6149725914001465, 1.2062492370605469, 1.797525405883789, 2.3888018131256104, 2.9800782203674316, 3.571354627609253, 4.162631034851074, 4.753907203674316, 5.345183849334717, 5.936460494995117, 6.527736663818359, 7.119012832641602, 7.710289478302002, 8.301566123962402, 8.892842292785645, 9.484118461608887, 10.075395584106445, 10.666671752929688, 11.25794792175293, 11.849224090576172, 12.440500259399414, 13.031777381896973, 13.623053550720215, 14.214329719543457, 14.805606842041016, 15.396883010864258, 15.9881591796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 7.0, 6.0, 4.0, 9.0, 16.0, 15.0, 22.0, 22.0, 22.0, 29.0, 34.0, 34.0, 41.0, 39.0, 39.0, 68.0, 43.0, 45.0, 40.0, 36.0, 43.0, 50.0, 42.0, 24.0, 45.0, 40.0, 36.0, 25.0, 26.0, 25.0, 22.0, 18.0, 12.0, 7.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.031862258911133, -19.448139190673828, -18.864416122436523, -18.28069305419922, -17.696971893310547, -17.113248825073242, -16.529525756835938, -15.945802688598633, -15.362079620361328, -14.778356552124023, -14.194633483886719, -13.61091136932373, -13.027188301086426, -12.443465232849121, -11.859743118286133, -11.276020050048828, -10.692296981811523, -10.108573913574219, -9.524850845336914, -8.941128730773926, -8.357405662536621, -7.773682594299316, -7.18996000289917, -6.606237411499023, -6.022514343261719, -5.438791275024414, -4.855068683624268, -4.271346092224121, -3.6876230239868164, -3.103900194168091, -2.5201773643493652, -1.9364547729492188, -1.352731704711914, -0.7690088748931885, -0.1852860450744629, 0.3984367847442627, 0.9821596145629883, 1.5658824443817139, 2.1496052742004395, 2.733327865600586, 3.3170509338378906, 3.900773763656616, 4.484496593475342, 5.068219184875488, 5.651942253112793, 6.235665321350098, 6.819387912750244, 7.403110504150391, 7.986833572387695, 8.570556640625, 9.154279708862305, 9.738001823425293, 10.321724891662598, 10.905447959899902, 11.48917007446289, 12.072893142700195, 12.6566162109375, 13.240339279174805, 13.82406234741211, 14.407784461975098, 14.991507530212402, 15.575230598449707, 16.158952713012695, 16.74267578125, 17.326398849487305]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 15.0, 22.0, 26.0, 45.0, 48.0, 90.0, 141.0, 209.0, 347.0, 511.0, 838.0, 1243.0, 1891.0, 2847.0, 4529.0, 7163.0, 11241.0, 18091.0, 29620.0, 48936.0, 81046.0, 127757.0, 172123.0, 176952.0, 136577.0, 87651.0, 53496.0, 32030.0, 19619.0, 12188.0, 7591.0, 4799.0, 3084.0, 2051.0, 1308.0, 812.0, 553.0, 368.0, 234.0, 155.0, 99.0, 66.0, 52.0, 30.0, 21.0, 10.0, 8.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.59375, -8.3172607421875, -8.040771484375, -7.7642822265625, -7.48779296875, -7.2113037109375, -6.934814453125, -6.6583251953125, -6.3818359375, -6.1053466796875, -5.828857421875, -5.5523681640625, -5.27587890625, -4.9993896484375, -4.722900390625, -4.4464111328125, -4.169921875, -3.8934326171875, -3.616943359375, -3.3404541015625, -3.06396484375, -2.7874755859375, -2.510986328125, -2.2344970703125, -1.9580078125, -1.6815185546875, -1.405029296875, -1.1285400390625, -0.85205078125, -0.5755615234375, -0.299072265625, -0.0225830078125, 0.25390625, 0.5303955078125, 0.806884765625, 1.0833740234375, 1.35986328125, 1.6363525390625, 1.912841796875, 2.1893310546875, 2.4658203125, 2.7423095703125, 3.018798828125, 3.2952880859375, 3.57177734375, 3.8482666015625, 4.124755859375, 4.4012451171875, 4.677734375, 4.9542236328125, 5.230712890625, 5.5072021484375, 5.78369140625, 6.0601806640625, 6.336669921875, 6.6131591796875, 6.8896484375, 7.1661376953125, 7.442626953125, 7.7191162109375, 7.99560546875, 8.2720947265625, 8.548583984375, 8.8250732421875, 9.1015625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 3.0, 8.0, 10.0, 16.0, 17.0, 18.0, 22.0, 22.0, 34.0, 32.0, 32.0, 44.0, 41.0, 41.0, 55.0, 54.0, 42.0, 38.0, 40.0, 44.0, 48.0, 39.0, 33.0, 38.0, 45.0, 29.0, 29.0, 28.0, 15.0, 27.0, 18.0, 11.0, 6.0, 9.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.078125, -20.46337890625, -19.8486328125, -19.23388671875, -18.619140625, -18.00439453125, -17.3896484375, -16.77490234375, -16.16015625, -15.54541015625, -14.9306640625, -14.31591796875, -13.701171875, -13.08642578125, -12.4716796875, -11.85693359375, -11.2421875, -10.62744140625, -10.0126953125, -9.39794921875, -8.783203125, -8.16845703125, -7.5537109375, -6.93896484375, -6.32421875, -5.70947265625, -5.0947265625, -4.47998046875, -3.865234375, -3.25048828125, -2.6357421875, -2.02099609375, -1.40625, -0.79150390625, -0.1767578125, 0.43798828125, 1.052734375, 1.66748046875, 2.2822265625, 2.89697265625, 3.51171875, 4.12646484375, 4.7412109375, 5.35595703125, 5.970703125, 6.58544921875, 7.2001953125, 7.81494140625, 8.4296875, 9.04443359375, 9.6591796875, 10.27392578125, 10.888671875, 11.50341796875, 12.1181640625, 12.73291015625, 13.34765625, 13.96240234375, 14.5771484375, 15.19189453125, 15.806640625, 16.42138671875, 17.0361328125, 17.65087890625, 18.265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 5.0, 10.0, 13.0, 18.0, 17.0, 17.0, 30.0, 41.0, 86.0, 117.0, 182.0, 281.0, 408.0, 581.0, 1013.0, 1684.0, 2686.0, 4575.0, 7883.0, 15408.0, 34345.0, 772232.0, 152409.0, 25802.0, 12240.0, 6522.0, 3807.0, 2179.0, 1470.0, 835.0, 571.0, 344.0, 230.0, 161.0, 110.0, 72.0, 46.0, 37.0, 24.0, 15.0, 15.0, 9.0, 1.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.234375, -19.598876953125, -18.96337890625, -18.327880859375, -17.6923828125, -17.056884765625, -16.42138671875, -15.785888671875, -15.150390625, -14.514892578125, -13.87939453125, -13.243896484375, -12.6083984375, -11.972900390625, -11.33740234375, -10.701904296875, -10.06640625, -9.430908203125, -8.79541015625, -8.159912109375, -7.5244140625, -6.888916015625, -6.25341796875, -5.617919921875, -4.982421875, -4.346923828125, -3.71142578125, -3.075927734375, -2.4404296875, -1.804931640625, -1.16943359375, -0.533935546875, 0.1015625, 0.737060546875, 1.37255859375, 2.008056640625, 2.6435546875, 3.279052734375, 3.91455078125, 4.550048828125, 5.185546875, 5.821044921875, 6.45654296875, 7.092041015625, 7.7275390625, 8.363037109375, 8.99853515625, 9.634033203125, 10.26953125, 10.905029296875, 11.54052734375, 12.176025390625, 12.8115234375, 13.447021484375, 14.08251953125, 14.718017578125, 15.353515625, 15.989013671875, 16.62451171875, 17.260009765625, 17.8955078125, 18.531005859375, 19.16650390625, 19.802001953125, 20.4375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 11.0, 8.0, 8.0, 11.0, 15.0, 25.0, 19.0, 25.0, 20.0, 33.0, 36.0, 23.0, 31.0, 35.0, 39.0, 44.0, 39.0, 47.0, 51.0, 45.0, 28.0, 39.0, 38.0, 45.0, 33.0, 42.0, 24.0, 32.0, 20.0, 22.0, 17.0, 15.0, 10.0, 12.0, 9.0, 5.0, 10.0, 4.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3984375, -10.047607421875, -9.69677734375, -9.345947265625, -8.9951171875, -8.644287109375, -8.29345703125, -7.942626953125, -7.591796875, -7.240966796875, -6.89013671875, -6.539306640625, -6.1884765625, -5.837646484375, -5.48681640625, -5.135986328125, -4.78515625, -4.434326171875, -4.08349609375, -3.732666015625, -3.3818359375, -3.031005859375, -2.68017578125, -2.329345703125, -1.978515625, -1.627685546875, -1.27685546875, -0.926025390625, -0.5751953125, -0.224365234375, 0.12646484375, 0.477294921875, 0.828125, 1.178955078125, 1.52978515625, 1.880615234375, 2.2314453125, 2.582275390625, 2.93310546875, 3.283935546875, 3.634765625, 3.985595703125, 4.33642578125, 4.687255859375, 5.0380859375, 5.388916015625, 5.73974609375, 6.090576171875, 6.44140625, 6.792236328125, 7.14306640625, 7.493896484375, 7.8447265625, 8.195556640625, 8.54638671875, 8.897216796875, 9.248046875, 9.598876953125, 9.94970703125, 10.300537109375, 10.6513671875, 11.002197265625, 11.35302734375, 11.703857421875, 12.0546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 6.0, 6.0, 9.0, 13.0, 7.0, 15.0, 21.0, 21.0, 43.0, 63.0, 82.0, 109.0, 148.0, 255.0, 470.0, 881.0, 1911.0, 4782.0, 15182.0, 113771.0, 877510.0, 21996.0, 6358.0, 2371.0, 1062.0, 547.0, 291.0, 194.0, 144.0, 77.0, 52.0, 44.0, 27.0, 21.0, 19.0, 17.0, 9.0, 3.0, 6.0, 3.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.478515625, -2.401397705078125, -2.32427978515625, -2.247161865234375, -2.1700439453125, -2.092926025390625, -2.01580810546875, -1.938690185546875, -1.861572265625, -1.784454345703125, -1.70733642578125, -1.630218505859375, -1.5531005859375, -1.475982666015625, -1.39886474609375, -1.321746826171875, -1.24462890625, -1.167510986328125, -1.09039306640625, -1.013275146484375, -0.9361572265625, -0.859039306640625, -0.78192138671875, -0.704803466796875, -0.627685546875, -0.550567626953125, -0.47344970703125, -0.396331787109375, -0.3192138671875, -0.242095947265625, -0.16497802734375, -0.087860107421875, -0.0107421875, 0.066375732421875, 0.14349365234375, 0.220611572265625, 0.2977294921875, 0.374847412109375, 0.45196533203125, 0.529083251953125, 0.606201171875, 0.683319091796875, 0.76043701171875, 0.837554931640625, 0.9146728515625, 0.991790771484375, 1.06890869140625, 1.146026611328125, 1.22314453125, 1.300262451171875, 1.37738037109375, 1.454498291015625, 1.5316162109375, 1.608734130859375, 1.68585205078125, 1.762969970703125, 1.840087890625, 1.917205810546875, 1.99432373046875, 2.071441650390625, 2.1485595703125, 2.225677490234375, 2.30279541015625, 2.379913330078125, 2.45703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 15.0, 12.0, 12.0, 22.0, 34.0, 28.0, 43.0, 43.0, 63.0, 71.0, 78.0, 89.0, 69.0, 78.0, 74.0, 47.0, 41.0, 32.0, 25.0, 18.0, 20.0, 13.0, 6.0, 13.0, 7.0, 6.0, 5.0, 2.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00010019540786743164, -9.726919233798981e-05, -9.434297680854797e-05, -9.141676127910614e-05, -8.84905457496643e-05, -8.556433022022247e-05, -8.263811469078064e-05, -7.97118991613388e-05, -7.678568363189697e-05, -7.385946810245514e-05, -7.09332525730133e-05, -6.800703704357147e-05, -6.508082151412964e-05, -6.21546059846878e-05, -5.922839045524597e-05, -5.630217492580414e-05, -5.3375959396362305e-05, -5.044974386692047e-05, -4.752352833747864e-05, -4.4597312808036804e-05, -4.167109727859497e-05, -3.874488174915314e-05, -3.5818666219711304e-05, -3.289245069026947e-05, -2.9966235160827637e-05, -2.7040019631385803e-05, -2.411380410194397e-05, -2.1187588572502136e-05, -1.8261373043060303e-05, -1.533515751361847e-05, -1.2408941984176636e-05, -9.482726454734802e-06, -6.556510925292969e-06, -3.6302953958511353e-06, -7.040798664093018e-07, 2.2221356630325317e-06, 5.148351192474365e-06, 8.074566721916199e-06, 1.1000782251358032e-05, 1.3926997780799866e-05, 1.68532133102417e-05, 1.9779428839683533e-05, 2.2705644369125366e-05, 2.56318598985672e-05, 2.8558075428009033e-05, 3.148429095745087e-05, 3.44105064868927e-05, 3.7336722016334534e-05, 4.026293754577637e-05, 4.31891530752182e-05, 4.6115368604660034e-05, 4.904158413410187e-05, 5.19677996635437e-05, 5.4894015192985535e-05, 5.782023072242737e-05, 6.07464462518692e-05, 6.367266178131104e-05, 6.659887731075287e-05, 6.95250928401947e-05, 7.245130836963654e-05, 7.537752389907837e-05, 7.83037394285202e-05, 8.122995495796204e-05, 8.415617048740387e-05, 8.70823860168457e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 6.0, 10.0, 17.0, 28.0, 45.0, 46.0, 72.0, 88.0, 138.0, 242.0, 260.0, 439.0, 716.0, 985.0, 1606.0, 2622.0, 4642.0, 8802.0, 18326.0, 41479.0, 97150.0, 208848.0, 298741.0, 196944.0, 90855.0, 38240.0, 17392.0, 8282.0, 4460.0, 2575.0, 1498.0, 1022.0, 595.0, 426.0, 295.0, 228.0, 117.0, 112.0, 61.0, 50.0, 21.0, 17.0, 18.0, 11.0, 10.0, 6.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.869140625, -1.809722900390625, -1.75030517578125, -1.690887451171875, -1.6314697265625, -1.572052001953125, -1.51263427734375, -1.453216552734375, -1.393798828125, -1.334381103515625, -1.27496337890625, -1.215545654296875, -1.1561279296875, -1.096710205078125, -1.03729248046875, -0.977874755859375, -0.91845703125, -0.859039306640625, -0.79962158203125, -0.740203857421875, -0.6807861328125, -0.621368408203125, -0.56195068359375, -0.502532958984375, -0.443115234375, -0.383697509765625, -0.32427978515625, -0.264862060546875, -0.2054443359375, -0.146026611328125, -0.08660888671875, -0.027191162109375, 0.0322265625, 0.091644287109375, 0.15106201171875, 0.210479736328125, 0.2698974609375, 0.329315185546875, 0.38873291015625, 0.448150634765625, 0.507568359375, 0.566986083984375, 0.62640380859375, 0.685821533203125, 0.7452392578125, 0.804656982421875, 0.86407470703125, 0.923492431640625, 0.98291015625, 1.042327880859375, 1.10174560546875, 1.161163330078125, 1.2205810546875, 1.279998779296875, 1.33941650390625, 1.398834228515625, 1.458251953125, 1.517669677734375, 1.57708740234375, 1.636505126953125, 1.6959228515625, 1.755340576171875, 1.81475830078125, 1.874176025390625, 1.93359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 11.0, 6.0, 12.0, 10.0, 18.0, 32.0, 33.0, 31.0, 56.0, 60.0, 75.0, 79.0, 95.0, 101.0, 74.0, 62.0, 53.0, 56.0, 43.0, 20.0, 24.0, 9.0, 10.0, 10.0, 5.0, 5.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46533203125, -0.44701385498046875, -0.4286956787109375, -0.41037750244140625, -0.392059326171875, -0.37374114990234375, -0.3554229736328125, -0.33710479736328125, -0.31878662109375, -0.30046844482421875, -0.2821502685546875, -0.26383209228515625, -0.245513916015625, -0.22719573974609375, -0.2088775634765625, -0.19055938720703125, -0.1722412109375, -0.15392303466796875, -0.1356048583984375, -0.11728668212890625, -0.098968505859375, -0.08065032958984375, -0.0623321533203125, -0.04401397705078125, -0.02569580078125, -0.00737762451171875, 0.0109405517578125, 0.02925872802734375, 0.047576904296875, 0.06589508056640625, 0.0842132568359375, 0.10253143310546875, 0.120849609375, 0.13916778564453125, 0.1574859619140625, 0.17580413818359375, 0.194122314453125, 0.21244049072265625, 0.2307586669921875, 0.24907684326171875, 0.26739501953125, 0.28571319580078125, 0.3040313720703125, 0.32234954833984375, 0.340667724609375, 0.35898590087890625, 0.3773040771484375, 0.39562225341796875, 0.4139404296875, 0.43225860595703125, 0.4505767822265625, 0.46889495849609375, 0.487213134765625, 0.5055313110351562, 0.5238494873046875, 0.5421676635742188, 0.56048583984375, 0.5788040161132812, 0.5971221923828125, 0.6154403686523438, 0.633758544921875, 0.6520767211914062, 0.6703948974609375, 0.6887130737304688, 0.70703125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 4.0, 14.0, 13.0, 6.0, 14.0, 18.0, 13.0, 22.0, 21.0, 31.0, 34.0, 43.0, 41.0, 47.0, 38.0, 43.0, 50.0, 49.0, 56.0, 49.0, 51.0, 41.0, 43.0, 32.0, 34.0, 25.0, 33.0, 29.0, 15.0, 13.0, 11.0, 11.0, 8.0, 11.0, 2.0, 11.0, 4.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-20.51023292541504, -19.919540405273438, -19.328847885131836, -18.738155364990234, -18.147464752197266, -17.556772232055664, -16.966079711914062, -16.37538719177246, -15.78469467163086, -15.194002151489258, -14.603309631347656, -14.012618064880371, -13.42192554473877, -12.831233024597168, -12.240541458129883, -11.649848937988281, -11.05915641784668, -10.468463897705078, -9.877771377563477, -9.287079811096191, -8.69638729095459, -8.105694770812988, -7.515002727508545, -6.924310684204102, -6.3336181640625, -5.742925643920898, -5.152233600616455, -4.561541557312012, -3.97084903717041, -3.3801567554473877, -2.7894644737243652, -2.198772430419922, -1.6080780029296875, -1.017385721206665, -0.4266934394836426, 0.16399884223937988, 0.7546911239624023, 1.3453834056854248, 1.9360756874084473, 2.5267677307128906, 3.117460250854492, 3.7081525325775146, 4.298844814300537, 4.8895368576049805, 5.480229377746582, 6.070921897888184, 6.661613941192627, 7.25230598449707, 7.842998504638672, 8.433691024780273, 9.024383544921875, 9.61507511138916, 10.205767631530762, 10.796460151672363, 11.387151718139648, 11.97784423828125, 12.568536758422852, 13.159229278564453, 13.749921798706055, 14.34061336517334, 14.931305885314941, 15.521998405456543, 16.112689971923828, 16.70338249206543, 17.29407501220703]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 6.0, 3.0, 9.0, 10.0, 13.0, 22.0, 16.0, 22.0, 25.0, 33.0, 30.0, 32.0, 43.0, 47.0, 48.0, 51.0, 52.0, 39.0, 44.0, 36.0, 52.0, 49.0, 29.0, 35.0, 44.0, 37.0, 32.0, 28.0, 29.0, 18.0, 25.0, 11.0, 11.0, 10.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.121078491210938, -20.501134872436523, -19.881189346313477, -19.261245727539062, -18.641300201416016, -18.0213565826416, -17.401411056518555, -16.78146743774414, -16.161521911621094, -15.541577339172363, -14.921632766723633, -14.301688194274902, -13.681743621826172, -13.061799049377441, -12.441854476928711, -11.821910858154297, -11.201966285705566, -10.582021713256836, -9.962077140808105, -9.342132568359375, -8.722187995910645, -8.102243423461914, -7.482299327850342, -6.862354755401611, -6.242410182952881, -5.62246561050415, -5.00252103805542, -4.382576942443848, -3.762632131576538, -3.1426875591278076, -2.5227432250976562, -1.9027986526489258, -1.2828540802001953, -0.6629095673561096, -0.042965054512023926, 0.576979398727417, 1.1969239711761475, 1.816868543624878, 2.4368128776550293, 3.0567574501037598, 3.6767020225524902, 4.296646595001221, 4.916591167449951, 5.536535263061523, 6.156479835510254, 6.776424407958984, 7.396368980407715, 8.016313552856445, 8.636258125305176, 9.256202697753906, 9.876147270202637, 10.496091842651367, 11.116036415100098, 11.735980987548828, 12.355924606323242, 12.975870132446289, 13.595813751220703, 14.215758323669434, 14.835702896118164, 15.455647468566895, 16.075592041015625, 16.69553565979004, 17.315481185913086, 17.9354248046875, 18.555370330810547]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 6.0, 10.0, 18.0, 21.0, 19.0, 56.0, 58.0, 84.0, 153.0, 232.0, 315.0, 507.0, 809.0, 1224.0, 1860.0, 3126.0, 4933.0, 8125.0, 13310.0, 22242.0, 35294.0, 56007.0, 82729.0, 111818.0, 134880.0, 142595.0, 128090.0, 101655.0, 72562.0, 47660.0, 30061.0, 18635.0, 11205.0, 6797.0, 4191.0, 2675.0, 1712.0, 965.0, 676.0, 432.0, 289.0, 174.0, 111.0, 83.0, 50.0, 28.0, 19.0, 14.0, 15.0, 8.0, 1.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.578125, -19.921142578125, -19.26416015625, -18.607177734375, -17.9501953125, -17.293212890625, -16.63623046875, -15.979248046875, -15.322265625, -14.665283203125, -14.00830078125, -13.351318359375, -12.6943359375, -12.037353515625, -11.38037109375, -10.723388671875, -10.06640625, -9.409423828125, -8.75244140625, -8.095458984375, -7.4384765625, -6.781494140625, -6.12451171875, -5.467529296875, -4.810546875, -4.153564453125, -3.49658203125, -2.839599609375, -2.1826171875, -1.525634765625, -0.86865234375, -0.211669921875, 0.4453125, 1.102294921875, 1.75927734375, 2.416259765625, 3.0732421875, 3.730224609375, 4.38720703125, 5.044189453125, 5.701171875, 6.358154296875, 7.01513671875, 7.672119140625, 8.3291015625, 8.986083984375, 9.64306640625, 10.300048828125, 10.95703125, 11.614013671875, 12.27099609375, 12.927978515625, 13.5849609375, 14.241943359375, 14.89892578125, 15.555908203125, 16.212890625, 16.869873046875, 17.52685546875, 18.183837890625, 18.8408203125, 19.497802734375, 20.15478515625, 20.811767578125, 21.46875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 6.0, 7.0, 5.0, 13.0, 13.0, 18.0, 23.0, 20.0, 20.0, 37.0, 29.0, 36.0, 45.0, 38.0, 47.0, 59.0, 51.0, 36.0, 43.0, 39.0, 48.0, 47.0, 33.0, 36.0, 44.0, 41.0, 27.0, 23.0, 27.0, 23.0, 19.0, 16.0, 11.0, 9.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.515625, -19.912353515625, -19.30908203125, -18.705810546875, -18.1025390625, -17.499267578125, -16.89599609375, -16.292724609375, -15.689453125, -15.086181640625, -14.48291015625, -13.879638671875, -13.2763671875, -12.673095703125, -12.06982421875, -11.466552734375, -10.86328125, -10.260009765625, -9.65673828125, -9.053466796875, -8.4501953125, -7.846923828125, -7.24365234375, -6.640380859375, -6.037109375, -5.433837890625, -4.83056640625, -4.227294921875, -3.6240234375, -3.020751953125, -2.41748046875, -1.814208984375, -1.2109375, -0.607666015625, -0.00439453125, 0.598876953125, 1.2021484375, 1.805419921875, 2.40869140625, 3.011962890625, 3.615234375, 4.218505859375, 4.82177734375, 5.425048828125, 6.0283203125, 6.631591796875, 7.23486328125, 7.838134765625, 8.44140625, 9.044677734375, 9.64794921875, 10.251220703125, 10.8544921875, 11.457763671875, 12.06103515625, 12.664306640625, 13.267578125, 13.870849609375, 14.47412109375, 15.077392578125, 15.6806640625, 16.283935546875, 16.88720703125, 17.490478515625, 18.09375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 4.0, 9.0, 23.0, 18.0, 32.0, 48.0, 84.0, 128.0, 203.0, 276.0, 494.0, 765.0, 1184.0, 1936.0, 3232.0, 5568.0, 9548.0, 16760.0, 29738.0, 51739.0, 87075.0, 132070.0, 168528.0, 172393.0, 139316.0, 94008.0, 56871.0, 32555.0, 18262.0, 10408.0, 6029.0, 3543.0, 2111.0, 1338.0, 820.0, 521.0, 356.0, 190.0, 124.0, 88.0, 53.0, 39.0, 26.0, 16.0, 13.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.078125, -26.177978515625, -25.27783203125, -24.377685546875, -23.4775390625, -22.577392578125, -21.67724609375, -20.777099609375, -19.876953125, -18.976806640625, -18.07666015625, -17.176513671875, -16.2763671875, -15.376220703125, -14.47607421875, -13.575927734375, -12.67578125, -11.775634765625, -10.87548828125, -9.975341796875, -9.0751953125, -8.175048828125, -7.27490234375, -6.374755859375, -5.474609375, -4.574462890625, -3.67431640625, -2.774169921875, -1.8740234375, -0.973876953125, -0.07373046875, 0.826416015625, 1.7265625, 2.626708984375, 3.52685546875, 4.427001953125, 5.3271484375, 6.227294921875, 7.12744140625, 8.027587890625, 8.927734375, 9.827880859375, 10.72802734375, 11.628173828125, 12.5283203125, 13.428466796875, 14.32861328125, 15.228759765625, 16.12890625, 17.029052734375, 17.92919921875, 18.829345703125, 19.7294921875, 20.629638671875, 21.52978515625, 22.429931640625, 23.330078125, 24.230224609375, 25.13037109375, 26.030517578125, 26.9306640625, 27.830810546875, 28.73095703125, 29.631103515625, 30.53125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 4.0, 1.0, 7.0, 2.0, 11.0, 2.0, 13.0, 15.0, 11.0, 18.0, 20.0, 18.0, 14.0, 26.0, 27.0, 34.0, 35.0, 38.0, 36.0, 44.0, 45.0, 31.0, 40.0, 41.0, 34.0, 40.0, 35.0, 47.0, 38.0, 36.0, 29.0, 24.0, 25.0, 28.0, 20.0, 19.0, 15.0, 18.0, 15.0, 15.0, 8.0, 6.0, 3.0, 6.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7109375, -8.380615234375, -8.05029296875, -7.719970703125, -7.3896484375, -7.059326171875, -6.72900390625, -6.398681640625, -6.068359375, -5.738037109375, -5.40771484375, -5.077392578125, -4.7470703125, -4.416748046875, -4.08642578125, -3.756103515625, -3.42578125, -3.095458984375, -2.76513671875, -2.434814453125, -2.1044921875, -1.774169921875, -1.44384765625, -1.113525390625, -0.783203125, -0.452880859375, -0.12255859375, 0.207763671875, 0.5380859375, 0.868408203125, 1.19873046875, 1.529052734375, 1.859375, 2.189697265625, 2.52001953125, 2.850341796875, 3.1806640625, 3.510986328125, 3.84130859375, 4.171630859375, 4.501953125, 4.832275390625, 5.16259765625, 5.492919921875, 5.8232421875, 6.153564453125, 6.48388671875, 6.814208984375, 7.14453125, 7.474853515625, 7.80517578125, 8.135498046875, 8.4658203125, 8.796142578125, 9.12646484375, 9.456787109375, 9.787109375, 10.117431640625, 10.44775390625, 10.778076171875, 11.1083984375, 11.438720703125, 11.76904296875, 12.099365234375, 12.4296875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [6.0, 6.0, 6.0, 12.0, 21.0, 25.0, 38.0, 64.0, 72.0, 103.0, 137.0, 196.0, 324.0, 446.0, 621.0, 968.0, 1309.0, 1976.0, 2962.0, 4349.0, 6750.0, 10155.0, 15735.0, 23949.0, 36895.0, 55979.0, 80572.0, 108088.0, 130340.0, 136305.0, 123227.0, 97454.0, 70580.0, 48111.0, 31588.0, 20135.0, 13222.0, 8559.0, 5575.0, 3697.0, 2568.0, 1692.0, 1101.0, 864.0, 558.0, 386.0, 289.0, 170.0, 124.0, 84.0, 64.0, 35.0, 23.0, 13.0, 19.0, 11.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.3125, -4.16534423828125, -4.0181884765625, -3.87103271484375, -3.723876953125, -3.57672119140625, -3.4295654296875, -3.28240966796875, -3.13525390625, -2.98809814453125, -2.8409423828125, -2.69378662109375, -2.546630859375, -2.39947509765625, -2.2523193359375, -2.10516357421875, -1.9580078125, -1.81085205078125, -1.6636962890625, -1.51654052734375, -1.369384765625, -1.22222900390625, -1.0750732421875, -0.92791748046875, -0.78076171875, -0.63360595703125, -0.4864501953125, -0.33929443359375, -0.192138671875, -0.04498291015625, 0.1021728515625, 0.24932861328125, 0.396484375, 0.54364013671875, 0.6907958984375, 0.83795166015625, 0.985107421875, 1.13226318359375, 1.2794189453125, 1.42657470703125, 1.57373046875, 1.72088623046875, 1.8680419921875, 2.01519775390625, 2.162353515625, 2.30950927734375, 2.4566650390625, 2.60382080078125, 2.7509765625, 2.89813232421875, 3.0452880859375, 3.19244384765625, 3.339599609375, 3.48675537109375, 3.6339111328125, 3.78106689453125, 3.92822265625, 4.07537841796875, 4.2225341796875, 4.36968994140625, 4.516845703125, 4.66400146484375, 4.8111572265625, 4.95831298828125, 5.10546875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 8.0, 2.0, 12.0, 8.0, 22.0, 14.0, 20.0, 24.0, 31.0, 43.0, 41.0, 43.0, 43.0, 53.0, 49.0, 50.0, 53.0, 63.0, 53.0, 54.0, 49.0, 39.0, 31.0, 34.0, 30.0, 22.0, 25.0, 15.0, 10.0, 12.0, 5.0, 4.0, 7.0, 5.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00061798095703125, -0.0005995109677314758, -0.0005810409784317017, -0.0005625709891319275, -0.0005441009998321533, -0.0005256310105323792, -0.000507161021232605, -0.0004886910319328308, -0.00047022104263305664, -0.00045175105333328247, -0.0004332810640335083, -0.00041481107473373413, -0.00039634108543395996, -0.0003778710961341858, -0.0003594011068344116, -0.00034093111753463745, -0.0003224611282348633, -0.0003039911389350891, -0.00028552114963531494, -0.00026705116033554077, -0.0002485811710357666, -0.00023011118173599243, -0.00021164119243621826, -0.0001931712031364441, -0.00017470121383666992, -0.00015623122453689575, -0.00013776123523712158, -0.00011929124593734741, -0.00010082125663757324, -8.235126733779907e-05, -6.38812780380249e-05, -4.541128873825073e-05, -2.6941299438476562e-05, -8.471310138702393e-06, 9.998679161071777e-06, 2.8468668460845947e-05, 4.693865776062012e-05, 6.540864706039429e-05, 8.387863636016846e-05, 0.00010234862565994263, 0.0001208186149597168, 0.00013928860425949097, 0.00015775859355926514, 0.0001762285828590393, 0.00019469857215881348, 0.00021316856145858765, 0.00023163855075836182, 0.000250108540058136, 0.00026857852935791016, 0.0002870485186576843, 0.0003055185079574585, 0.00032398849725723267, 0.00034245848655700684, 0.000360928475856781, 0.0003793984651565552, 0.00039786845445632935, 0.0004163384437561035, 0.0004348084330558777, 0.00045327842235565186, 0.000471748411655426, 0.0004902184009552002, 0.0005086883902549744, 0.0005271583795547485, 0.0005456283688545227, 0.0005640983581542969]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 15.0, 25.0, 32.0, 44.0, 71.0, 101.0, 160.0, 248.0, 373.0, 587.0, 914.0, 1346.0, 1995.0, 3249.0, 5051.0, 7831.0, 12122.0, 18975.0, 29749.0, 45453.0, 67500.0, 94879.0, 122283.0, 138508.0, 133624.0, 112476.0, 84316.0, 58314.0, 38401.0, 24856.0, 16118.0, 10337.0, 6660.0, 4204.0, 2699.0, 1786.0, 1185.0, 673.0, 488.0, 321.0, 218.0, 127.0, 85.0, 60.0, 36.0, 17.0, 14.0, 12.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0], "bins": [-5.1171875, -4.9658203125, -4.814453125, -4.6630859375, -4.51171875, -4.3603515625, -4.208984375, -4.0576171875, -3.90625, -3.7548828125, -3.603515625, -3.4521484375, -3.30078125, -3.1494140625, -2.998046875, -2.8466796875, -2.6953125, -2.5439453125, -2.392578125, -2.2412109375, -2.08984375, -1.9384765625, -1.787109375, -1.6357421875, -1.484375, -1.3330078125, -1.181640625, -1.0302734375, -0.87890625, -0.7275390625, -0.576171875, -0.4248046875, -0.2734375, -0.1220703125, 0.029296875, 0.1806640625, 0.33203125, 0.4833984375, 0.634765625, 0.7861328125, 0.9375, 1.0888671875, 1.240234375, 1.3916015625, 1.54296875, 1.6943359375, 1.845703125, 1.9970703125, 2.1484375, 2.2998046875, 2.451171875, 2.6025390625, 2.75390625, 2.9052734375, 3.056640625, 3.2080078125, 3.359375, 3.5107421875, 3.662109375, 3.8134765625, 3.96484375, 4.1162109375, 4.267578125, 4.4189453125, 4.5703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 8.0, 8.0, 9.0, 11.0, 12.0, 21.0, 18.0, 18.0, 27.0, 19.0, 34.0, 25.0, 43.0, 34.0, 56.0, 51.0, 41.0, 36.0, 49.0, 55.0, 34.0, 43.0, 46.0, 42.0, 29.0, 31.0, 26.0, 33.0, 25.0, 22.0, 12.0, 9.0, 16.0, 8.0, 9.0, 7.0, 10.0, 4.0, 3.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.837890625, -1.781646728515625, -1.72540283203125, -1.669158935546875, -1.6129150390625, -1.556671142578125, -1.50042724609375, -1.444183349609375, -1.387939453125, -1.331695556640625, -1.27545166015625, -1.219207763671875, -1.1629638671875, -1.106719970703125, -1.05047607421875, -0.994232177734375, -0.93798828125, -0.881744384765625, -0.82550048828125, -0.769256591796875, -0.7130126953125, -0.656768798828125, -0.60052490234375, -0.544281005859375, -0.488037109375, -0.431793212890625, -0.37554931640625, -0.319305419921875, -0.2630615234375, -0.206817626953125, -0.15057373046875, -0.094329833984375, -0.0380859375, 0.018157958984375, 0.07440185546875, 0.130645751953125, 0.1868896484375, 0.243133544921875, 0.29937744140625, 0.355621337890625, 0.411865234375, 0.468109130859375, 0.52435302734375, 0.580596923828125, 0.6368408203125, 0.693084716796875, 0.74932861328125, 0.805572509765625, 0.86181640625, 0.918060302734375, 0.97430419921875, 1.030548095703125, 1.0867919921875, 1.143035888671875, 1.19927978515625, 1.255523681640625, 1.311767578125, 1.368011474609375, 1.42425537109375, 1.480499267578125, 1.5367431640625, 1.592987060546875, 1.64923095703125, 1.705474853515625, 1.76171875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 6.0, 4.0, 3.0, 9.0, 6.0, 10.0, 12.0, 15.0, 21.0, 22.0, 29.0, 39.0, 33.0, 40.0, 44.0, 58.0, 61.0, 60.0, 58.0, 57.0, 53.0, 49.0, 51.0, 35.0, 38.0, 38.0, 24.0, 24.0, 28.0, 15.0, 13.0, 11.0, 7.0, 10.0, 6.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-24.08905601501465, -23.41295623779297, -22.736854553222656, -22.060752868652344, -21.384653091430664, -20.708553314208984, -20.032451629638672, -19.35634994506836, -18.68025016784668, -18.004150390625, -17.328048706054688, -16.651947021484375, -15.975847244262695, -15.2997465133667, -14.623645782470703, -13.947545051574707, -13.271444320678711, -12.595343589782715, -11.919242858886719, -11.243142127990723, -10.567041397094727, -9.89094066619873, -9.214839935302734, -8.538739204406738, -7.862638473510742, -7.186537742614746, -6.51043701171875, -5.834336280822754, -5.158235549926758, -4.482134819030762, -3.8060340881347656, -3.1299333572387695, -2.4538326263427734, -1.7777318954467773, -1.1016311645507812, -0.42553043365478516, 0.25057029724121094, 0.926671028137207, 1.6027717590332031, 2.278872489929199, 2.9549732208251953, 3.6310739517211914, 4.3071746826171875, 4.983275413513184, 5.65937614440918, 6.335476875305176, 7.011577606201172, 7.687678337097168, 8.363779067993164, 9.03987979888916, 9.715980529785156, 10.392081260681152, 11.068181991577148, 11.744282722473145, 12.42038345336914, 13.096484184265137, 13.772584915161133, 14.448685646057129, 15.124786376953125, 15.800887107849121, 16.476987838745117, 17.153087615966797, 17.82918930053711, 18.505290985107422, 19.1813907623291]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 8.0, 10.0, 9.0, 14.0, 27.0, 23.0, 29.0, 29.0, 46.0, 34.0, 38.0, 52.0, 45.0, 41.0, 39.0, 46.0, 55.0, 52.0, 46.0, 37.0, 35.0, 35.0, 40.0, 44.0, 28.0, 29.0, 22.0, 20.0, 15.0, 10.0, 10.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.734127044677734, -18.0801944732666, -17.426259994506836, -16.772327423095703, -16.118392944335938, -15.464460372924805, -14.810526847839355, -14.156593322753906, -13.502660751342773, -12.848727226257324, -12.194793701171875, -11.540861129760742, -10.886927604675293, -10.232994079589844, -9.579060554504395, -8.925127029418945, -8.271193504333496, -7.617259979248047, -6.963326930999756, -6.309393405914307, -5.655460357666016, -5.001526832580566, -4.347593307495117, -3.693660259246826, -3.039726734161377, -2.385793447494507, -1.7318600416183472, -1.0779266357421875, -0.4239933490753174, 0.22993993759155273, 0.883873462677002, 1.537806510925293, 2.191740036010742, 2.8456733226776123, 3.4996066093444824, 4.153540134429932, 4.807473182678223, 5.461406707763672, 6.115340232849121, 6.769273281097412, 7.423206806182861, 8.077139854431152, 8.731073379516602, 9.38500690460205, 10.0389404296875, 10.692873001098633, 11.346807479858398, 12.000740051269531, 12.65467357635498, 13.30860710144043, 13.962540626525879, 14.616474151611328, 15.270406723022461, 15.92434024810791, 16.57827377319336, 17.232206344604492, 17.886140823364258, 18.54007339477539, 19.194007873535156, 19.84794044494629, 20.501874923706055, 21.155807495117188, 21.809741973876953, 22.463674545288086, 23.11760711669922]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 11.0, 7.0, 20.0, 26.0, 51.0, 87.0, 109.0, 228.0, 392.0, 592.0, 967.0, 1668.0, 2722.0, 4559.0, 7267.0, 11963.0, 19798.0, 32579.0, 54974.0, 91879.0, 155919.0, 265317.0, 430506.0, 620319.0, 717815.0, 636080.0, 450531.0, 278496.0, 165796.0, 96924.0, 57553.0, 34527.0, 21332.0, 12718.0, 8008.0, 4845.0, 2995.0, 1814.0, 1115.0, 683.0, 414.0, 256.0, 161.0, 90.0, 65.0, 41.0, 27.0, 14.0, 10.0, 6.0, 5.0, 1.0, 4.0, 3.0], "bins": [-22.40625, -21.7578125, -21.109375, -20.4609375, -19.8125, -19.1640625, -18.515625, -17.8671875, -17.21875, -16.5703125, -15.921875, -15.2734375, -14.625, -13.9765625, -13.328125, -12.6796875, -12.03125, -11.3828125, -10.734375, -10.0859375, -9.4375, -8.7890625, -8.140625, -7.4921875, -6.84375, -6.1953125, -5.546875, -4.8984375, -4.25, -3.6015625, -2.953125, -2.3046875, -1.65625, -1.0078125, -0.359375, 0.2890625, 0.9375, 1.5859375, 2.234375, 2.8828125, 3.53125, 4.1796875, 4.828125, 5.4765625, 6.125, 6.7734375, 7.421875, 8.0703125, 8.71875, 9.3671875, 10.015625, 10.6640625, 11.3125, 11.9609375, 12.609375, 13.2578125, 13.90625, 14.5546875, 15.203125, 15.8515625, 16.5, 17.1484375, 17.796875, 18.4453125, 19.09375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 8.0, 11.0, 13.0, 28.0, 25.0, 23.0, 27.0, 42.0, 33.0, 47.0, 40.0, 50.0, 47.0, 29.0, 45.0, 48.0, 53.0, 53.0, 38.0, 39.0, 35.0, 37.0, 41.0, 33.0, 33.0, 23.0, 20.0, 14.0, 15.0, 11.0, 7.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.75, -16.17578125, -15.6015625, -15.02734375, -14.453125, -13.87890625, -13.3046875, -12.73046875, -12.15625, -11.58203125, -11.0078125, -10.43359375, -9.859375, -9.28515625, -8.7109375, -8.13671875, -7.5625, -6.98828125, -6.4140625, -5.83984375, -5.265625, -4.69140625, -4.1171875, -3.54296875, -2.96875, -2.39453125, -1.8203125, -1.24609375, -0.671875, -0.09765625, 0.4765625, 1.05078125, 1.625, 2.19921875, 2.7734375, 3.34765625, 3.921875, 4.49609375, 5.0703125, 5.64453125, 6.21875, 6.79296875, 7.3671875, 7.94140625, 8.515625, 9.08984375, 9.6640625, 10.23828125, 10.8125, 11.38671875, 11.9609375, 12.53515625, 13.109375, 13.68359375, 14.2578125, 14.83203125, 15.40625, 15.98046875, 16.5546875, 17.12890625, 17.703125, 18.27734375, 18.8515625, 19.42578125, 20.0]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 9.0, 5.0, 18.0, 18.0, 31.0, 45.0, 81.0, 105.0, 213.0, 269.0, 507.0, 872.0, 1441.0, 2321.0, 4110.0, 7654.0, 13849.0, 25236.0, 46433.0, 86345.0, 161349.0, 294324.0, 501995.0, 734271.0, 802834.0, 630033.0, 395009.0, 222905.0, 120339.0, 64281.0, 34624.0, 18709.0, 10473.0, 5724.0, 3197.0, 1871.0, 1095.0, 648.0, 375.0, 242.0, 151.0, 104.0, 63.0, 29.0, 30.0, 21.0, 8.0, 4.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.21875, -21.45947265625, -20.7001953125, -19.94091796875, -19.181640625, -18.42236328125, -17.6630859375, -16.90380859375, -16.14453125, -15.38525390625, -14.6259765625, -13.86669921875, -13.107421875, -12.34814453125, -11.5888671875, -10.82958984375, -10.0703125, -9.31103515625, -8.5517578125, -7.79248046875, -7.033203125, -6.27392578125, -5.5146484375, -4.75537109375, -3.99609375, -3.23681640625, -2.4775390625, -1.71826171875, -0.958984375, -0.19970703125, 0.5595703125, 1.31884765625, 2.078125, 2.83740234375, 3.5966796875, 4.35595703125, 5.115234375, 5.87451171875, 6.6337890625, 7.39306640625, 8.15234375, 8.91162109375, 9.6708984375, 10.43017578125, 11.189453125, 11.94873046875, 12.7080078125, 13.46728515625, 14.2265625, 14.98583984375, 15.7451171875, 16.50439453125, 17.263671875, 18.02294921875, 18.7822265625, 19.54150390625, 20.30078125, 21.06005859375, 21.8193359375, 22.57861328125, 23.337890625, 24.09716796875, 24.8564453125, 25.61572265625, 26.375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 8.0, 14.0, 14.0, 21.0, 17.0, 29.0, 37.0, 52.0, 51.0, 70.0, 80.0, 106.0, 123.0, 131.0, 170.0, 202.0, 206.0, 233.0, 234.0, 261.0, 236.0, 248.0, 231.0, 200.0, 173.0, 171.0, 135.0, 100.0, 83.0, 83.0, 54.0, 75.0, 59.0, 34.0, 29.0, 24.0, 16.0, 15.0, 12.0, 10.0, 6.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.703125, -8.4404296875, -8.177734375, -7.9150390625, -7.65234375, -7.3896484375, -7.126953125, -6.8642578125, -6.6015625, -6.3388671875, -6.076171875, -5.8134765625, -5.55078125, -5.2880859375, -5.025390625, -4.7626953125, -4.5, -4.2373046875, -3.974609375, -3.7119140625, -3.44921875, -3.1865234375, -2.923828125, -2.6611328125, -2.3984375, -2.1357421875, -1.873046875, -1.6103515625, -1.34765625, -1.0849609375, -0.822265625, -0.5595703125, -0.296875, -0.0341796875, 0.228515625, 0.4912109375, 0.75390625, 1.0166015625, 1.279296875, 1.5419921875, 1.8046875, 2.0673828125, 2.330078125, 2.5927734375, 2.85546875, 3.1181640625, 3.380859375, 3.6435546875, 3.90625, 4.1689453125, 4.431640625, 4.6943359375, 4.95703125, 5.2197265625, 5.482421875, 5.7451171875, 6.0078125, 6.2705078125, 6.533203125, 6.7958984375, 7.05859375, 7.3212890625, 7.583984375, 7.8466796875, 8.109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 3.0, 8.0, 6.0, 19.0, 15.0, 19.0, 20.0, 21.0, 25.0, 36.0, 41.0, 39.0, 50.0, 47.0, 51.0, 53.0, 67.0, 34.0, 48.0, 46.0, 30.0, 43.0, 30.0, 27.0, 25.0, 28.0, 21.0, 21.0, 27.0, 20.0, 12.0, 13.0, 6.0, 7.0, 8.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.556360244750977, -18.9261474609375, -18.295934677124023, -17.665721893310547, -17.03550910949707, -16.405296325683594, -15.775084495544434, -15.144871711730957, -14.51465892791748, -13.884446144104004, -13.254233360290527, -12.62402057647705, -11.99380874633789, -11.363595962524414, -10.733383178710938, -10.103170394897461, -9.472957611083984, -8.842744827270508, -8.212532043457031, -7.582319736480713, -6.952106952667236, -6.32189416885376, -5.691681861877441, -5.061469078063965, -4.431256294250488, -3.8010435104370117, -3.1708309650421143, -2.540618419647217, -1.9104056358337402, -1.2801928520202637, -0.6499803066253662, -0.01976776123046875, 0.6104469299316406, 1.2406595945358276, 1.8708722591400146, 2.501084804534912, 3.1312975883483887, 3.7615103721618652, 4.391722679138184, 5.02193546295166, 5.652148246765137, 6.282361030578613, 6.91257381439209, 7.542786121368408, 8.172998428344727, 8.803211212158203, 9.43342399597168, 10.063636779785156, 10.693849563598633, 11.32406234741211, 11.954275131225586, 12.584487915039062, 13.214700698852539, 13.844913482666016, 14.475125312805176, 15.105338096618652, 15.735550880432129, 16.36576271057129, 16.995975494384766, 17.626188278198242, 18.25640106201172, 18.886613845825195, 19.516826629638672, 20.14703941345215, 20.777252197265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 9.0, 13.0, 9.0, 13.0, 6.0, 20.0, 21.0, 27.0, 29.0, 30.0, 41.0, 34.0, 36.0, 52.0, 39.0, 60.0, 39.0, 41.0, 32.0, 44.0, 45.0, 43.0, 41.0, 36.0, 34.0, 29.0, 35.0, 27.0, 15.0, 17.0, 16.0, 11.0, 15.0, 7.0, 8.0, 8.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.36700439453125, -16.73833656311035, -16.109668731689453, -15.481000900268555, -14.852333068847656, -14.223665237426758, -13.594998359680176, -12.966330528259277, -12.337662696838379, -11.70899486541748, -11.080327033996582, -10.451659202575684, -9.822992324829102, -9.194324493408203, -8.565656661987305, -7.936988830566406, -7.308320999145508, -6.679653167724609, -6.050985336303711, -5.422317981719971, -4.793650150299072, -4.164982318878174, -3.5363147258758545, -2.907647132873535, -2.2789793014526367, -1.6503115892410278, -1.021643877029419, -0.39297616481781006, 0.23569154739379883, 0.8643593788146973, 1.4930269718170166, 2.121694564819336, 2.7503604888916016, 3.3790283203125, 4.007696151733398, 4.636363506317139, 5.265031337738037, 5.8936991691589355, 6.522366523742676, 7.151034355163574, 7.779702186584473, 8.408370018005371, 9.03703784942627, 9.665705680847168, 10.29437255859375, 10.923040390014648, 11.551708221435547, 12.180376052856445, 12.809043884277344, 13.437711715698242, 14.06637954711914, 14.695047378540039, 15.323715209960938, 15.952383041381836, 16.581050872802734, 17.209716796875, 17.83838653564453, 18.46705436706543, 19.095722198486328, 19.724390029907227, 20.353057861328125, 20.981725692749023, 21.610393524169922, 22.239059448242188, 22.867727279663086]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 15.0, 20.0, 32.0, 45.0, 69.0, 88.0, 155.0, 231.0, 343.0, 526.0, 745.0, 1234.0, 1809.0, 2685.0, 4290.0, 6668.0, 10294.0, 16160.0, 25090.0, 39195.0, 59423.0, 86717.0, 115382.0, 136243.0, 139457.0, 121552.0, 92839.0, 65307.0, 43573.0, 28046.0, 17980.0, 11471.0, 7323.0, 4736.0, 2974.0, 2008.0, 1282.0, 873.0, 562.0, 404.0, 231.0, 146.0, 113.0, 79.0, 50.0, 28.0, 18.0, 19.0, 9.0, 6.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.90625, -9.587890625, -9.26953125, -8.951171875, -8.6328125, -8.314453125, -7.99609375, -7.677734375, -7.359375, -7.041015625, -6.72265625, -6.404296875, -6.0859375, -5.767578125, -5.44921875, -5.130859375, -4.8125, -4.494140625, -4.17578125, -3.857421875, -3.5390625, -3.220703125, -2.90234375, -2.583984375, -2.265625, -1.947265625, -1.62890625, -1.310546875, -0.9921875, -0.673828125, -0.35546875, -0.037109375, 0.28125, 0.599609375, 0.91796875, 1.236328125, 1.5546875, 1.873046875, 2.19140625, 2.509765625, 2.828125, 3.146484375, 3.46484375, 3.783203125, 4.1015625, 4.419921875, 4.73828125, 5.056640625, 5.375, 5.693359375, 6.01171875, 6.330078125, 6.6484375, 6.966796875, 7.28515625, 7.603515625, 7.921875, 8.240234375, 8.55859375, 8.876953125, 9.1953125, 9.513671875, 9.83203125, 10.150390625, 10.46875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 10.0, 4.0, 10.0, 10.0, 8.0, 13.0, 18.0, 17.0, 27.0, 20.0, 31.0, 37.0, 38.0, 38.0, 28.0, 51.0, 53.0, 53.0, 43.0, 35.0, 38.0, 42.0, 44.0, 35.0, 45.0, 41.0, 32.0, 31.0, 32.0, 20.0, 17.0, 10.0, 15.0, 15.0, 11.0, 8.0, 9.0, 5.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.84375, -18.17578125, -17.5078125, -16.83984375, -16.171875, -15.50390625, -14.8359375, -14.16796875, -13.5, -12.83203125, -12.1640625, -11.49609375, -10.828125, -10.16015625, -9.4921875, -8.82421875, -8.15625, -7.48828125, -6.8203125, -6.15234375, -5.484375, -4.81640625, -4.1484375, -3.48046875, -2.8125, -2.14453125, -1.4765625, -0.80859375, -0.140625, 0.52734375, 1.1953125, 1.86328125, 2.53125, 3.19921875, 3.8671875, 4.53515625, 5.203125, 5.87109375, 6.5390625, 7.20703125, 7.875, 8.54296875, 9.2109375, 9.87890625, 10.546875, 11.21484375, 11.8828125, 12.55078125, 13.21875, 13.88671875, 14.5546875, 15.22265625, 15.890625, 16.55859375, 17.2265625, 17.89453125, 18.5625, 19.23046875, 19.8984375, 20.56640625, 21.234375, 21.90234375, 22.5703125, 23.23828125, 23.90625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 9.0, 5.0, 11.0, 15.0, 23.0, 24.0, 48.0, 64.0, 106.0, 146.0, 244.0, 316.0, 458.0, 661.0, 921.0, 1361.0, 2029.0, 2961.0, 4400.0, 6965.0, 11065.0, 17233.0, 30391.0, 283939.0, 596326.0, 35195.0, 19606.0, 11785.0, 7439.0, 4827.0, 3192.0, 2169.0, 1398.0, 974.0, 696.0, 455.0, 359.0, 232.0, 168.0, 113.0, 73.0, 47.0, 45.0, 28.0, 12.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-21.65625, -21.021240234375, -20.38623046875, -19.751220703125, -19.1162109375, -18.481201171875, -17.84619140625, -17.211181640625, -16.576171875, -15.941162109375, -15.30615234375, -14.671142578125, -14.0361328125, -13.401123046875, -12.76611328125, -12.131103515625, -11.49609375, -10.861083984375, -10.22607421875, -9.591064453125, -8.9560546875, -8.321044921875, -7.68603515625, -7.051025390625, -6.416015625, -5.781005859375, -5.14599609375, -4.510986328125, -3.8759765625, -3.240966796875, -2.60595703125, -1.970947265625, -1.3359375, -0.700927734375, -0.06591796875, 0.569091796875, 1.2041015625, 1.839111328125, 2.47412109375, 3.109130859375, 3.744140625, 4.379150390625, 5.01416015625, 5.649169921875, 6.2841796875, 6.919189453125, 7.55419921875, 8.189208984375, 8.82421875, 9.459228515625, 10.09423828125, 10.729248046875, 11.3642578125, 11.999267578125, 12.63427734375, 13.269287109375, 13.904296875, 14.539306640625, 15.17431640625, 15.809326171875, 16.4443359375, 17.079345703125, 17.71435546875, 18.349365234375, 18.984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 7.0, 7.0, 2.0, 6.0, 5.0, 4.0, 14.0, 9.0, 15.0, 14.0, 16.0, 29.0, 25.0, 29.0, 30.0, 23.0, 32.0, 45.0, 25.0, 36.0, 34.0, 39.0, 42.0, 42.0, 34.0, 34.0, 44.0, 31.0, 53.0, 30.0, 22.0, 35.0, 26.0, 15.0, 20.0, 20.0, 21.0, 20.0, 10.0, 11.0, 11.0, 9.0, 8.0, 4.0, 5.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.359375, -12.9268798828125, -12.494384765625, -12.0618896484375, -11.62939453125, -11.1968994140625, -10.764404296875, -10.3319091796875, -9.8994140625, -9.4669189453125, -9.034423828125, -8.6019287109375, -8.16943359375, -7.7369384765625, -7.304443359375, -6.8719482421875, -6.439453125, -6.0069580078125, -5.574462890625, -5.1419677734375, -4.70947265625, -4.2769775390625, -3.844482421875, -3.4119873046875, -2.9794921875, -2.5469970703125, -2.114501953125, -1.6820068359375, -1.24951171875, -0.8170166015625, -0.384521484375, 0.0479736328125, 0.48046875, 0.9129638671875, 1.345458984375, 1.7779541015625, 2.21044921875, 2.6429443359375, 3.075439453125, 3.5079345703125, 3.9404296875, 4.3729248046875, 4.805419921875, 5.2379150390625, 5.67041015625, 6.1029052734375, 6.535400390625, 6.9678955078125, 7.400390625, 7.8328857421875, 8.265380859375, 8.6978759765625, 9.13037109375, 9.5628662109375, 9.995361328125, 10.4278564453125, 10.8603515625, 11.2928466796875, 11.725341796875, 12.1578369140625, 12.59033203125, 13.0228271484375, 13.455322265625, 13.8878173828125, 14.3203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 11.0, 11.0, 18.0, 21.0, 32.0, 52.0, 59.0, 114.0, 154.0, 218.0, 353.0, 550.0, 1031.0, 1944.0, 3855.0, 7992.0, 18432.0, 58789.0, 867058.0, 54098.0, 17713.0, 7715.0, 3806.0, 1901.0, 1060.0, 581.0, 334.0, 219.0, 137.0, 101.0, 62.0, 41.0, 17.0, 25.0, 16.0, 10.0, 3.0, 6.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8759765625, -1.821563720703125, -1.76715087890625, -1.712738037109375, -1.6583251953125, -1.603912353515625, -1.54949951171875, -1.495086669921875, -1.440673828125, -1.386260986328125, -1.33184814453125, -1.277435302734375, -1.2230224609375, -1.168609619140625, -1.11419677734375, -1.059783935546875, -1.00537109375, -0.950958251953125, -0.89654541015625, -0.842132568359375, -0.7877197265625, -0.733306884765625, -0.67889404296875, -0.624481201171875, -0.570068359375, -0.515655517578125, -0.46124267578125, -0.406829833984375, -0.3524169921875, -0.298004150390625, -0.24359130859375, -0.189178466796875, -0.134765625, -0.080352783203125, -0.02593994140625, 0.028472900390625, 0.0828857421875, 0.137298583984375, 0.19171142578125, 0.246124267578125, 0.300537109375, 0.354949951171875, 0.40936279296875, 0.463775634765625, 0.5181884765625, 0.572601318359375, 0.62701416015625, 0.681427001953125, 0.73583984375, 0.790252685546875, 0.84466552734375, 0.899078369140625, 0.9534912109375, 1.007904052734375, 1.06231689453125, 1.116729736328125, 1.171142578125, 1.225555419921875, 1.27996826171875, 1.334381103515625, 1.3887939453125, 1.443206787109375, 1.49761962890625, 1.552032470703125, 1.6064453125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 14.0, 6.0, 14.0, 19.0, 18.0, 31.0, 20.0, 45.0, 52.0, 56.0, 75.0, 88.0, 71.0, 71.0, 76.0, 64.0, 59.0, 58.0, 39.0, 26.0, 22.0, 20.0, 13.0, 10.0, 6.0, 4.0, 1.0, 7.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002963542938232422, -0.0002873167395591736, -0.000278279185295105, -0.0002692416310310364, -0.0002602040767669678, -0.00025116652250289917, -0.00024212896823883057, -0.00023309141397476196, -0.00022405385971069336, -0.00021501630544662476, -0.00020597875118255615, -0.00019694119691848755, -0.00018790364265441895, -0.00017886608839035034, -0.00016982853412628174, -0.00016079097986221313, -0.00015175342559814453, -0.00014271587133407593, -0.00013367831707000732, -0.00012464076280593872, -0.00011560320854187012, -0.00010656565427780151, -9.752810001373291e-05, -8.84905457496643e-05, -7.94529914855957e-05, -7.04154372215271e-05, -6.13778829574585e-05, -5.234032869338989e-05, -4.330277442932129e-05, -3.4265220165252686e-05, -2.5227665901184082e-05, -1.619011163711548e-05, -7.152557373046875e-06, 1.8849968910217285e-06, 1.0922551155090332e-05, 1.9960105419158936e-05, 2.899765968322754e-05, 3.803521394729614e-05, 4.7072768211364746e-05, 5.611032247543335e-05, 6.514787673950195e-05, 7.418543100357056e-05, 8.322298526763916e-05, 9.226053953170776e-05, 0.00010129809379577637, 0.00011033564805984497, 0.00011937320232391357, 0.00012841075658798218, 0.00013744831085205078, 0.00014648586511611938, 0.000155523419380188, 0.0001645609736442566, 0.0001735985279083252, 0.0001826360821723938, 0.0001916736364364624, 0.000200711190700531, 0.0002097487449645996, 0.0002187862992286682, 0.00022782385349273682, 0.00023686140775680542, 0.000245898962020874, 0.0002549365162849426, 0.00026397407054901123, 0.00027301162481307983, 0.00028204917907714844]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 12.0, 4.0, 18.0, 14.0, 25.0, 34.0, 54.0, 95.0, 130.0, 171.0, 288.0, 386.0, 609.0, 917.0, 1429.0, 1992.0, 2965.0, 4434.0, 6688.0, 10185.0, 15896.0, 24896.0, 41115.0, 68728.0, 116668.0, 176108.0, 196100.0, 147268.0, 89765.0, 52636.0, 31821.0, 19809.0, 12618.0, 8177.0, 5420.0, 3590.0, 2418.0, 1599.0, 1118.0, 776.0, 477.0, 344.0, 244.0, 181.0, 109.0, 82.0, 49.0, 40.0, 18.0, 23.0, 5.0, 3.0, 3.0, 7.0, 2.0, 3.0], "bins": [-0.84423828125, -0.8195877075195312, -0.7949371337890625, -0.7702865600585938, -0.745635986328125, -0.7209854125976562, -0.6963348388671875, -0.6716842651367188, -0.64703369140625, -0.6223831176757812, -0.5977325439453125, -0.5730819702148438, -0.548431396484375, -0.5237808227539062, -0.4991302490234375, -0.47447967529296875, -0.4498291015625, -0.42517852783203125, -0.4005279541015625, -0.37587738037109375, -0.351226806640625, -0.32657623291015625, -0.3019256591796875, -0.27727508544921875, -0.25262451171875, -0.22797393798828125, -0.2033233642578125, -0.17867279052734375, -0.154022216796875, -0.12937164306640625, -0.1047210693359375, -0.08007049560546875, -0.055419921875, -0.03076934814453125, -0.0061187744140625, 0.01853179931640625, 0.043182373046875, 0.06783294677734375, 0.0924835205078125, 0.11713409423828125, 0.14178466796875, 0.16643524169921875, 0.1910858154296875, 0.21573638916015625, 0.240386962890625, 0.26503753662109375, 0.2896881103515625, 0.31433868408203125, 0.3389892578125, 0.36363983154296875, 0.3882904052734375, 0.41294097900390625, 0.437591552734375, 0.46224212646484375, 0.4868927001953125, 0.5115432739257812, 0.53619384765625, 0.5608444213867188, 0.5854949951171875, 0.6101455688476562, 0.634796142578125, 0.6594467163085938, 0.6840972900390625, 0.7087478637695312, 0.7333984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 9.0, 7.0, 9.0, 4.0, 7.0, 10.0, 7.0, 22.0, 22.0, 26.0, 26.0, 47.0, 48.0, 59.0, 58.0, 77.0, 74.0, 70.0, 55.0, 64.0, 58.0, 41.0, 34.0, 40.0, 34.0, 22.0, 12.0, 16.0, 11.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.259765625, -0.25099945068359375, -0.2422332763671875, -0.23346710205078125, -0.224700927734375, -0.21593475341796875, -0.2071685791015625, -0.19840240478515625, -0.18963623046875, -0.18087005615234375, -0.1721038818359375, -0.16333770751953125, -0.154571533203125, -0.14580535888671875, -0.1370391845703125, -0.12827301025390625, -0.1195068359375, -0.11074066162109375, -0.1019744873046875, -0.09320831298828125, -0.084442138671875, -0.07567596435546875, -0.0669097900390625, -0.05814361572265625, -0.04937744140625, -0.04061126708984375, -0.0318450927734375, -0.02307891845703125, -0.014312744140625, -0.00554656982421875, 0.0032196044921875, 0.01198577880859375, 0.020751953125, 0.02951812744140625, 0.0382843017578125, 0.04705047607421875, 0.055816650390625, 0.06458282470703125, 0.0733489990234375, 0.08211517333984375, 0.09088134765625, 0.09964752197265625, 0.1084136962890625, 0.11717987060546875, 0.125946044921875, 0.13471221923828125, 0.1434783935546875, 0.15224456787109375, 0.1610107421875, 0.16977691650390625, 0.1785430908203125, 0.18730926513671875, 0.196075439453125, 0.20484161376953125, 0.2136077880859375, 0.22237396240234375, 0.23114013671875, 0.23990631103515625, 0.2486724853515625, 0.25743865966796875, 0.266204833984375, 0.27497100830078125, 0.2837371826171875, 0.29250335693359375, 0.30126953125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 2.0, 7.0, 10.0, 9.0, 19.0, 17.0, 27.0, 27.0, 32.0, 33.0, 48.0, 55.0, 50.0, 63.0, 56.0, 56.0, 69.0, 56.0, 38.0, 56.0, 39.0, 26.0, 24.0, 33.0, 34.0, 26.0, 24.0, 13.0, 12.0, 7.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.31647491455078, -21.541765213012695, -20.767053604125977, -19.99234390258789, -19.217632293701172, -18.442922592163086, -17.668212890625, -16.89350128173828, -16.118791580200195, -15.344080924987793, -14.56937026977539, -13.794660568237305, -13.019949913024902, -12.2452392578125, -11.470529556274414, -10.695818901062012, -9.92110824584961, -9.146397590637207, -8.371686935424805, -7.596977233886719, -6.822266578674316, -6.047555923461914, -5.27284574508667, -4.498135566711426, -3.7234249114990234, -2.9487144947052, -2.174004077911377, -1.3992936611175537, -0.6245832443237305, 0.15012717247009277, 0.924837589263916, 1.6995477676391602, 2.4742584228515625, 3.2489688396453857, 4.023679256439209, 4.798389434814453, 5.5731000900268555, 6.347810745239258, 7.122520923614502, 7.897231101989746, 8.671941757202148, 9.44665241241455, 10.221363067626953, 10.996072769165039, 11.770783424377441, 12.545494079589844, 13.32020378112793, 14.094914436340332, 14.869625091552734, 15.644335746765137, 16.41904640197754, 17.193756103515625, 17.968467712402344, 18.74317741394043, 19.517887115478516, 20.292598724365234, 21.06730842590332, 21.842018127441406, 22.616729736328125, 23.39143943786621, 24.166149139404297, 24.940860748291016, 25.7155704498291, 26.490280151367188, 27.264991760253906]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 9.0, 10.0, 11.0, 19.0, 22.0, 24.0, 22.0, 36.0, 30.0, 41.0, 40.0, 32.0, 58.0, 47.0, 55.0, 34.0, 39.0, 36.0, 49.0, 36.0, 35.0, 46.0, 41.0, 34.0, 31.0, 25.0, 17.0, 20.0, 10.0, 14.0, 16.0, 10.0, 8.0, 7.0, 3.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.66037368774414, -17.99193572998047, -17.323497772216797, -16.655059814453125, -15.98662281036377, -15.318184852600098, -14.649747848510742, -13.98130989074707, -13.312871932983398, -12.644433975219727, -11.975996017456055, -11.3075590133667, -10.639121055603027, -9.970683097839355, -9.30224609375, -8.633808135986328, -7.965370178222656, -7.296932220458984, -6.628494739532471, -5.960057258605957, -5.291619300842285, -4.623181343078613, -3.9547438621520996, -3.286306381225586, -2.617868423461914, -1.9494307041168213, -1.2809929847717285, -0.6125552654266357, 0.05588245391845703, 0.7243201732635498, 1.3927578926086426, 2.0611953735351562, 2.729633331298828, 3.398071050643921, 4.066508769989014, 4.734946250915527, 5.403384208679199, 6.071822166442871, 6.740259647369385, 7.408697128295898, 8.07713508605957, 8.745573043823242, 9.414011001586914, 10.08244800567627, 10.750885963439941, 11.419323921203613, 12.087760925292969, 12.75619888305664, 13.424636840820312, 14.093074798583984, 14.761512756347656, 15.429949760437012, 16.098388671875, 16.76682472229004, 17.43526268005371, 18.103700637817383, 18.772138595581055, 19.440576553344727, 20.1090145111084, 20.77745246887207, 21.44588851928711, 22.11432647705078, 22.782764434814453, 23.451202392578125, 24.119640350341797]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 15.0, 14.0, 26.0, 42.0, 51.0, 84.0, 98.0, 161.0, 236.0, 341.0, 499.0, 702.0, 1126.0, 1862.0, 2810.0, 4770.0, 7624.0, 12655.0, 21225.0, 35115.0, 56451.0, 86090.0, 120935.0, 148436.0, 152639.0, 130888.0, 96131.0, 64223.0, 40337.0, 24798.0, 14404.0, 8784.0, 5532.0, 3402.0, 2100.0, 1310.0, 881.0, 570.0, 354.0, 268.0, 174.0, 126.0, 97.0, 46.0, 36.0, 24.0, 22.0, 15.0, 14.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0], "bins": [-22.578125, -21.89697265625, -21.2158203125, -20.53466796875, -19.853515625, -19.17236328125, -18.4912109375, -17.81005859375, -17.12890625, -16.44775390625, -15.7666015625, -15.08544921875, -14.404296875, -13.72314453125, -13.0419921875, -12.36083984375, -11.6796875, -10.99853515625, -10.3173828125, -9.63623046875, -8.955078125, -8.27392578125, -7.5927734375, -6.91162109375, -6.23046875, -5.54931640625, -4.8681640625, -4.18701171875, -3.505859375, -2.82470703125, -2.1435546875, -1.46240234375, -0.78125, -0.10009765625, 0.5810546875, 1.26220703125, 1.943359375, 2.62451171875, 3.3056640625, 3.98681640625, 4.66796875, 5.34912109375, 6.0302734375, 6.71142578125, 7.392578125, 8.07373046875, 8.7548828125, 9.43603515625, 10.1171875, 10.79833984375, 11.4794921875, 12.16064453125, 12.841796875, 13.52294921875, 14.2041015625, 14.88525390625, 15.56640625, 16.24755859375, 16.9287109375, 17.60986328125, 18.291015625, 18.97216796875, 19.6533203125, 20.33447265625, 21.015625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 5.0, 10.0, 14.0, 11.0, 14.0, 4.0, 8.0, 21.0, 32.0, 22.0, 31.0, 34.0, 37.0, 38.0, 50.0, 42.0, 44.0, 45.0, 43.0, 38.0, 40.0, 46.0, 39.0, 38.0, 46.0, 32.0, 34.0, 29.0, 25.0, 30.0, 18.0, 12.0, 19.0, 10.0, 7.0, 10.0, 9.0, 7.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8515625, -15.2686767578125, -14.685791015625, -14.1029052734375, -13.52001953125, -12.9371337890625, -12.354248046875, -11.7713623046875, -11.1884765625, -10.6055908203125, -10.022705078125, -9.4398193359375, -8.85693359375, -8.2740478515625, -7.691162109375, -7.1082763671875, -6.525390625, -5.9425048828125, -5.359619140625, -4.7767333984375, -4.19384765625, -3.6109619140625, -3.028076171875, -2.4451904296875, -1.8623046875, -1.2794189453125, -0.696533203125, -0.1136474609375, 0.46923828125, 1.0521240234375, 1.635009765625, 2.2178955078125, 2.80078125, 3.3836669921875, 3.966552734375, 4.5494384765625, 5.13232421875, 5.7152099609375, 6.298095703125, 6.8809814453125, 7.4638671875, 8.0467529296875, 8.629638671875, 9.2125244140625, 9.79541015625, 10.3782958984375, 10.961181640625, 11.5440673828125, 12.126953125, 12.7098388671875, 13.292724609375, 13.8756103515625, 14.45849609375, 15.0413818359375, 15.624267578125, 16.2071533203125, 16.7900390625, 17.3729248046875, 17.955810546875, 18.5386962890625, 19.12158203125, 19.7044677734375, 20.287353515625, 20.8702392578125, 21.453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 6.0, 9.0, 13.0, 25.0, 33.0, 55.0, 61.0, 100.0, 135.0, 215.0, 317.0, 535.0, 819.0, 1344.0, 2178.0, 3625.0, 6552.0, 11710.0, 21766.0, 40267.0, 73989.0, 126542.0, 183744.0, 198741.0, 157376.0, 97568.0, 54566.0, 29636.0, 15965.0, 8490.0, 4685.0, 2838.0, 1650.0, 1036.0, 675.0, 439.0, 256.0, 193.0, 117.0, 93.0, 56.0, 38.0, 30.0, 20.0, 9.0, 10.0, 10.0, 7.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-32.09375, -31.12841796875, -30.1630859375, -29.19775390625, -28.232421875, -27.26708984375, -26.3017578125, -25.33642578125, -24.37109375, -23.40576171875, -22.4404296875, -21.47509765625, -20.509765625, -19.54443359375, -18.5791015625, -17.61376953125, -16.6484375, -15.68310546875, -14.7177734375, -13.75244140625, -12.787109375, -11.82177734375, -10.8564453125, -9.89111328125, -8.92578125, -7.96044921875, -6.9951171875, -6.02978515625, -5.064453125, -4.09912109375, -3.1337890625, -2.16845703125, -1.203125, -0.23779296875, 0.7275390625, 1.69287109375, 2.658203125, 3.62353515625, 4.5888671875, 5.55419921875, 6.51953125, 7.48486328125, 8.4501953125, 9.41552734375, 10.380859375, 11.34619140625, 12.3115234375, 13.27685546875, 14.2421875, 15.20751953125, 16.1728515625, 17.13818359375, 18.103515625, 19.06884765625, 20.0341796875, 20.99951171875, 21.96484375, 22.93017578125, 23.8955078125, 24.86083984375, 25.826171875, 26.79150390625, 27.7568359375, 28.72216796875, 29.6875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 10.0, 6.0, 6.0, 10.0, 14.0, 18.0, 20.0, 21.0, 31.0, 26.0, 33.0, 22.0, 27.0, 30.0, 33.0, 44.0, 35.0, 48.0, 44.0, 35.0, 43.0, 39.0, 26.0, 39.0, 42.0, 42.0, 32.0, 27.0, 25.0, 24.0, 26.0, 14.0, 17.0, 24.0, 11.0, 10.0, 9.0, 7.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.0859375, -10.746337890625, -10.40673828125, -10.067138671875, -9.7275390625, -9.387939453125, -9.04833984375, -8.708740234375, -8.369140625, -8.029541015625, -7.68994140625, -7.350341796875, -7.0107421875, -6.671142578125, -6.33154296875, -5.991943359375, -5.65234375, -5.312744140625, -4.97314453125, -4.633544921875, -4.2939453125, -3.954345703125, -3.61474609375, -3.275146484375, -2.935546875, -2.595947265625, -2.25634765625, -1.916748046875, -1.5771484375, -1.237548828125, -0.89794921875, -0.558349609375, -0.21875, 0.120849609375, 0.46044921875, 0.800048828125, 1.1396484375, 1.479248046875, 1.81884765625, 2.158447265625, 2.498046875, 2.837646484375, 3.17724609375, 3.516845703125, 3.8564453125, 4.196044921875, 4.53564453125, 4.875244140625, 5.21484375, 5.554443359375, 5.89404296875, 6.233642578125, 6.5732421875, 6.912841796875, 7.25244140625, 7.592041015625, 7.931640625, 8.271240234375, 8.61083984375, 8.950439453125, 9.2900390625, 9.629638671875, 9.96923828125, 10.308837890625, 10.6484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 3.0, 9.0, 12.0, 29.0, 29.0, 37.0, 66.0, 99.0, 116.0, 191.0, 267.0, 390.0, 628.0, 1010.0, 1638.0, 2523.0, 4262.0, 7166.0, 12778.0, 22758.0, 42077.0, 75862.0, 126356.0, 178760.0, 192373.0, 152870.0, 98686.0, 55954.0, 31003.0, 16797.0, 9639.0, 5445.0, 3205.0, 1977.0, 1224.0, 825.0, 526.0, 301.0, 223.0, 122.0, 94.0, 81.0, 49.0, 25.0, 25.0, 13.0, 13.0, 5.0, 7.0, 4.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-6.53515625, -6.33245849609375, -6.1297607421875, -5.92706298828125, -5.724365234375, -5.52166748046875, -5.3189697265625, -5.11627197265625, -4.91357421875, -4.71087646484375, -4.5081787109375, -4.30548095703125, -4.102783203125, -3.90008544921875, -3.6973876953125, -3.49468994140625, -3.2919921875, -3.08929443359375, -2.8865966796875, -2.68389892578125, -2.481201171875, -2.27850341796875, -2.0758056640625, -1.87310791015625, -1.67041015625, -1.46771240234375, -1.2650146484375, -1.06231689453125, -0.859619140625, -0.65692138671875, -0.4542236328125, -0.25152587890625, -0.048828125, 0.15386962890625, 0.3565673828125, 0.55926513671875, 0.761962890625, 0.96466064453125, 1.1673583984375, 1.37005615234375, 1.57275390625, 1.77545166015625, 1.9781494140625, 2.18084716796875, 2.383544921875, 2.58624267578125, 2.7889404296875, 2.99163818359375, 3.1943359375, 3.39703369140625, 3.5997314453125, 3.80242919921875, 4.005126953125, 4.20782470703125, 4.4105224609375, 4.61322021484375, 4.81591796875, 5.01861572265625, 5.2213134765625, 5.42401123046875, 5.626708984375, 5.82940673828125, 6.0321044921875, 6.23480224609375, 6.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 9.0, 10.0, 11.0, 16.0, 21.0, 30.0, 39.0, 47.0, 60.0, 50.0, 61.0, 81.0, 77.0, 75.0, 55.0, 67.0, 45.0, 44.0, 51.0, 32.0, 18.0, 26.0, 11.0, 14.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007205009460449219, -0.000696226954460144, -0.0006719529628753662, -0.0006476789712905884, -0.0006234049797058105, -0.0005991309881210327, -0.0005748569965362549, -0.000550583004951477, -0.0005263090133666992, -0.0005020350217819214, -0.00047776103019714355, -0.0004534870386123657, -0.0004292130470275879, -0.00040493905544281006, -0.0003806650638580322, -0.0003563910722732544, -0.00033211708068847656, -0.00030784308910369873, -0.0002835690975189209, -0.00025929510593414307, -0.00023502111434936523, -0.0002107471227645874, -0.00018647313117980957, -0.00016219913959503174, -0.0001379251480102539, -0.00011365115642547607, -8.937716484069824e-05, -6.510317325592041e-05, -4.082918167114258e-05, -1.6555190086364746e-05, 7.718801498413086e-06, 3.199279308319092e-05, 5.626678466796875e-05, 8.054077625274658e-05, 0.00010481476783752441, 0.00012908875942230225, 0.00015336275100708008, 0.0001776367425918579, 0.00020191073417663574, 0.00022618472576141357, 0.0002504587173461914, 0.00027473270893096924, 0.00029900670051574707, 0.0003232806921005249, 0.00034755468368530273, 0.00037182867527008057, 0.0003961026668548584, 0.00042037665843963623, 0.00044465065002441406, 0.0004689246416091919, 0.0004931986331939697, 0.0005174726247787476, 0.0005417466163635254, 0.0005660206079483032, 0.0005902945995330811, 0.0006145685911178589, 0.0006388425827026367, 0.0006631165742874146, 0.0006873905658721924, 0.0007116645574569702, 0.000735938549041748, 0.0007602125406265259, 0.0007844865322113037, 0.0008087605237960815, 0.0008330345153808594]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 5.0, 20.0, 22.0, 26.0, 43.0, 71.0, 86.0, 95.0, 178.0, 261.0, 355.0, 510.0, 776.0, 1164.0, 1675.0, 2551.0, 3835.0, 5856.0, 9429.0, 15566.0, 25439.0, 41646.0, 66027.0, 99386.0, 134725.0, 155030.0, 147164.0, 116670.0, 81918.0, 52284.0, 32255.0, 20000.0, 11980.0, 7501.0, 4703.0, 3029.0, 2009.0, 1376.0, 936.0, 629.0, 431.0, 286.0, 181.0, 128.0, 93.0, 75.0, 46.0, 29.0, 17.0, 12.0, 4.0, 10.0, 6.0, 3.0, 1.0, 1.0, 4.0, 3.0], "bins": [-5.28125, -5.1148681640625, -4.948486328125, -4.7821044921875, -4.61572265625, -4.4493408203125, -4.282958984375, -4.1165771484375, -3.9501953125, -3.7838134765625, -3.617431640625, -3.4510498046875, -3.28466796875, -3.1182861328125, -2.951904296875, -2.7855224609375, -2.619140625, -2.4527587890625, -2.286376953125, -2.1199951171875, -1.95361328125, -1.7872314453125, -1.620849609375, -1.4544677734375, -1.2880859375, -1.1217041015625, -0.955322265625, -0.7889404296875, -0.62255859375, -0.4561767578125, -0.289794921875, -0.1234130859375, 0.04296875, 0.2093505859375, 0.375732421875, 0.5421142578125, 0.70849609375, 0.8748779296875, 1.041259765625, 1.2076416015625, 1.3740234375, 1.5404052734375, 1.706787109375, 1.8731689453125, 2.03955078125, 2.2059326171875, 2.372314453125, 2.5386962890625, 2.705078125, 2.8714599609375, 3.037841796875, 3.2042236328125, 3.37060546875, 3.5369873046875, 3.703369140625, 3.8697509765625, 4.0361328125, 4.2025146484375, 4.368896484375, 4.5352783203125, 4.70166015625, 4.8680419921875, 5.034423828125, 5.2008056640625, 5.3671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 2.0, 6.0, 6.0, 6.0, 10.0, 9.0, 17.0, 23.0, 21.0, 36.0, 25.0, 33.0, 37.0, 33.0, 42.0, 57.0, 44.0, 48.0, 39.0, 48.0, 62.0, 37.0, 37.0, 50.0, 40.0, 31.0, 32.0, 33.0, 28.0, 19.0, 17.0, 14.0, 10.0, 7.0, 13.0, 4.0, 6.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.25390625, -2.192779541015625, -2.13165283203125, -2.070526123046875, -2.0093994140625, -1.948272705078125, -1.88714599609375, -1.826019287109375, -1.764892578125, -1.703765869140625, -1.64263916015625, -1.581512451171875, -1.5203857421875, -1.459259033203125, -1.39813232421875, -1.337005615234375, -1.27587890625, -1.214752197265625, -1.15362548828125, -1.092498779296875, -1.0313720703125, -0.970245361328125, -0.90911865234375, -0.847991943359375, -0.786865234375, -0.725738525390625, -0.66461181640625, -0.603485107421875, -0.5423583984375, -0.481231689453125, -0.42010498046875, -0.358978271484375, -0.2978515625, -0.236724853515625, -0.17559814453125, -0.114471435546875, -0.0533447265625, 0.007781982421875, 0.06890869140625, 0.130035400390625, 0.191162109375, 0.252288818359375, 0.31341552734375, 0.374542236328125, 0.4356689453125, 0.496795654296875, 0.55792236328125, 0.619049072265625, 0.68017578125, 0.741302490234375, 0.80242919921875, 0.863555908203125, 0.9246826171875, 0.985809326171875, 1.04693603515625, 1.108062744140625, 1.169189453125, 1.230316162109375, 1.29144287109375, 1.352569580078125, 1.4136962890625, 1.474822998046875, 1.53594970703125, 1.597076416015625, 1.658203125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 10.0, 3.0, 9.0, 8.0, 14.0, 14.0, 26.0, 34.0, 38.0, 37.0, 29.0, 45.0, 41.0, 55.0, 70.0, 65.0, 61.0, 49.0, 50.0, 43.0, 48.0, 47.0, 35.0, 25.0, 18.0, 25.0, 19.0, 19.0, 15.0, 18.0, 9.0, 4.0, 9.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.121753692626953, -19.388927459716797, -18.65610122680664, -17.923274993896484, -17.190446853637695, -16.45762062072754, -15.724794387817383, -14.991968154907227, -14.25914192199707, -13.526315689086914, -12.793488502502441, -12.060662269592285, -11.327836036682129, -10.595008850097656, -9.8621826171875, -9.129356384277344, -8.396529197692871, -7.663702487945557, -6.9308762550354, -6.198049545288086, -5.46522331237793, -4.732396602630615, -3.999569892883301, -3.2667436599731445, -2.53391695022583, -1.8010904788970947, -1.0682638883590698, -0.3354372978210449, 0.39738917350769043, 1.1302156448364258, 1.8630423545837402, 2.5958685874938965, 3.328695297241211, 4.061522006988525, 4.794348239898682, 5.527174949645996, 6.260001182556152, 6.992827892303467, 7.725654602050781, 8.458480834960938, 9.191307067871094, 9.92413330078125, 10.656960487365723, 11.389786720275879, 12.122612953186035, 12.855440139770508, 13.588266372680664, 14.32109260559082, 15.053919792175293, 15.78674602508545, 16.519573211669922, 17.252399444580078, 17.985225677490234, 18.71805191040039, 19.450878143310547, 20.183704376220703, 20.916532516479492, 21.64935874938965, 22.382184982299805, 23.115013122558594, 23.84783935546875, 24.580665588378906, 25.313491821289062, 26.04631805419922, 26.779144287109375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 6.0, 10.0, 11.0, 14.0, 14.0, 17.0, 19.0, 20.0, 27.0, 41.0, 34.0, 36.0, 45.0, 40.0, 44.0, 41.0, 37.0, 48.0, 40.0, 40.0, 36.0, 39.0, 41.0, 34.0, 24.0, 36.0, 25.0, 29.0, 22.0, 21.0, 29.0, 12.0, 9.0, 9.0, 9.0, 11.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.59825897216797, -17.011245727539062, -16.424232482910156, -15.837221145629883, -15.250207901000977, -14.66319465637207, -14.07618236541748, -13.48917007446289, -12.902156829833984, -12.315143585205078, -11.728131294250488, -11.141119003295898, -10.554105758666992, -9.967092514038086, -9.380080223083496, -8.793067932128906, -8.2060546875, -7.619041919708252, -7.032029151916504, -6.445016384124756, -5.858003616333008, -5.27099084854126, -4.683978080749512, -4.096965312957764, -3.5099525451660156, -2.9229397773742676, -2.3359270095825195, -1.7489142417907715, -1.1619014739990234, -0.5748887062072754, 0.012124061584472656, 0.5991368293762207, 1.1861495971679688, 1.7731623649597168, 2.360175132751465, 2.947187900543213, 3.534200668334961, 4.121213436126709, 4.708226203918457, 5.295238971710205, 5.882251739501953, 6.469264507293701, 7.056277275085449, 7.643290042877197, 8.230302810668945, 8.817316055297852, 9.404328346252441, 9.991340637207031, 10.578353881835938, 11.165367126464844, 11.752379417419434, 12.339391708374023, 12.92640495300293, 13.513418197631836, 14.100430488586426, 14.687442779541016, 15.274456024169922, 15.861469268798828, 16.448482513427734, 17.035493850708008, 17.622507095336914, 18.20952033996582, 18.796531677246094, 19.383544921875, 19.970558166503906]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 5.0, 14.0, 13.0, 24.0, 39.0, 66.0, 87.0, 136.0, 211.0, 329.0, 468.0, 707.0, 953.0, 1549.0, 2345.0, 3784.0, 5881.0, 9411.0, 15064.0, 24340.0, 40179.0, 66922.0, 111205.0, 186913.0, 307437.0, 471069.0, 625294.0, 675780.0, 580351.0, 410254.0, 258314.0, 156021.0, 93356.0, 55705.0, 33671.0, 20796.0, 12798.0, 8066.0, 5061.0, 3339.0, 2168.0, 1431.0, 920.0, 602.0, 413.0, 267.0, 183.0, 109.0, 83.0, 46.0, 39.0, 24.0, 18.0, 13.0, 12.0, 3.0, 4.0, 3.0, 2.0, 2.0], "bins": [-17.8125, -17.243896484375, -16.67529296875, -16.106689453125, -15.5380859375, -14.969482421875, -14.40087890625, -13.832275390625, -13.263671875, -12.695068359375, -12.12646484375, -11.557861328125, -10.9892578125, -10.420654296875, -9.85205078125, -9.283447265625, -8.71484375, -8.146240234375, -7.57763671875, -7.009033203125, -6.4404296875, -5.871826171875, -5.30322265625, -4.734619140625, -4.166015625, -3.597412109375, -3.02880859375, -2.460205078125, -1.8916015625, -1.322998046875, -0.75439453125, -0.185791015625, 0.3828125, 0.951416015625, 1.52001953125, 2.088623046875, 2.6572265625, 3.225830078125, 3.79443359375, 4.363037109375, 4.931640625, 5.500244140625, 6.06884765625, 6.637451171875, 7.2060546875, 7.774658203125, 8.34326171875, 8.911865234375, 9.48046875, 10.049072265625, 10.61767578125, 11.186279296875, 11.7548828125, 12.323486328125, 12.89208984375, 13.460693359375, 14.029296875, 14.597900390625, 15.16650390625, 15.735107421875, 16.3037109375, 16.872314453125, 17.44091796875, 18.009521484375, 18.578125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 6.0, 9.0, 16.0, 9.0, 18.0, 16.0, 19.0, 26.0, 30.0, 30.0, 40.0, 31.0, 28.0, 37.0, 43.0, 55.0, 36.0, 39.0, 43.0, 36.0, 40.0, 34.0, 36.0, 28.0, 31.0, 34.0, 32.0, 25.0, 20.0, 22.0, 26.0, 19.0, 19.0, 7.0, 10.0, 9.0, 6.0, 6.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.5078125, -13.0443115234375, -12.580810546875, -12.1173095703125, -11.65380859375, -11.1903076171875, -10.726806640625, -10.2633056640625, -9.7998046875, -9.3363037109375, -8.872802734375, -8.4093017578125, -7.94580078125, -7.4822998046875, -7.018798828125, -6.5552978515625, -6.091796875, -5.6282958984375, -5.164794921875, -4.7012939453125, -4.23779296875, -3.7742919921875, -3.310791015625, -2.8472900390625, -2.3837890625, -1.9202880859375, -1.456787109375, -0.9932861328125, -0.52978515625, -0.0662841796875, 0.397216796875, 0.8607177734375, 1.32421875, 1.7877197265625, 2.251220703125, 2.7147216796875, 3.17822265625, 3.6417236328125, 4.105224609375, 4.5687255859375, 5.0322265625, 5.4957275390625, 5.959228515625, 6.4227294921875, 6.88623046875, 7.3497314453125, 7.813232421875, 8.2767333984375, 8.740234375, 9.2037353515625, 9.667236328125, 10.1307373046875, 10.59423828125, 11.0577392578125, 11.521240234375, 11.9847412109375, 12.4482421875, 12.9117431640625, 13.375244140625, 13.8387451171875, 14.30224609375, 14.7657470703125, 15.229248046875, 15.6927490234375, 16.15625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 12.0, 13.0, 22.0, 38.0, 59.0, 99.0, 190.0, 290.0, 410.0, 659.0, 1058.0, 1718.0, 2839.0, 4502.0, 7384.0, 11832.0, 19624.0, 32114.0, 52969.0, 85688.0, 138441.0, 217581.0, 327406.0, 457169.0, 564245.0, 591419.0, 525101.0, 400423.0, 277134.0, 179803.0, 113693.0, 69792.0, 42917.0, 26202.0, 16114.0, 9735.0, 6007.0, 3634.0, 2191.0, 1367.0, 867.0, 545.0, 380.0, 218.0, 153.0, 81.0, 57.0, 37.0, 21.0, 17.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.140625, -16.5927734375, -16.044921875, -15.4970703125, -14.94921875, -14.4013671875, -13.853515625, -13.3056640625, -12.7578125, -12.2099609375, -11.662109375, -11.1142578125, -10.56640625, -10.0185546875, -9.470703125, -8.9228515625, -8.375, -7.8271484375, -7.279296875, -6.7314453125, -6.18359375, -5.6357421875, -5.087890625, -4.5400390625, -3.9921875, -3.4443359375, -2.896484375, -2.3486328125, -1.80078125, -1.2529296875, -0.705078125, -0.1572265625, 0.390625, 0.9384765625, 1.486328125, 2.0341796875, 2.58203125, 3.1298828125, 3.677734375, 4.2255859375, 4.7734375, 5.3212890625, 5.869140625, 6.4169921875, 6.96484375, 7.5126953125, 8.060546875, 8.6083984375, 9.15625, 9.7041015625, 10.251953125, 10.7998046875, 11.34765625, 11.8955078125, 12.443359375, 12.9912109375, 13.5390625, 14.0869140625, 14.634765625, 15.1826171875, 15.73046875, 16.2783203125, 16.826171875, 17.3740234375, 17.921875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 7.0, 7.0, 8.0, 10.0, 15.0, 20.0, 36.0, 40.0, 45.0, 46.0, 82.0, 81.0, 99.0, 129.0, 153.0, 180.0, 186.0, 207.0, 245.0, 235.0, 250.0, 231.0, 213.0, 227.0, 212.0, 200.0, 163.0, 164.0, 118.0, 93.0, 85.0, 60.0, 49.0, 29.0, 39.0, 27.0, 19.0, 20.0, 12.0, 10.0, 5.0, 6.0, 8.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3046875, -7.05029296875, -6.7958984375, -6.54150390625, -6.287109375, -6.03271484375, -5.7783203125, -5.52392578125, -5.26953125, -5.01513671875, -4.7607421875, -4.50634765625, -4.251953125, -3.99755859375, -3.7431640625, -3.48876953125, -3.234375, -2.97998046875, -2.7255859375, -2.47119140625, -2.216796875, -1.96240234375, -1.7080078125, -1.45361328125, -1.19921875, -0.94482421875, -0.6904296875, -0.43603515625, -0.181640625, 0.07275390625, 0.3271484375, 0.58154296875, 0.8359375, 1.09033203125, 1.3447265625, 1.59912109375, 1.853515625, 2.10791015625, 2.3623046875, 2.61669921875, 2.87109375, 3.12548828125, 3.3798828125, 3.63427734375, 3.888671875, 4.14306640625, 4.3974609375, 4.65185546875, 4.90625, 5.16064453125, 5.4150390625, 5.66943359375, 5.923828125, 6.17822265625, 6.4326171875, 6.68701171875, 6.94140625, 7.19580078125, 7.4501953125, 7.70458984375, 7.958984375, 8.21337890625, 8.4677734375, 8.72216796875, 8.9765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 2.0, 4.0, 4.0, 11.0, 15.0, 11.0, 13.0, 22.0, 18.0, 26.0, 45.0, 25.0, 34.0, 45.0, 43.0, 37.0, 53.0, 46.0, 43.0, 36.0, 42.0, 51.0, 33.0, 36.0, 34.0, 35.0, 32.0, 27.0, 34.0, 24.0, 17.0, 21.0, 12.0, 12.0, 12.0, 10.0, 10.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-20.966812133789062, -20.371826171875, -19.776840209960938, -19.181856155395508, -18.586870193481445, -17.991884231567383, -17.39689826965332, -16.801912307739258, -16.206928253173828, -15.611942291259766, -15.01695728302002, -14.421971321105957, -13.826986312866211, -13.232000350952148, -12.637014389038086, -12.042028427124023, -11.447042465209961, -10.852056503295898, -10.257071495056152, -9.66208553314209, -9.067100524902344, -8.472114562988281, -7.877128601074219, -7.2821431159973145, -6.68715763092041, -6.092172145843506, -5.497186660766602, -4.902200698852539, -4.307215213775635, -3.7122297286987305, -3.117244005203247, -2.5222582817077637, -1.9272747039794922, -1.3322890996932983, -0.7373034954071045, -0.14231789112091064, 0.4526677131652832, 1.0476531982421875, 1.642638921737671, 2.2376246452331543, 2.8326101303100586, 3.427595615386963, 4.022581100463867, 4.61756706237793, 5.212552547454834, 5.807538032531738, 6.402523994445801, 6.997509479522705, 7.592494964599609, 8.187480926513672, 8.782465934753418, 9.37745189666748, 9.972436904907227, 10.567422866821289, 11.162408828735352, 11.757394790649414, 12.35237979888916, 12.947365760803223, 13.542350769042969, 14.137336730957031, 14.732322692871094, 15.32730770111084, 15.922293663024902, 16.51727867126465, 17.11226463317871]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 9.0, 8.0, 5.0, 6.0, 14.0, 12.0, 14.0, 12.0, 17.0, 23.0, 18.0, 26.0, 29.0, 44.0, 25.0, 37.0, 39.0, 40.0, 40.0, 29.0, 45.0, 49.0, 43.0, 41.0, 34.0, 43.0, 28.0, 33.0, 33.0, 35.0, 23.0, 18.0, 21.0, 9.0, 21.0, 19.0, 12.0, 9.0, 8.0, 6.0, 5.0, 5.0, 8.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.620214462280273, -16.067855834960938, -15.515498161315918, -14.963139533996582, -14.410780906677246, -13.858423233032227, -13.30606460571289, -12.753705978393555, -12.201347351074219, -11.648988723754883, -11.096631050109863, -10.544272422790527, -9.991913795471191, -9.439556121826172, -8.887197494506836, -8.3348388671875, -7.7824811935424805, -7.230123043060303, -6.677764415740967, -6.125406265258789, -5.573047637939453, -5.020689487457275, -4.468331336975098, -3.915972948074341, -3.363614559173584, -2.811256170272827, -2.2588977813720703, -1.7065396308898926, -1.1541812419891357, -0.6018228530883789, -0.04946470260620117, 0.5028936862945557, 1.0552520751953125, 1.6076104640960693, 2.159968852996826, 2.712327003479004, 3.2646853923797607, 3.8170437812805176, 4.369401931762695, 4.921760559082031, 5.474118709564209, 6.026476860046387, 6.578835487365723, 7.1311936378479, 7.683551788330078, 8.235910415649414, 8.78826904296875, 9.34062671661377, 9.892985343933105, 10.445343971252441, 10.997701644897461, 11.550060272216797, 12.102418899536133, 12.654777526855469, 13.207135200500488, 13.759493827819824, 14.311851501464844, 14.86421012878418, 15.4165678024292, 15.968926429748535, 16.521284103393555, 17.07364273071289, 17.626001358032227, 18.178359985351562, 18.7307186126709]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 16.0, 27.0, 41.0, 54.0, 78.0, 104.0, 165.0, 297.0, 410.0, 525.0, 854.0, 1247.0, 1853.0, 2706.0, 4025.0, 5658.0, 8446.0, 12080.0, 17289.0, 24337.0, 33711.0, 45289.0, 59062.0, 73442.0, 87252.0, 96743.0, 100745.0, 97113.0, 87187.0, 73312.0, 58111.0, 44812.0, 32761.0, 23868.0, 17001.0, 11806.0, 8188.0, 5631.0, 3917.0, 2709.0, 1821.0, 1261.0, 853.0, 580.0, 388.0, 251.0, 186.0, 125.0, 86.0, 48.0, 26.0, 24.0, 10.0, 12.0, 9.0, 4.0, 1.0, 1.0], "bins": [-7.19921875, -6.9775390625, -6.755859375, -6.5341796875, -6.3125, -6.0908203125, -5.869140625, -5.6474609375, -5.42578125, -5.2041015625, -4.982421875, -4.7607421875, -4.5390625, -4.3173828125, -4.095703125, -3.8740234375, -3.65234375, -3.4306640625, -3.208984375, -2.9873046875, -2.765625, -2.5439453125, -2.322265625, -2.1005859375, -1.87890625, -1.6572265625, -1.435546875, -1.2138671875, -0.9921875, -0.7705078125, -0.548828125, -0.3271484375, -0.10546875, 0.1162109375, 0.337890625, 0.5595703125, 0.78125, 1.0029296875, 1.224609375, 1.4462890625, 1.66796875, 1.8896484375, 2.111328125, 2.3330078125, 2.5546875, 2.7763671875, 2.998046875, 3.2197265625, 3.44140625, 3.6630859375, 3.884765625, 4.1064453125, 4.328125, 4.5498046875, 4.771484375, 4.9931640625, 5.21484375, 5.4365234375, 5.658203125, 5.8798828125, 6.1015625, 6.3232421875, 6.544921875, 6.7666015625, 6.98828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 8.0, 6.0, 6.0, 11.0, 11.0, 17.0, 11.0, 17.0, 21.0, 17.0, 28.0, 22.0, 40.0, 31.0, 33.0, 44.0, 35.0, 43.0, 30.0, 37.0, 57.0, 40.0, 38.0, 42.0, 35.0, 31.0, 33.0, 34.0, 33.0, 28.0, 24.0, 13.0, 18.0, 17.0, 18.0, 12.0, 16.0, 4.0, 5.0, 7.0, 4.0, 10.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.0625, -16.50537109375, -15.9482421875, -15.39111328125, -14.833984375, -14.27685546875, -13.7197265625, -13.16259765625, -12.60546875, -12.04833984375, -11.4912109375, -10.93408203125, -10.376953125, -9.81982421875, -9.2626953125, -8.70556640625, -8.1484375, -7.59130859375, -7.0341796875, -6.47705078125, -5.919921875, -5.36279296875, -4.8056640625, -4.24853515625, -3.69140625, -3.13427734375, -2.5771484375, -2.02001953125, -1.462890625, -0.90576171875, -0.3486328125, 0.20849609375, 0.765625, 1.32275390625, 1.8798828125, 2.43701171875, 2.994140625, 3.55126953125, 4.1083984375, 4.66552734375, 5.22265625, 5.77978515625, 6.3369140625, 6.89404296875, 7.451171875, 8.00830078125, 8.5654296875, 9.12255859375, 9.6796875, 10.23681640625, 10.7939453125, 11.35107421875, 11.908203125, 12.46533203125, 13.0224609375, 13.57958984375, 14.13671875, 14.69384765625, 15.2509765625, 15.80810546875, 16.365234375, 16.92236328125, 17.4794921875, 18.03662109375, 18.59375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 12.0, 18.0, 34.0, 57.0, 57.0, 93.0, 131.0, 188.0, 325.0, 488.0, 696.0, 1217.0, 1737.0, 2838.0, 4424.0, 6767.0, 10574.0, 16867.0, 27315.0, 124076.0, 740112.0, 47849.0, 22855.0, 14246.0, 8893.0, 5933.0, 3764.0, 2378.0, 1567.0, 1017.0, 688.0, 458.0, 315.0, 192.0, 121.0, 74.0, 54.0, 36.0, 23.0, 12.0, 11.0, 6.0, 12.0, 4.0, 2.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.703125, -16.169921875, -15.63671875, -15.103515625, -14.5703125, -14.037109375, -13.50390625, -12.970703125, -12.4375, -11.904296875, -11.37109375, -10.837890625, -10.3046875, -9.771484375, -9.23828125, -8.705078125, -8.171875, -7.638671875, -7.10546875, -6.572265625, -6.0390625, -5.505859375, -4.97265625, -4.439453125, -3.90625, -3.373046875, -2.83984375, -2.306640625, -1.7734375, -1.240234375, -0.70703125, -0.173828125, 0.359375, 0.892578125, 1.42578125, 1.958984375, 2.4921875, 3.025390625, 3.55859375, 4.091796875, 4.625, 5.158203125, 5.69140625, 6.224609375, 6.7578125, 7.291015625, 7.82421875, 8.357421875, 8.890625, 9.423828125, 9.95703125, 10.490234375, 11.0234375, 11.556640625, 12.08984375, 12.623046875, 13.15625, 13.689453125, 14.22265625, 14.755859375, 15.2890625, 15.822265625, 16.35546875, 16.888671875, 17.421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 10.0, 14.0, 6.0, 16.0, 22.0, 28.0, 25.0, 13.0, 31.0, 30.0, 29.0, 32.0, 43.0, 41.0, 49.0, 32.0, 45.0, 36.0, 44.0, 39.0, 33.0, 46.0, 33.0, 35.0, 30.0, 30.0, 29.0, 31.0, 19.0, 18.0, 21.0, 17.0, 13.0, 8.0, 7.0, 11.0, 10.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.359375, -14.915283203125, -14.47119140625, -14.027099609375, -13.5830078125, -13.138916015625, -12.69482421875, -12.250732421875, -11.806640625, -11.362548828125, -10.91845703125, -10.474365234375, -10.0302734375, -9.586181640625, -9.14208984375, -8.697998046875, -8.25390625, -7.809814453125, -7.36572265625, -6.921630859375, -6.4775390625, -6.033447265625, -5.58935546875, -5.145263671875, -4.701171875, -4.257080078125, -3.81298828125, -3.368896484375, -2.9248046875, -2.480712890625, -2.03662109375, -1.592529296875, -1.1484375, -0.704345703125, -0.26025390625, 0.183837890625, 0.6279296875, 1.072021484375, 1.51611328125, 1.960205078125, 2.404296875, 2.848388671875, 3.29248046875, 3.736572265625, 4.1806640625, 4.624755859375, 5.06884765625, 5.512939453125, 5.95703125, 6.401123046875, 6.84521484375, 7.289306640625, 7.7333984375, 8.177490234375, 8.62158203125, 9.065673828125, 9.509765625, 9.953857421875, 10.39794921875, 10.842041015625, 11.2861328125, 11.730224609375, 12.17431640625, 12.618408203125, 13.0625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 14.0, 12.0, 30.0, 23.0, 44.0, 59.0, 69.0, 115.0, 125.0, 226.0, 345.0, 552.0, 1013.0, 1862.0, 3799.0, 8366.0, 22332.0, 118281.0, 830430.0, 37139.0, 12661.0, 5166.0, 2515.0, 1330.0, 755.0, 426.0, 279.0, 165.0, 114.0, 90.0, 42.0, 44.0, 33.0, 30.0, 18.0, 9.0, 3.0, 9.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.65234375, -2.5748291015625, -2.497314453125, -2.4197998046875, -2.34228515625, -2.2647705078125, -2.187255859375, -2.1097412109375, -2.0322265625, -1.9547119140625, -1.877197265625, -1.7996826171875, -1.72216796875, -1.6446533203125, -1.567138671875, -1.4896240234375, -1.412109375, -1.3345947265625, -1.257080078125, -1.1795654296875, -1.10205078125, -1.0245361328125, -0.947021484375, -0.8695068359375, -0.7919921875, -0.7144775390625, -0.636962890625, -0.5594482421875, -0.48193359375, -0.4044189453125, -0.326904296875, -0.2493896484375, -0.171875, -0.0943603515625, -0.016845703125, 0.0606689453125, 0.13818359375, 0.2156982421875, 0.293212890625, 0.3707275390625, 0.4482421875, 0.5257568359375, 0.603271484375, 0.6807861328125, 0.75830078125, 0.8358154296875, 0.913330078125, 0.9908447265625, 1.068359375, 1.1458740234375, 1.223388671875, 1.3009033203125, 1.37841796875, 1.4559326171875, 1.533447265625, 1.6109619140625, 1.6884765625, 1.7659912109375, 1.843505859375, 1.9210205078125, 1.99853515625, 2.0760498046875, 2.153564453125, 2.2310791015625, 2.30859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 8.0, 13.0, 21.0, 15.0, 30.0, 49.0, 49.0, 56.0, 67.0, 67.0, 96.0, 89.0, 83.0, 70.0, 58.0, 48.0, 39.0, 25.0, 26.0, 12.0, 17.0, 13.0, 5.0, 6.0, 5.0, 6.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004284381866455078, -0.0004131905734539032, -0.0003979429602622986, -0.00038269534707069397, -0.00036744773387908936, -0.00035220012068748474, -0.0003369525074958801, -0.0003217048943042755, -0.0003064572811126709, -0.0002912096679210663, -0.00027596205472946167, -0.00026071444153785706, -0.00024546682834625244, -0.00023021921515464783, -0.0002149716019630432, -0.0001997239887714386, -0.00018447637557983398, -0.00016922876238822937, -0.00015398114919662476, -0.00013873353600502014, -0.00012348592281341553, -0.00010823830962181091, -9.29906964302063e-05, -7.774308323860168e-05, -6.249547004699707e-05, -4.7247856855392456e-05, -3.200024366378784e-05, -1.6752630472183228e-05, -1.5050172805786133e-06, 1.3742595911026001e-05, 2.8990209102630615e-05, 4.423782229423523e-05, 5.9485435485839844e-05, 7.473304867744446e-05, 8.998066186904907e-05, 0.00010522827506065369, 0.0001204758882522583, 0.00013572350144386292, 0.00015097111463546753, 0.00016621872782707214, 0.00018146634101867676, 0.00019671395421028137, 0.00021196156740188599, 0.0002272091805934906, 0.00024245679378509521, 0.00025770440697669983, 0.00027295202016830444, 0.00028819963335990906, 0.00030344724655151367, 0.0003186948597431183, 0.0003339424729347229, 0.0003491900861263275, 0.00036443769931793213, 0.00037968531250953674, 0.00039493292570114136, 0.00041018053889274597, 0.0004254281520843506, 0.0004406757652759552, 0.0004559233784675598, 0.00047117099165916443, 0.00048641860485076904, 0.0005016662180423737, 0.0005169138312339783, 0.0005321614444255829, 0.0005474090576171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 4.0, 8.0, 9.0, 10.0, 18.0, 32.0, 43.0, 62.0, 105.0, 136.0, 155.0, 243.0, 351.0, 576.0, 792.0, 1177.0, 1659.0, 2634.0, 3858.0, 5856.0, 8971.0, 14303.0, 22343.0, 34799.0, 54731.0, 83291.0, 118150.0, 149864.0, 153423.0, 127781.0, 92414.0, 61098.0, 39265.0, 24878.0, 15834.0, 10121.0, 6421.0, 4251.0, 2833.0, 1869.0, 1279.0, 887.0, 634.0, 426.0, 297.0, 235.0, 124.0, 103.0, 64.0, 51.0, 27.0, 22.0, 23.0, 5.0, 11.0, 7.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.73876953125, -0.7157745361328125, -0.692779541015625, -0.6697845458984375, -0.64678955078125, -0.6237945556640625, -0.600799560546875, -0.5778045654296875, -0.5548095703125, -0.5318145751953125, -0.508819580078125, -0.4858245849609375, -0.46282958984375, -0.4398345947265625, -0.416839599609375, -0.3938446044921875, -0.370849609375, -0.3478546142578125, -0.324859619140625, -0.3018646240234375, -0.27886962890625, -0.2558746337890625, -0.232879638671875, -0.2098846435546875, -0.1868896484375, -0.1638946533203125, -0.140899658203125, -0.1179046630859375, -0.09490966796875, -0.0719146728515625, -0.048919677734375, -0.0259246826171875, -0.0029296875, 0.0200653076171875, 0.043060302734375, 0.0660552978515625, 0.08905029296875, 0.1120452880859375, 0.135040283203125, 0.1580352783203125, 0.1810302734375, 0.2040252685546875, 0.227020263671875, 0.2500152587890625, 0.27301025390625, 0.2960052490234375, 0.319000244140625, 0.3419952392578125, 0.364990234375, 0.3879852294921875, 0.410980224609375, 0.4339752197265625, 0.45697021484375, 0.4799652099609375, 0.502960205078125, 0.5259552001953125, 0.5489501953125, 0.5719451904296875, 0.594940185546875, 0.6179351806640625, 0.64093017578125, 0.6639251708984375, 0.686920166015625, 0.7099151611328125, 0.73291015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 0.0, 4.0, 5.0, 8.0, 10.0, 11.0, 13.0, 12.0, 20.0, 25.0, 28.0, 34.0, 39.0, 49.0, 67.0, 58.0, 67.0, 50.0, 67.0, 63.0, 55.0, 45.0, 52.0, 31.0, 35.0, 39.0, 21.0, 17.0, 23.0, 6.0, 10.0, 6.0, 5.0, 4.0, 5.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33203125, -0.3212547302246094, -0.31047821044921875, -0.2997016906738281, -0.2889251708984375, -0.2781486511230469, -0.26737213134765625, -0.2565956115722656, -0.245819091796875, -0.23504257202148438, -0.22426605224609375, -0.21348953247070312, -0.2027130126953125, -0.19193649291992188, -0.18115997314453125, -0.17038345336914062, -0.15960693359375, -0.14883041381835938, -0.13805389404296875, -0.12727737426757812, -0.1165008544921875, -0.10572433471679688, -0.09494781494140625, -0.08417129516601562, -0.073394775390625, -0.06261825561523438, -0.05184173583984375, -0.041065216064453125, -0.0302886962890625, -0.019512176513671875, -0.00873565673828125, 0.002040863037109375, 0.0128173828125, 0.023593902587890625, 0.03437042236328125, 0.045146942138671875, 0.0559234619140625, 0.06669998168945312, 0.07747650146484375, 0.08825302124023438, 0.099029541015625, 0.10980606079101562, 0.12058258056640625, 0.13135910034179688, 0.1421356201171875, 0.15291213989257812, 0.16368865966796875, 0.17446517944335938, 0.18524169921875, 0.19601821899414062, 0.20679473876953125, 0.21757125854492188, 0.2283477783203125, 0.23912429809570312, 0.24990081787109375, 0.2606773376464844, 0.271453857421875, 0.2822303771972656, 0.29300689697265625, 0.3037834167480469, 0.3145599365234375, 0.3253364562988281, 0.33611297607421875, 0.3468894958496094, 0.357666015625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 6.0, 17.0, 21.0, 20.0, 7.0, 25.0, 27.0, 31.0, 39.0, 42.0, 55.0, 49.0, 39.0, 45.0, 49.0, 56.0, 47.0, 40.0, 43.0, 38.0, 45.0, 25.0, 28.0, 31.0, 28.0, 22.0, 23.0, 25.0, 19.0, 8.0, 5.0, 11.0, 5.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.8658390045166, -19.23126220703125, -18.5966854095459, -17.962108612060547, -17.327531814575195, -16.692955017089844, -16.058378219604492, -15.42380142211914, -14.789224624633789, -14.154647827148438, -13.520071029663086, -12.885494232177734, -12.250917434692383, -11.616340637207031, -10.98176383972168, -10.347187042236328, -9.712610244750977, -9.078033447265625, -8.443456649780273, -7.808879852294922, -7.17430305480957, -6.539726257324219, -5.905149459838867, -5.270572662353516, -4.635995864868164, -4.0014190673828125, -3.366842269897461, -2.7322654724121094, -2.097688674926758, -1.4631118774414062, -0.8285350799560547, -0.19395828247070312, 0.44061851501464844, 1.0751953125, 1.7097721099853516, 2.344348907470703, 2.9789257049560547, 3.6135025024414062, 4.248079299926758, 4.882656097412109, 5.517232894897461, 6.1518096923828125, 6.786386489868164, 7.420963287353516, 8.055540084838867, 8.690116882324219, 9.32469367980957, 9.959270477294922, 10.593847274780273, 11.228424072265625, 11.863000869750977, 12.497577667236328, 13.13215446472168, 13.766731262207031, 14.401308059692383, 15.035884857177734, 15.670461654663086, 16.305038452148438, 16.93961524963379, 17.57419204711914, 18.208768844604492, 18.843345642089844, 19.477922439575195, 20.112499237060547, 20.7470760345459]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 10.0, 7.0, 5.0, 13.0, 19.0, 9.0, 15.0, 20.0, 16.0, 27.0, 26.0, 39.0, 30.0, 31.0, 39.0, 43.0, 33.0, 43.0, 34.0, 48.0, 43.0, 48.0, 39.0, 37.0, 28.0, 39.0, 31.0, 35.0, 28.0, 24.0, 18.0, 18.0, 11.0, 22.0, 12.0, 12.0, 10.0, 3.0, 7.0, 5.0, 9.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.38070297241211, -16.81770133972168, -16.25469970703125, -15.69169807434082, -15.12869644165039, -14.565694808959961, -14.002692222595215, -13.439690589904785, -12.876688957214355, -12.313687324523926, -11.750685691833496, -11.187684059143066, -10.62468147277832, -10.06167984008789, -9.498678207397461, -8.935676574707031, -8.372674942016602, -7.809673309326172, -7.246671676635742, -6.683669567108154, -6.120667934417725, -5.557666301727295, -4.994664192199707, -4.431662559509277, -3.8686609268188477, -3.305659294128418, -2.742657423019409, -2.1796555519104004, -1.6166539192199707, -1.053652286529541, -0.4906504154205322, 0.07235145568847656, 0.6353511810302734, 1.1983529329299927, 1.761354684829712, 2.3243565559387207, 2.8873581886291504, 3.45035982131958, 4.013361930847168, 4.576363563537598, 5.139365196228027, 5.702366828918457, 6.265368461608887, 6.828370571136475, 7.391372203826904, 7.954373836517334, 8.517375946044922, 9.080377578735352, 9.643379211425781, 10.206380844116211, 10.76938247680664, 11.33238410949707, 11.8953857421875, 12.45838737487793, 13.021389961242676, 13.584391593933105, 14.147393226623535, 14.710394859313965, 15.273396492004395, 15.836398124694824, 16.39940071105957, 16.96240234375, 17.52540397644043, 18.08840560913086, 18.65140724182129]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 7.0, 4.0, 22.0, 23.0, 26.0, 43.0, 73.0, 98.0, 168.0, 246.0, 361.0, 605.0, 879.0, 1472.0, 2254.0, 3742.0, 5787.0, 9419.0, 14824.0, 23262.0, 36112.0, 54032.0, 77219.0, 102599.0, 123586.0, 131778.0, 124522.0, 103128.0, 77307.0, 54633.0, 36254.0, 23459.0, 14975.0, 9599.0, 5901.0, 3662.0, 2353.0, 1466.0, 926.0, 625.0, 404.0, 249.0, 156.0, 115.0, 62.0, 47.0, 34.0, 15.0, 10.0, 8.0, 4.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.171875, -15.641845703125, -15.11181640625, -14.581787109375, -14.0517578125, -13.521728515625, -12.99169921875, -12.461669921875, -11.931640625, -11.401611328125, -10.87158203125, -10.341552734375, -9.8115234375, -9.281494140625, -8.75146484375, -8.221435546875, -7.69140625, -7.161376953125, -6.63134765625, -6.101318359375, -5.5712890625, -5.041259765625, -4.51123046875, -3.981201171875, -3.451171875, -2.921142578125, -2.39111328125, -1.861083984375, -1.3310546875, -0.801025390625, -0.27099609375, 0.259033203125, 0.7890625, 1.319091796875, 1.84912109375, 2.379150390625, 2.9091796875, 3.439208984375, 3.96923828125, 4.499267578125, 5.029296875, 5.559326171875, 6.08935546875, 6.619384765625, 7.1494140625, 7.679443359375, 8.20947265625, 8.739501953125, 9.26953125, 9.799560546875, 10.32958984375, 10.859619140625, 11.3896484375, 11.919677734375, 12.44970703125, 12.979736328125, 13.509765625, 14.039794921875, 14.56982421875, 15.099853515625, 15.6298828125, 16.159912109375, 16.68994140625, 17.219970703125, 17.75]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 6.0, 7.0, 6.0, 10.0, 8.0, 13.0, 14.0, 16.0, 14.0, 21.0, 23.0, 25.0, 30.0, 42.0, 26.0, 31.0, 44.0, 43.0, 28.0, 39.0, 39.0, 55.0, 38.0, 41.0, 39.0, 41.0, 26.0, 40.0, 27.0, 41.0, 20.0, 18.0, 17.0, 21.0, 13.0, 22.0, 8.0, 9.0, 8.0, 7.0, 6.0, 6.0, 7.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.8984375, -15.3746337890625, -14.850830078125, -14.3270263671875, -13.80322265625, -13.2794189453125, -12.755615234375, -12.2318115234375, -11.7080078125, -11.1842041015625, -10.660400390625, -10.1365966796875, -9.61279296875, -9.0889892578125, -8.565185546875, -8.0413818359375, -7.517578125, -6.9937744140625, -6.469970703125, -5.9461669921875, -5.42236328125, -4.8985595703125, -4.374755859375, -3.8509521484375, -3.3271484375, -2.8033447265625, -2.279541015625, -1.7557373046875, -1.23193359375, -0.7081298828125, -0.184326171875, 0.3394775390625, 0.86328125, 1.3870849609375, 1.910888671875, 2.4346923828125, 2.95849609375, 3.4822998046875, 4.006103515625, 4.5299072265625, 5.0537109375, 5.5775146484375, 6.101318359375, 6.6251220703125, 7.14892578125, 7.6727294921875, 8.196533203125, 8.7203369140625, 9.244140625, 9.7679443359375, 10.291748046875, 10.8155517578125, 11.33935546875, 11.8631591796875, 12.386962890625, 12.9107666015625, 13.4345703125, 13.9583740234375, 14.482177734375, 15.0059814453125, 15.52978515625, 16.0535888671875, 16.577392578125, 17.1011962890625, 17.625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 8.0, 10.0, 19.0, 24.0, 46.0, 62.0, 113.0, 189.0, 283.0, 558.0, 1022.0, 1963.0, 3854.0, 8040.0, 16992.0, 35176.0, 69575.0, 126594.0, 187884.0, 210151.0, 170258.0, 105794.0, 56199.0, 27660.0, 13198.0, 6326.0, 3076.0, 1536.0, 842.0, 443.0, 275.0, 141.0, 85.0, 56.0, 38.0, 18.0, 15.0, 12.0, 7.0, 3.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.5625, -27.67919921875, -26.7958984375, -25.91259765625, -25.029296875, -24.14599609375, -23.2626953125, -22.37939453125, -21.49609375, -20.61279296875, -19.7294921875, -18.84619140625, -17.962890625, -17.07958984375, -16.1962890625, -15.31298828125, -14.4296875, -13.54638671875, -12.6630859375, -11.77978515625, -10.896484375, -10.01318359375, -9.1298828125, -8.24658203125, -7.36328125, -6.47998046875, -5.5966796875, -4.71337890625, -3.830078125, -2.94677734375, -2.0634765625, -1.18017578125, -0.296875, 0.58642578125, 1.4697265625, 2.35302734375, 3.236328125, 4.11962890625, 5.0029296875, 5.88623046875, 6.76953125, 7.65283203125, 8.5361328125, 9.41943359375, 10.302734375, 11.18603515625, 12.0693359375, 12.95263671875, 13.8359375, 14.71923828125, 15.6025390625, 16.48583984375, 17.369140625, 18.25244140625, 19.1357421875, 20.01904296875, 20.90234375, 21.78564453125, 22.6689453125, 23.55224609375, 24.435546875, 25.31884765625, 26.2021484375, 27.08544921875, 27.96875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 9.0, 8.0, 8.0, 12.0, 15.0, 20.0, 16.0, 20.0, 16.0, 23.0, 23.0, 27.0, 33.0, 31.0, 29.0, 40.0, 39.0, 35.0, 37.0, 38.0, 50.0, 41.0, 33.0, 38.0, 31.0, 35.0, 29.0, 25.0, 32.0, 30.0, 27.0, 20.0, 24.0, 13.0, 15.0, 10.0, 11.0, 9.0, 3.0, 6.0, 12.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.890625, -9.5628662109375, -9.235107421875, -8.9073486328125, -8.57958984375, -8.2518310546875, -7.924072265625, -7.5963134765625, -7.2685546875, -6.9407958984375, -6.613037109375, -6.2852783203125, -5.95751953125, -5.6297607421875, -5.302001953125, -4.9742431640625, -4.646484375, -4.3187255859375, -3.990966796875, -3.6632080078125, -3.33544921875, -3.0076904296875, -2.679931640625, -2.3521728515625, -2.0244140625, -1.6966552734375, -1.368896484375, -1.0411376953125, -0.71337890625, -0.3856201171875, -0.057861328125, 0.2698974609375, 0.59765625, 0.9254150390625, 1.253173828125, 1.5809326171875, 1.90869140625, 2.2364501953125, 2.564208984375, 2.8919677734375, 3.2197265625, 3.5474853515625, 3.875244140625, 4.2030029296875, 4.53076171875, 4.8585205078125, 5.186279296875, 5.5140380859375, 5.841796875, 6.1695556640625, 6.497314453125, 6.8250732421875, 7.15283203125, 7.4805908203125, 7.808349609375, 8.1361083984375, 8.4638671875, 8.7916259765625, 9.119384765625, 9.4471435546875, 9.77490234375, 10.1026611328125, 10.430419921875, 10.7581787109375, 11.0859375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 10.0, 9.0, 13.0, 13.0, 16.0, 20.0, 40.0, 75.0, 112.0, 165.0, 256.0, 446.0, 792.0, 1262.0, 2249.0, 3983.0, 7117.0, 13012.0, 23992.0, 44021.0, 77194.0, 128244.0, 177545.0, 190259.0, 152779.0, 98127.0, 56820.0, 31203.0, 17002.0, 9372.0, 5266.0, 2920.0, 1709.0, 1065.0, 545.0, 350.0, 205.0, 133.0, 72.0, 43.0, 40.0, 30.0, 14.0, 9.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.75, -6.52667236328125, -6.3033447265625, -6.08001708984375, -5.856689453125, -5.63336181640625, -5.4100341796875, -5.18670654296875, -4.96337890625, -4.74005126953125, -4.5167236328125, -4.29339599609375, -4.070068359375, -3.84674072265625, -3.6234130859375, -3.40008544921875, -3.1767578125, -2.95343017578125, -2.7301025390625, -2.50677490234375, -2.283447265625, -2.06011962890625, -1.8367919921875, -1.61346435546875, -1.39013671875, -1.16680908203125, -0.9434814453125, -0.72015380859375, -0.496826171875, -0.27349853515625, -0.0501708984375, 0.17315673828125, 0.396484375, 0.61981201171875, 0.8431396484375, 1.06646728515625, 1.289794921875, 1.51312255859375, 1.7364501953125, 1.95977783203125, 2.18310546875, 2.40643310546875, 2.6297607421875, 2.85308837890625, 3.076416015625, 3.29974365234375, 3.5230712890625, 3.74639892578125, 3.9697265625, 4.19305419921875, 4.4163818359375, 4.63970947265625, 4.863037109375, 5.08636474609375, 5.3096923828125, 5.53302001953125, 5.75634765625, 5.97967529296875, 6.2030029296875, 6.42633056640625, 6.649658203125, 6.87298583984375, 7.0963134765625, 7.31964111328125, 7.54296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 13.0, 10.0, 10.0, 16.0, 14.0, 12.0, 21.0, 31.0, 30.0, 27.0, 43.0, 50.0, 57.0, 47.0, 65.0, 55.0, 61.0, 53.0, 50.0, 53.0, 47.0, 42.0, 38.0, 43.0, 19.0, 19.0, 22.0, 8.0, 13.0, 4.0, 5.0, 8.0, 2.0, 2.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006818771362304688, -0.0006601959466934204, -0.0006385147571563721, -0.0006168335676193237, -0.0005951523780822754, -0.000573471188545227, -0.0005517899990081787, -0.0005301088094711304, -0.000508427619934082, -0.0004867464303970337, -0.00046506524085998535, -0.000443384051322937, -0.00042170286178588867, -0.00040002167224884033, -0.000378340482711792, -0.00035665929317474365, -0.0003349781036376953, -0.00031329691410064697, -0.00029161572456359863, -0.0002699345350265503, -0.00024825334548950195, -0.0002265721559524536, -0.00020489096641540527, -0.00018320977687835693, -0.0001615285873413086, -0.00013984739780426025, -0.00011816620826721191, -9.648501873016357e-05, -7.480382919311523e-05, -5.3122639656066895e-05, -3.1441450119018555e-05, -9.760260581970215e-06, 1.1920928955078125e-05, 3.3602118492126465e-05, 5.5283308029174805e-05, 7.696449756622314e-05, 9.864568710327148e-05, 0.00012032687664031982, 0.00014200806617736816, 0.0001636892557144165, 0.00018537044525146484, 0.00020705163478851318, 0.00022873282432556152, 0.00025041401386260986, 0.0002720952033996582, 0.00029377639293670654, 0.0003154575824737549, 0.0003371387720108032, 0.00035881996154785156, 0.0003805011510848999, 0.00040218234062194824, 0.0004238635301589966, 0.0004455447196960449, 0.00046722590923309326, 0.0004889070987701416, 0.0005105882883071899, 0.0005322694778442383, 0.0005539506673812866, 0.000575631856918335, 0.0005973130464553833, 0.0006189942359924316, 0.00064067542552948, 0.0006623566150665283, 0.0006840378046035767, 0.000705718994140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 3.0, 6.0, 7.0, 3.0, 21.0, 22.0, 26.0, 40.0, 62.0, 91.0, 152.0, 222.0, 356.0, 531.0, 904.0, 1526.0, 2624.0, 4707.0, 8441.0, 14890.0, 27291.0, 48287.0, 83246.0, 131362.0, 174683.0, 181170.0, 144838.0, 94676.0, 56228.0, 31616.0, 17460.0, 9899.0, 5490.0, 3168.0, 1763.0, 1021.0, 601.0, 421.0, 218.0, 159.0, 96.0, 68.0, 47.0, 46.0, 24.0, 11.0, 8.0, 5.0, 10.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.1171875, -6.89569091796875, -6.6741943359375, -6.45269775390625, -6.231201171875, -6.00970458984375, -5.7882080078125, -5.56671142578125, -5.34521484375, -5.12371826171875, -4.9022216796875, -4.68072509765625, -4.459228515625, -4.23773193359375, -4.0162353515625, -3.79473876953125, -3.5732421875, -3.35174560546875, -3.1302490234375, -2.90875244140625, -2.687255859375, -2.46575927734375, -2.2442626953125, -2.02276611328125, -1.80126953125, -1.57977294921875, -1.3582763671875, -1.13677978515625, -0.915283203125, -0.69378662109375, -0.4722900390625, -0.25079345703125, -0.029296875, 0.19219970703125, 0.4136962890625, 0.63519287109375, 0.856689453125, 1.07818603515625, 1.2996826171875, 1.52117919921875, 1.74267578125, 1.96417236328125, 2.1856689453125, 2.40716552734375, 2.628662109375, 2.85015869140625, 3.0716552734375, 3.29315185546875, 3.5146484375, 3.73614501953125, 3.9576416015625, 4.17913818359375, 4.400634765625, 4.62213134765625, 4.8436279296875, 5.06512451171875, 5.28662109375, 5.50811767578125, 5.7296142578125, 5.95111083984375, 6.172607421875, 6.39410400390625, 6.6156005859375, 6.83709716796875, 7.05859375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 15.0, 7.0, 11.0, 16.0, 15.0, 18.0, 31.0, 36.0, 43.0, 35.0, 45.0, 45.0, 51.0, 44.0, 57.0, 52.0, 52.0, 45.0, 51.0, 44.0, 45.0, 49.0, 28.0, 36.0, 23.0, 20.0, 16.0, 17.0, 15.0, 11.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.169921875, -2.091461181640625, -2.01300048828125, -1.934539794921875, -1.8560791015625, -1.777618408203125, -1.69915771484375, -1.620697021484375, -1.542236328125, -1.463775634765625, -1.38531494140625, -1.306854248046875, -1.2283935546875, -1.149932861328125, -1.07147216796875, -0.993011474609375, -0.91455078125, -0.836090087890625, -0.75762939453125, -0.679168701171875, -0.6007080078125, -0.522247314453125, -0.44378662109375, -0.365325927734375, -0.286865234375, -0.208404541015625, -0.12994384765625, -0.051483154296875, 0.0269775390625, 0.105438232421875, 0.18389892578125, 0.262359619140625, 0.3408203125, 0.419281005859375, 0.49774169921875, 0.576202392578125, 0.6546630859375, 0.733123779296875, 0.81158447265625, 0.890045166015625, 0.968505859375, 1.046966552734375, 1.12542724609375, 1.203887939453125, 1.2823486328125, 1.360809326171875, 1.43927001953125, 1.517730712890625, 1.59619140625, 1.674652099609375, 1.75311279296875, 1.831573486328125, 1.9100341796875, 1.988494873046875, 2.06695556640625, 2.145416259765625, 2.223876953125, 2.302337646484375, 2.38079833984375, 2.459259033203125, 2.5377197265625, 2.616180419921875, 2.69464111328125, 2.773101806640625, 2.8515625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 3.0, 10.0, 6.0, 11.0, 11.0, 23.0, 11.0, 19.0, 22.0, 23.0, 35.0, 21.0, 40.0, 43.0, 38.0, 43.0, 50.0, 36.0, 39.0, 48.0, 40.0, 42.0, 29.0, 49.0, 42.0, 31.0, 30.0, 30.0, 25.0, 20.0, 19.0, 17.0, 12.0, 19.0, 11.0, 8.0, 8.0, 5.0, 7.0, 8.0, 3.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-18.005413055419922, -17.463844299316406, -16.922273635864258, -16.380704879760742, -15.839134216308594, -15.297565460205078, -14.755995750427246, -14.214426040649414, -13.672856330871582, -13.13128662109375, -12.589716911315918, -12.048147201538086, -11.50657844543457, -10.965007781982422, -10.423439025878906, -9.881869316101074, -9.340299606323242, -8.79872989654541, -8.257160186767578, -7.715590953826904, -7.174021244049072, -6.63245153427124, -6.090882301330566, -5.549312591552734, -5.007742881774902, -4.46617317199707, -3.9246037006378174, -3.3830342292785645, -2.8414645195007324, -2.2998948097229004, -1.7583253383636475, -1.2167558670043945, -0.6751880645751953, -0.13361847400665283, 0.40795111656188965, 0.9495207071304321, 1.4910902976989746, 2.0326600074768066, 2.5742294788360596, 3.1157989501953125, 3.6573686599731445, 4.198938369750977, 4.740508079528809, 5.282077312469482, 5.8236470222473145, 6.3652167320251465, 6.90678596496582, 7.448355674743652, 7.989925384521484, 8.531495094299316, 9.073064804077148, 9.61463451385498, 10.156204223632812, 10.697772979736328, 11.23934268951416, 11.780912399291992, 12.322482109069824, 12.864051818847656, 13.405621528625488, 13.94719123840332, 14.488759994506836, 15.030330657958984, 15.5718994140625, 16.113468170166016, 16.655038833618164]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 5.0, 9.0, 6.0, 7.0, 9.0, 15.0, 21.0, 19.0, 17.0, 24.0, 26.0, 27.0, 35.0, 37.0, 23.0, 27.0, 41.0, 33.0, 31.0, 39.0, 39.0, 41.0, 40.0, 50.0, 27.0, 37.0, 33.0, 27.0, 32.0, 18.0, 22.0, 16.0, 23.0, 16.0, 17.0, 13.0, 17.0, 12.0, 13.0, 6.0, 12.0, 7.0, 12.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-14.920804023742676, -14.411434173583984, -13.90206527709961, -13.392695426940918, -12.883325576782227, -12.373955726623535, -11.864585876464844, -11.355216979980469, -10.845847129821777, -10.336477279663086, -9.827108383178711, -9.31773853302002, -8.808368682861328, -8.298998832702637, -7.7896294593811035, -7.28026008605957, -6.770890235900879, -6.2615203857421875, -5.752151012420654, -5.242781639099121, -4.73341178894043, -4.224041938781738, -3.714672565460205, -3.2053029537200928, -2.6959333419799805, -2.186563730239868, -1.6771941184997559, -1.1678245067596436, -0.6584548950195312, -0.14908528327941895, 0.36028432846069336, 0.8696539402008057, 1.3790245056152344, 1.8883941173553467, 2.397763729095459, 2.9071333408355713, 3.4165029525756836, 3.925872564315796, 4.435242176055908, 4.944611549377441, 5.453981399536133, 5.963351249694824, 6.472720623016357, 6.982089996337891, 7.491459846496582, 8.000829696655273, 8.510198593139648, 9.01956844329834, 9.528938293457031, 10.038308143615723, 10.547677993774414, 11.057046890258789, 11.56641674041748, 12.075786590576172, 12.585155487060547, 13.094525337219238, 13.60389518737793, 14.113265037536621, 14.622634887695312, 15.132003784179688, 15.641373634338379, 16.15074348449707, 16.660112380981445, 17.169483184814453, 17.678852081298828]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 10.0, 7.0, 5.0, 7.0, 15.0, 22.0, 44.0, 73.0, 110.0, 158.0, 230.0, 360.0, 603.0, 913.0, 1465.0, 2242.0, 3742.0, 6271.0, 10273.0, 17562.0, 29545.0, 50735.0, 87725.0, 153359.0, 263578.0, 426571.0, 603873.0, 696353.0, 637667.0, 471372.0, 299881.0, 177249.0, 103211.0, 59399.0, 35051.0, 21294.0, 12886.0, 7750.0, 4683.0, 2914.0, 1809.0, 1193.0, 710.0, 462.0, 325.0, 201.0, 153.0, 64.0, 65.0, 42.0, 28.0, 11.0, 10.0, 8.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-17.28125, -16.735107421875, -16.18896484375, -15.642822265625, -15.0966796875, -14.550537109375, -14.00439453125, -13.458251953125, -12.912109375, -12.365966796875, -11.81982421875, -11.273681640625, -10.7275390625, -10.181396484375, -9.63525390625, -9.089111328125, -8.54296875, -7.996826171875, -7.45068359375, -6.904541015625, -6.3583984375, -5.812255859375, -5.26611328125, -4.719970703125, -4.173828125, -3.627685546875, -3.08154296875, -2.535400390625, -1.9892578125, -1.443115234375, -0.89697265625, -0.350830078125, 0.1953125, 0.741455078125, 1.28759765625, 1.833740234375, 2.3798828125, 2.926025390625, 3.47216796875, 4.018310546875, 4.564453125, 5.110595703125, 5.65673828125, 6.202880859375, 6.7490234375, 7.295166015625, 7.84130859375, 8.387451171875, 8.93359375, 9.479736328125, 10.02587890625, 10.572021484375, 11.1181640625, 11.664306640625, 12.21044921875, 12.756591796875, 13.302734375, 13.848876953125, 14.39501953125, 14.941162109375, 15.4873046875, 16.033447265625, 16.57958984375, 17.125732421875, 17.671875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 5.0, 6.0, 6.0, 9.0, 10.0, 9.0, 14.0, 17.0, 14.0, 13.0, 15.0, 32.0, 29.0, 23.0, 42.0, 29.0, 29.0, 31.0, 28.0, 46.0, 33.0, 31.0, 36.0, 47.0, 31.0, 41.0, 42.0, 44.0, 35.0, 30.0, 17.0, 15.0, 25.0, 20.0, 21.0, 14.0, 20.0, 16.0, 8.0, 11.0, 9.0, 11.0, 9.0, 5.0, 12.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-12.6796875, -12.23828125, -11.796875, -11.35546875, -10.9140625, -10.47265625, -10.03125, -9.58984375, -9.1484375, -8.70703125, -8.265625, -7.82421875, -7.3828125, -6.94140625, -6.5, -6.05859375, -5.6171875, -5.17578125, -4.734375, -4.29296875, -3.8515625, -3.41015625, -2.96875, -2.52734375, -2.0859375, -1.64453125, -1.203125, -0.76171875, -0.3203125, 0.12109375, 0.5625, 1.00390625, 1.4453125, 1.88671875, 2.328125, 2.76953125, 3.2109375, 3.65234375, 4.09375, 4.53515625, 4.9765625, 5.41796875, 5.859375, 6.30078125, 6.7421875, 7.18359375, 7.625, 8.06640625, 8.5078125, 8.94921875, 9.390625, 9.83203125, 10.2734375, 10.71484375, 11.15625, 11.59765625, 12.0390625, 12.48046875, 12.921875, 13.36328125, 13.8046875, 14.24609375, 14.6875, 15.12890625, 15.5703125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 9.0, 11.0, 14.0, 15.0, 22.0, 51.0, 58.0, 113.0, 153.0, 227.0, 323.0, 542.0, 827.0, 1268.0, 1941.0, 3007.0, 4864.0, 7737.0, 12335.0, 20034.0, 32154.0, 52591.0, 83989.0, 134496.0, 206552.0, 307356.0, 424979.0, 530151.0, 572486.0, 525792.0, 419889.0, 300969.0, 202355.0, 130744.0, 81755.0, 50657.0, 31570.0, 19672.0, 12043.0, 7593.0, 4696.0, 2970.0, 1873.0, 1198.0, 752.0, 492.0, 318.0, 222.0, 156.0, 94.0, 62.0, 41.0, 32.0, 15.0, 10.0, 9.0, 3.0, 3.0, 2.0, 6.0], "bins": [-16.375, -15.8707275390625, -15.366455078125, -14.8621826171875, -14.35791015625, -13.8536376953125, -13.349365234375, -12.8450927734375, -12.3408203125, -11.8365478515625, -11.332275390625, -10.8280029296875, -10.32373046875, -9.8194580078125, -9.315185546875, -8.8109130859375, -8.306640625, -7.8023681640625, -7.298095703125, -6.7938232421875, -6.28955078125, -5.7852783203125, -5.281005859375, -4.7767333984375, -4.2724609375, -3.7681884765625, -3.263916015625, -2.7596435546875, -2.25537109375, -1.7510986328125, -1.246826171875, -0.7425537109375, -0.23828125, 0.2659912109375, 0.770263671875, 1.2745361328125, 1.77880859375, 2.2830810546875, 2.787353515625, 3.2916259765625, 3.7958984375, 4.3001708984375, 4.804443359375, 5.3087158203125, 5.81298828125, 6.3172607421875, 6.821533203125, 7.3258056640625, 7.830078125, 8.3343505859375, 8.838623046875, 9.3428955078125, 9.84716796875, 10.3514404296875, 10.855712890625, 11.3599853515625, 11.8642578125, 12.3685302734375, 12.872802734375, 13.3770751953125, 13.88134765625, 14.3856201171875, 14.889892578125, 15.3941650390625, 15.8984375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 5.0, 8.0, 15.0, 15.0, 17.0, 30.0, 24.0, 24.0, 41.0, 47.0, 57.0, 88.0, 104.0, 127.0, 141.0, 183.0, 171.0, 186.0, 219.0, 250.0, 228.0, 255.0, 204.0, 227.0, 198.0, 181.0, 193.0, 134.0, 126.0, 101.0, 86.0, 77.0, 67.0, 46.0, 49.0, 40.0, 20.0, 28.0, 16.0, 8.0, 12.0, 6.0, 8.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.43359375, -7.19549560546875, -6.9573974609375, -6.71929931640625, -6.481201171875, -6.24310302734375, -6.0050048828125, -5.76690673828125, -5.52880859375, -5.29071044921875, -5.0526123046875, -4.81451416015625, -4.576416015625, -4.33831787109375, -4.1002197265625, -3.86212158203125, -3.6240234375, -3.38592529296875, -3.1478271484375, -2.90972900390625, -2.671630859375, -2.43353271484375, -2.1954345703125, -1.95733642578125, -1.71923828125, -1.48114013671875, -1.2430419921875, -1.00494384765625, -0.766845703125, -0.52874755859375, -0.2906494140625, -0.05255126953125, 0.185546875, 0.42364501953125, 0.6617431640625, 0.89984130859375, 1.137939453125, 1.37603759765625, 1.6141357421875, 1.85223388671875, 2.09033203125, 2.32843017578125, 2.5665283203125, 2.80462646484375, 3.042724609375, 3.28082275390625, 3.5189208984375, 3.75701904296875, 3.9951171875, 4.23321533203125, 4.4713134765625, 4.70941162109375, 4.947509765625, 5.18560791015625, 5.4237060546875, 5.66180419921875, 5.89990234375, 6.13800048828125, 6.3760986328125, 6.61419677734375, 6.852294921875, 7.09039306640625, 7.3284912109375, 7.56658935546875, 7.8046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 6.0, 10.0, 13.0, 19.0, 17.0, 19.0, 20.0, 17.0, 27.0, 31.0, 28.0, 30.0, 45.0, 50.0, 34.0, 47.0, 53.0, 63.0, 43.0, 52.0, 53.0, 38.0, 34.0, 32.0, 31.0, 29.0, 26.0, 23.0, 18.0, 15.0, 14.0, 7.0, 13.0, 8.0, 2.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.380870819091797, -17.808752059936523, -17.236631393432617, -16.664512634277344, -16.092391967773438, -15.520273208618164, -14.948153495788574, -14.376033782958984, -13.803914070129395, -13.231794357299805, -12.659674644470215, -12.087554931640625, -11.515436172485352, -10.943315505981445, -10.371196746826172, -9.799077033996582, -9.226957321166992, -8.654837608337402, -8.082717895507812, -7.510598659515381, -6.938478946685791, -6.366359233856201, -5.7942399978637695, -5.22212028503418, -4.65000057220459, -4.077880859375, -3.5057613849639893, -2.9336419105529785, -2.3615221977233887, -1.7894024848937988, -1.217283010482788, -0.6451635360717773, -0.0730438232421875, 0.4990757703781128, 1.071195363998413, 1.6433149576187134, 2.2154345512390137, 2.7875542640686035, 3.3596737384796143, 3.931793212890625, 4.503912925720215, 5.076032638549805, 5.6481523513793945, 6.220271587371826, 6.792391300201416, 7.364511013031006, 7.9366302490234375, 8.508749961853027, 9.080869674682617, 9.652989387512207, 10.225109100341797, 10.797228813171387, 11.369348526000977, 11.94146728515625, 12.51358699798584, 13.08570671081543, 13.65782642364502, 14.22994613647461, 14.8020658493042, 15.374185562133789, 15.946304321289062, 16.51842498779297, 17.090543746948242, 17.662662506103516, 18.234783172607422]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 6.0, 6.0, 4.0, 5.0, 6.0, 10.0, 10.0, 16.0, 14.0, 28.0, 19.0, 15.0, 27.0, 23.0, 24.0, 21.0, 27.0, 34.0, 32.0, 39.0, 36.0, 43.0, 46.0, 41.0, 27.0, 29.0, 42.0, 39.0, 34.0, 34.0, 30.0, 30.0, 21.0, 27.0, 23.0, 21.0, 21.0, 13.0, 15.0, 7.0, 7.0, 6.0, 4.0, 5.0, 4.0, 8.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-14.413839340209961, -13.925719261169434, -13.437599182128906, -12.949479103088379, -12.461359024047852, -11.97323989868164, -11.485118865966797, -10.996999740600586, -10.508879661560059, -10.020759582519531, -9.532639503479004, -9.044519424438477, -8.55639934539795, -8.068279266357422, -7.580159664154053, -7.092040061950684, -6.603919506072998, -6.115799427032471, -5.627679347991943, -5.139559745788574, -4.651439666748047, -4.1633195877075195, -3.675199508666992, -3.187079668045044, -2.6989595890045166, -2.2108395099639893, -1.722719669342041, -1.2345995903015137, -0.7464796304702759, -0.2583596706390381, 0.22976040840148926, 0.7178802490234375, 1.2060003280639648, 1.6941202878952026, 2.1822402477264404, 2.6703603267669678, 3.158480167388916, 3.6466002464294434, 4.134720325469971, 4.62283992767334, 5.110960006713867, 5.5990800857543945, 6.087200164794922, 6.575320243835449, 7.063439846038818, 7.551559925079346, 8.039680480957031, 8.527799606323242, 9.015920639038086, 9.504040718078613, 9.99216079711914, 10.480280876159668, 10.968400955200195, 11.456520080566406, 11.94464111328125, 12.432760238647461, 12.920880317687988, 13.409000396728516, 13.897120475769043, 14.38524055480957, 14.873360633850098, 15.361480712890625, 15.849599838256836, 16.33772087097168, 16.82583999633789]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 12.0, 14.0, 19.0, 37.0, 51.0, 93.0, 131.0, 190.0, 292.0, 438.0, 676.0, 1015.0, 1506.0, 2331.0, 3429.0, 5382.0, 7905.0, 11929.0, 17934.0, 25722.0, 36930.0, 51061.0, 68089.0, 85090.0, 100149.0, 108516.0, 108537.0, 99212.0, 83810.0, 66302.0, 49731.0, 35582.0, 24894.0, 17256.0, 11481.0, 7710.0, 5071.0, 3398.0, 2236.0, 1500.0, 1012.0, 663.0, 411.0, 285.0, 169.0, 124.0, 76.0, 55.0, 26.0, 32.0, 19.0, 9.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.93359375, -6.71661376953125, -6.4996337890625, -6.28265380859375, -6.065673828125, -5.84869384765625, -5.6317138671875, -5.41473388671875, -5.19775390625, -4.98077392578125, -4.7637939453125, -4.54681396484375, -4.329833984375, -4.11285400390625, -3.8958740234375, -3.67889404296875, -3.4619140625, -3.24493408203125, -3.0279541015625, -2.81097412109375, -2.593994140625, -2.37701416015625, -2.1600341796875, -1.94305419921875, -1.72607421875, -1.50909423828125, -1.2921142578125, -1.07513427734375, -0.858154296875, -0.64117431640625, -0.4241943359375, -0.20721435546875, 0.009765625, 0.22674560546875, 0.4437255859375, 0.66070556640625, 0.877685546875, 1.09466552734375, 1.3116455078125, 1.52862548828125, 1.74560546875, 1.96258544921875, 2.1795654296875, 2.39654541015625, 2.613525390625, 2.83050537109375, 3.0474853515625, 3.26446533203125, 3.4814453125, 3.69842529296875, 3.9154052734375, 4.13238525390625, 4.349365234375, 4.56634521484375, 4.7833251953125, 5.00030517578125, 5.21728515625, 5.43426513671875, 5.6512451171875, 5.86822509765625, 6.085205078125, 6.30218505859375, 6.5191650390625, 6.73614501953125, 6.953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 6.0, 4.0, 6.0, 5.0, 5.0, 10.0, 11.0, 15.0, 15.0, 24.0, 22.0, 15.0, 23.0, 26.0, 24.0, 20.0, 29.0, 32.0, 32.0, 35.0, 39.0, 41.0, 43.0, 46.0, 28.0, 26.0, 45.0, 35.0, 34.0, 35.0, 32.0, 30.0, 21.0, 27.0, 24.0, 21.0, 20.0, 15.0, 14.0, 8.0, 8.0, 5.0, 5.0, 4.0, 6.0, 7.0, 10.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-14.5703125, -14.0789794921875, -13.587646484375, -13.0963134765625, -12.60498046875, -12.1136474609375, -11.622314453125, -11.1309814453125, -10.6396484375, -10.1483154296875, -9.656982421875, -9.1656494140625, -8.67431640625, -8.1829833984375, -7.691650390625, -7.2003173828125, -6.708984375, -6.2176513671875, -5.726318359375, -5.2349853515625, -4.74365234375, -4.2523193359375, -3.760986328125, -3.2696533203125, -2.7783203125, -2.2869873046875, -1.795654296875, -1.3043212890625, -0.81298828125, -0.3216552734375, 0.169677734375, 0.6610107421875, 1.15234375, 1.6436767578125, 2.135009765625, 2.6263427734375, 3.11767578125, 3.6090087890625, 4.100341796875, 4.5916748046875, 5.0830078125, 5.5743408203125, 6.065673828125, 6.5570068359375, 7.04833984375, 7.5396728515625, 8.031005859375, 8.5223388671875, 9.013671875, 9.5050048828125, 9.996337890625, 10.4876708984375, 10.97900390625, 11.4703369140625, 11.961669921875, 12.4530029296875, 12.9443359375, 13.4356689453125, 13.927001953125, 14.4183349609375, 14.90966796875, 15.4010009765625, 15.892333984375, 16.3836669921875, 16.875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 1.0, 5.0, 6.0, 6.0, 15.0, 19.0, 28.0, 37.0, 55.0, 84.0, 149.0, 182.0, 295.0, 512.0, 738.0, 1161.0, 1925.0, 3137.0, 5111.0, 8028.0, 13216.0, 21714.0, 41371.0, 709461.0, 167854.0, 28525.0, 17253.0, 10554.0, 6395.0, 3977.0, 2469.0, 1553.0, 981.0, 583.0, 387.0, 259.0, 166.0, 118.0, 55.0, 49.0, 34.0, 36.0, 16.0, 9.0, 10.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-16.296875, -15.76708984375, -15.2373046875, -14.70751953125, -14.177734375, -13.64794921875, -13.1181640625, -12.58837890625, -12.05859375, -11.52880859375, -10.9990234375, -10.46923828125, -9.939453125, -9.40966796875, -8.8798828125, -8.35009765625, -7.8203125, -7.29052734375, -6.7607421875, -6.23095703125, -5.701171875, -5.17138671875, -4.6416015625, -4.11181640625, -3.58203125, -3.05224609375, -2.5224609375, -1.99267578125, -1.462890625, -0.93310546875, -0.4033203125, 0.12646484375, 0.65625, 1.18603515625, 1.7158203125, 2.24560546875, 2.775390625, 3.30517578125, 3.8349609375, 4.36474609375, 4.89453125, 5.42431640625, 5.9541015625, 6.48388671875, 7.013671875, 7.54345703125, 8.0732421875, 8.60302734375, 9.1328125, 9.66259765625, 10.1923828125, 10.72216796875, 11.251953125, 11.78173828125, 12.3115234375, 12.84130859375, 13.37109375, 13.90087890625, 14.4306640625, 14.96044921875, 15.490234375, 16.02001953125, 16.5498046875, 17.07958984375, 17.609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 2.0, 12.0, 8.0, 8.0, 20.0, 19.0, 26.0, 23.0, 23.0, 30.0, 29.0, 29.0, 29.0, 32.0, 39.0, 38.0, 33.0, 41.0, 41.0, 40.0, 34.0, 46.0, 34.0, 37.0, 37.0, 41.0, 32.0, 27.0, 35.0, 10.0, 22.0, 26.0, 14.0, 18.0, 13.0, 12.0, 7.0, 8.0, 2.0, 8.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.21875, -10.809814453125, -10.40087890625, -9.991943359375, -9.5830078125, -9.174072265625, -8.76513671875, -8.356201171875, -7.947265625, -7.538330078125, -7.12939453125, -6.720458984375, -6.3115234375, -5.902587890625, -5.49365234375, -5.084716796875, -4.67578125, -4.266845703125, -3.85791015625, -3.448974609375, -3.0400390625, -2.631103515625, -2.22216796875, -1.813232421875, -1.404296875, -0.995361328125, -0.58642578125, -0.177490234375, 0.2314453125, 0.640380859375, 1.04931640625, 1.458251953125, 1.8671875, 2.276123046875, 2.68505859375, 3.093994140625, 3.5029296875, 3.911865234375, 4.32080078125, 4.729736328125, 5.138671875, 5.547607421875, 5.95654296875, 6.365478515625, 6.7744140625, 7.183349609375, 7.59228515625, 8.001220703125, 8.41015625, 8.819091796875, 9.22802734375, 9.636962890625, 10.0458984375, 10.454833984375, 10.86376953125, 11.272705078125, 11.681640625, 12.090576171875, 12.49951171875, 12.908447265625, 13.3173828125, 13.726318359375, 14.13525390625, 14.544189453125, 14.953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 5.0, 6.0, 4.0, 5.0, 7.0, 7.0, 12.0, 24.0, 21.0, 31.0, 36.0, 62.0, 84.0, 118.0, 154.0, 219.0, 317.0, 540.0, 780.0, 1229.0, 1794.0, 2904.0, 4473.0, 7174.0, 11871.0, 20167.0, 45018.0, 670295.0, 208534.0, 30411.0, 16172.0, 9579.0, 5824.0, 3727.0, 2334.0, 1566.0, 1000.0, 621.0, 466.0, 295.0, 191.0, 132.0, 100.0, 70.0, 48.0, 35.0, 28.0, 21.0, 17.0, 11.0, 10.0, 5.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.91943359375, -0.8895797729492188, -0.8597259521484375, -0.8298721313476562, -0.800018310546875, -0.7701644897460938, -0.7403106689453125, -0.7104568481445312, -0.68060302734375, -0.6507492065429688, -0.6208953857421875, -0.5910415649414062, -0.561187744140625, -0.5313339233398438, -0.5014801025390625, -0.47162628173828125, -0.4417724609375, -0.41191864013671875, -0.3820648193359375, -0.35221099853515625, -0.322357177734375, -0.29250335693359375, -0.2626495361328125, -0.23279571533203125, -0.20294189453125, -0.17308807373046875, -0.1432342529296875, -0.11338043212890625, -0.083526611328125, -0.05367279052734375, -0.0238189697265625, 0.00603485107421875, 0.035888671875, 0.06574249267578125, 0.0955963134765625, 0.12545013427734375, 0.155303955078125, 0.18515777587890625, 0.2150115966796875, 0.24486541748046875, 0.27471923828125, 0.30457305908203125, 0.3344268798828125, 0.36428070068359375, 0.394134521484375, 0.42398834228515625, 0.4538421630859375, 0.48369598388671875, 0.5135498046875, 0.5434036254882812, 0.5732574462890625, 0.6031112670898438, 0.632965087890625, 0.6628189086914062, 0.6926727294921875, 0.7225265502929688, 0.75238037109375, 0.7822341918945312, 0.8120880126953125, 0.8419418334960938, 0.871795654296875, 0.9016494750976562, 0.9315032958984375, 0.9613571166992188, 0.9912109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 8.0, 11.0, 11.0, 16.0, 23.0, 24.0, 23.0, 43.0, 46.0, 44.0, 63.0, 46.0, 54.0, 68.0, 72.0, 59.0, 55.0, 47.0, 39.0, 38.0, 38.0, 28.0, 25.0, 20.0, 17.0, 19.0, 9.0, 9.0, 12.0, 7.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0003559589385986328, -0.0003462545573711395, -0.00033655017614364624, -0.00032684579491615295, -0.00031714141368865967, -0.0003074370324611664, -0.0002977326512336731, -0.0002880282700061798, -0.0002783238887786865, -0.00026861950755119324, -0.00025891512632369995, -0.00024921074509620667, -0.00023950636386871338, -0.0002298019826412201, -0.0002200976014137268, -0.00021039322018623352, -0.00020068883895874023, -0.00019098445773124695, -0.00018128007650375366, -0.00017157569527626038, -0.0001618713140487671, -0.0001521669328212738, -0.00014246255159378052, -0.00013275817036628723, -0.00012305378913879395, -0.00011334940791130066, -0.00010364502668380737, -9.394064545631409e-05, -8.42362642288208e-05, -7.453188300132751e-05, -6.482750177383423e-05, -5.512312054634094e-05, -4.5418739318847656e-05, -3.571435809135437e-05, -2.6009976863861084e-05, -1.6305595636367798e-05, -6.601214408874512e-06, 3.1031668186187744e-06, 1.280754804611206e-05, 2.2511929273605347e-05, 3.221631050109863e-05, 4.192069172859192e-05, 5.1625072956085205e-05, 6.132945418357849e-05, 7.103383541107178e-05, 8.073821663856506e-05, 9.044259786605835e-05, 0.00010014697909355164, 0.00010985136032104492, 0.00011955574154853821, 0.0001292601227760315, 0.00013896450400352478, 0.00014866888523101807, 0.00015837326645851135, 0.00016807764768600464, 0.00017778202891349792, 0.0001874864101409912, 0.0001971907913684845, 0.00020689517259597778, 0.00021659955382347107, 0.00022630393505096436, 0.00023600831627845764, 0.00024571269750595093, 0.0002554170787334442, 0.0002651214599609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 11.0, 7.0, 12.0, 25.0, 40.0, 69.0, 118.0, 161.0, 275.0, 432.0, 703.0, 1046.0, 1674.0, 2966.0, 4974.0, 8902.0, 16386.0, 29424.0, 52093.0, 86048.0, 125679.0, 159835.0, 166256.0, 140869.0, 100919.0, 64614.0, 37627.0, 20693.0, 11281.0, 6350.0, 3590.0, 2052.0, 1288.0, 797.0, 489.0, 308.0, 191.0, 128.0, 89.0, 53.0, 27.0, 19.0, 12.0, 9.0, 6.0, 6.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67529296875, -0.6536483764648438, -0.6320037841796875, -0.6103591918945312, -0.588714599609375, -0.5670700073242188, -0.5454254150390625, -0.5237808227539062, -0.50213623046875, -0.48049163818359375, -0.4588470458984375, -0.43720245361328125, -0.415557861328125, -0.39391326904296875, -0.3722686767578125, -0.35062408447265625, -0.3289794921875, -0.30733489990234375, -0.2856903076171875, -0.26404571533203125, -0.242401123046875, -0.22075653076171875, -0.1991119384765625, -0.17746734619140625, -0.15582275390625, -0.13417816162109375, -0.1125335693359375, -0.09088897705078125, -0.069244384765625, -0.04759979248046875, -0.0259552001953125, -0.00431060791015625, 0.017333984375, 0.03897857666015625, 0.0606231689453125, 0.08226776123046875, 0.103912353515625, 0.12555694580078125, 0.1472015380859375, 0.16884613037109375, 0.19049072265625, 0.21213531494140625, 0.2337799072265625, 0.25542449951171875, 0.277069091796875, 0.29871368408203125, 0.3203582763671875, 0.34200286865234375, 0.3636474609375, 0.38529205322265625, 0.4069366455078125, 0.42858123779296875, 0.450225830078125, 0.47187042236328125, 0.4935150146484375, 0.5151596069335938, 0.53680419921875, 0.5584487915039062, 0.5800933837890625, 0.6017379760742188, 0.623382568359375, 0.6450271606445312, 0.6666717529296875, 0.6883163452148438, 0.7099609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 0.0, 5.0, 16.0, 14.0, 12.0, 10.0, 17.0, 30.0, 25.0, 30.0, 31.0, 38.0, 41.0, 59.0, 44.0, 47.0, 53.0, 37.0, 56.0, 60.0, 55.0, 35.0, 41.0, 42.0, 34.0, 32.0, 26.0, 16.0, 18.0, 20.0, 7.0, 7.0, 5.0, 8.0, 10.0, 6.0, 1.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.309814453125, -0.3017253875732422, -0.2936363220214844, -0.28554725646972656, -0.27745819091796875, -0.26936912536621094, -0.2612800598144531, -0.2531909942626953, -0.2451019287109375, -0.2370128631591797, -0.22892379760742188, -0.22083473205566406, -0.21274566650390625, -0.20465660095214844, -0.19656753540039062, -0.1884784698486328, -0.180389404296875, -0.1723003387451172, -0.16421127319335938, -0.15612220764160156, -0.14803314208984375, -0.13994407653808594, -0.13185501098632812, -0.12376594543457031, -0.1156768798828125, -0.10758781433105469, -0.09949874877929688, -0.09140968322753906, -0.08332061767578125, -0.07523155212402344, -0.06714248657226562, -0.05905342102050781, -0.05096435546875, -0.04287528991699219, -0.034786224365234375, -0.026697158813476562, -0.01860809326171875, -0.010519027709960938, -0.002429962158203125, 0.0056591033935546875, 0.0137481689453125, 0.021837234497070312, 0.029926300048828125, 0.03801536560058594, 0.04610443115234375, 0.05419349670410156, 0.062282562255859375, 0.07037162780761719, 0.078460693359375, 0.08654975891113281, 0.09463882446289062, 0.10272789001464844, 0.11081695556640625, 0.11890602111816406, 0.12699508666992188, 0.1350841522216797, 0.1431732177734375, 0.1512622833251953, 0.15935134887695312, 0.16744041442871094, 0.17552947998046875, 0.18361854553222656, 0.19170761108398438, 0.1997966766357422, 0.2078857421875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 4.0, 3.0, 7.0, 11.0, 10.0, 15.0, 15.0, 12.0, 27.0, 20.0, 25.0, 29.0, 43.0, 30.0, 38.0, 40.0, 56.0, 62.0, 53.0, 51.0, 56.0, 56.0, 52.0, 37.0, 34.0, 34.0, 33.0, 31.0, 19.0, 25.0, 12.0, 10.0, 15.0, 10.0, 4.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-21.834659576416016, -21.208133697509766, -20.58160972595215, -19.9550838470459, -19.32855796813965, -18.70203399658203, -18.07550811767578, -17.44898223876953, -16.82245635986328, -16.19593048095703, -15.569405555725098, -14.942880630493164, -14.316354751586914, -13.68982982635498, -13.063304901123047, -12.436779022216797, -11.81025505065918, -11.183730125427246, -10.557204246520996, -9.930679321289062, -9.304153442382812, -8.677628517150879, -8.051103591918945, -7.4245781898498535, -6.798052787780762, -6.17152738571167, -5.545001983642578, -4.9184770584106445, -4.291951656341553, -3.665426254272461, -3.0389010906219482, -2.4123759269714355, -1.7858524322509766, -1.1593271493911743, -0.5328018665313721, 0.09372341632843018, 0.7202486991882324, 1.3467741012573242, 1.973299264907837, 2.5998244285583496, 3.2263498306274414, 3.852875232696533, 4.479400634765625, 5.105925559997559, 5.73245096206665, 6.358976364135742, 6.985501289367676, 7.612026691436768, 8.23855209350586, 8.865077018737793, 9.491602897644043, 10.118127822875977, 10.744653701782227, 11.37117862701416, 11.997703552246094, 12.624229431152344, 13.250754356384277, 13.877279281616211, 14.503805160522461, 15.130330085754395, 15.756855010986328, 16.383380889892578, 17.009906768798828, 17.636430740356445, 18.262956619262695]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 7.0, 2.0, 7.0, 5.0, 4.0, 7.0, 6.0, 11.0, 11.0, 13.0, 22.0, 24.0, 18.0, 18.0, 24.0, 26.0, 25.0, 18.0, 26.0, 29.0, 41.0, 38.0, 32.0, 48.0, 47.0, 35.0, 28.0, 30.0, 43.0, 36.0, 37.0, 29.0, 34.0, 26.0, 19.0, 26.0, 29.0, 22.0, 20.0, 16.0, 7.0, 10.0, 6.0, 7.0, 4.0, 4.0, 3.0, 11.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-14.431306838989258, -13.94017219543457, -13.449037551879883, -12.957902908325195, -12.466768264770508, -11.97563362121582, -11.484498977661133, -10.993364334106445, -10.502229690551758, -10.01109504699707, -9.519960403442383, -9.028825759887695, -8.537691116333008, -8.04655647277832, -7.555421352386475, -7.064286708831787, -6.573151588439941, -6.082016944885254, -5.590882301330566, -5.099747657775879, -4.608613014221191, -4.117478370666504, -3.626343250274658, -3.1352086067199707, -2.644073963165283, -2.1529393196105957, -1.6618045568466187, -1.1706697940826416, -0.6795351505279541, -0.1884005069732666, 0.302734375, 0.7938690185546875, 1.285003662109375, 1.7761383056640625, 2.26727294921875, 2.7584078311920166, 3.249542474746704, 3.7406771183013916, 4.231812000274658, 4.722946643829346, 5.214081287384033, 5.705215930938721, 6.196350574493408, 6.687485694885254, 7.178620338439941, 7.669754981994629, 8.160889625549316, 8.652024269104004, 9.143158912658691, 9.634293556213379, 10.125428199768066, 10.616562843322754, 11.107697486877441, 11.598832130432129, 12.089967727661133, 12.58110237121582, 13.072237014770508, 13.563371658325195, 14.054506301879883, 14.54564094543457, 15.036775588989258, 15.527910232543945, 16.019044876098633, 16.51017951965332, 17.001314163208008]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 8.0, 6.0, 13.0, 19.0, 18.0, 37.0, 71.0, 63.0, 93.0, 171.0, 237.0, 431.0, 674.0, 1075.0, 1613.0, 2364.0, 3789.0, 6129.0, 9363.0, 14690.0, 22374.0, 33977.0, 49812.0, 69530.0, 91986.0, 111359.0, 122277.0, 120661.0, 106459.0, 85080.0, 63590.0, 44436.0, 30201.0, 20041.0, 12868.0, 8275.0, 5309.0, 3338.0, 2179.0, 1459.0, 849.0, 616.0, 360.0, 238.0, 142.0, 91.0, 75.0, 46.0, 29.0, 14.0, 10.0, 8.0, 7.0, 7.0, 1.0, 2.0], "bins": [-17.21875, -16.7247314453125, -16.230712890625, -15.7366943359375, -15.24267578125, -14.7486572265625, -14.254638671875, -13.7606201171875, -13.2666015625, -12.7725830078125, -12.278564453125, -11.7845458984375, -11.29052734375, -10.7965087890625, -10.302490234375, -9.8084716796875, -9.314453125, -8.8204345703125, -8.326416015625, -7.8323974609375, -7.33837890625, -6.8443603515625, -6.350341796875, -5.8563232421875, -5.3623046875, -4.8682861328125, -4.374267578125, -3.8802490234375, -3.38623046875, -2.8922119140625, -2.398193359375, -1.9041748046875, -1.41015625, -0.9161376953125, -0.422119140625, 0.0718994140625, 0.56591796875, 1.0599365234375, 1.553955078125, 2.0479736328125, 2.5419921875, 3.0360107421875, 3.530029296875, 4.0240478515625, 4.51806640625, 5.0120849609375, 5.506103515625, 6.0001220703125, 6.494140625, 6.9881591796875, 7.482177734375, 7.9761962890625, 8.47021484375, 8.9642333984375, 9.458251953125, 9.9522705078125, 10.4462890625, 10.9403076171875, 11.434326171875, 11.9283447265625, 12.42236328125, 12.9163818359375, 13.410400390625, 13.9044189453125, 14.3984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 5.0, 2.0, 8.0, 4.0, 8.0, 4.0, 6.0, 10.0, 12.0, 17.0, 18.0, 21.0, 23.0, 17.0, 25.0, 25.0, 25.0, 17.0, 32.0, 30.0, 41.0, 35.0, 38.0, 41.0, 48.0, 34.0, 30.0, 32.0, 41.0, 41.0, 29.0, 36.0, 32.0, 23.0, 19.0, 29.0, 32.0, 16.0, 19.0, 12.0, 10.0, 8.0, 8.0, 6.0, 2.0, 6.0, 5.0, 7.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-13.7421875, -13.2718505859375, -12.801513671875, -12.3311767578125, -11.86083984375, -11.3905029296875, -10.920166015625, -10.4498291015625, -9.9794921875, -9.5091552734375, -9.038818359375, -8.5684814453125, -8.09814453125, -7.6278076171875, -7.157470703125, -6.6871337890625, -6.216796875, -5.7464599609375, -5.276123046875, -4.8057861328125, -4.33544921875, -3.8651123046875, -3.394775390625, -2.9244384765625, -2.4541015625, -1.9837646484375, -1.513427734375, -1.0430908203125, -0.57275390625, -0.1024169921875, 0.367919921875, 0.8382568359375, 1.30859375, 1.7789306640625, 2.249267578125, 2.7196044921875, 3.18994140625, 3.6602783203125, 4.130615234375, 4.6009521484375, 5.0712890625, 5.5416259765625, 6.011962890625, 6.4822998046875, 6.95263671875, 7.4229736328125, 7.893310546875, 8.3636474609375, 8.833984375, 9.3043212890625, 9.774658203125, 10.2449951171875, 10.71533203125, 11.1856689453125, 11.656005859375, 12.1263427734375, 12.5966796875, 13.0670166015625, 13.537353515625, 14.0076904296875, 14.47802734375, 14.9483642578125, 15.418701171875, 15.8890380859375, 16.359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 8.0, 14.0, 16.0, 40.0, 55.0, 80.0, 119.0, 207.0, 268.0, 400.0, 601.0, 877.0, 1316.0, 1989.0, 3011.0, 4547.0, 6925.0, 10629.0, 15301.0, 22910.0, 33888.0, 46890.0, 64017.0, 82106.0, 98812.0, 109956.0, 111759.0, 103556.0, 88029.0, 70304.0, 52646.0, 37868.0, 26106.0, 17883.0, 12008.0, 7859.0, 5157.0, 3524.0, 2344.0, 1552.0, 999.0, 699.0, 465.0, 266.0, 178.0, 119.0, 85.0, 63.0, 33.0, 26.0, 18.0, 14.0, 13.0, 5.0, 5.0, 1.0, 1.0], "bins": [-14.953125, -14.5023193359375, -14.051513671875, -13.6007080078125, -13.14990234375, -12.6990966796875, -12.248291015625, -11.7974853515625, -11.3466796875, -10.8958740234375, -10.445068359375, -9.9942626953125, -9.54345703125, -9.0926513671875, -8.641845703125, -8.1910400390625, -7.740234375, -7.2894287109375, -6.838623046875, -6.3878173828125, -5.93701171875, -5.4862060546875, -5.035400390625, -4.5845947265625, -4.1337890625, -3.6829833984375, -3.232177734375, -2.7813720703125, -2.33056640625, -1.8797607421875, -1.428955078125, -0.9781494140625, -0.52734375, -0.0765380859375, 0.374267578125, 0.8250732421875, 1.27587890625, 1.7266845703125, 2.177490234375, 2.6282958984375, 3.0791015625, 3.5299072265625, 3.980712890625, 4.4315185546875, 4.88232421875, 5.3331298828125, 5.783935546875, 6.2347412109375, 6.685546875, 7.1363525390625, 7.587158203125, 8.0379638671875, 8.48876953125, 8.9395751953125, 9.390380859375, 9.8411865234375, 10.2919921875, 10.7427978515625, 11.193603515625, 11.6444091796875, 12.09521484375, 12.5460205078125, 12.996826171875, 13.4476318359375, 13.8984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 9.0, 4.0, 8.0, 8.0, 7.0, 17.0, 12.0, 20.0, 11.0, 21.0, 17.0, 19.0, 23.0, 25.0, 40.0, 26.0, 36.0, 37.0, 50.0, 40.0, 39.0, 42.0, 29.0, 21.0, 33.0, 34.0, 34.0, 39.0, 34.0, 33.0, 38.0, 28.0, 27.0, 22.0, 16.0, 19.0, 18.0, 14.0, 11.0, 6.0, 8.0, 10.0, 4.0, 0.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.3203125, -9.0089111328125, -8.697509765625, -8.3861083984375, -8.07470703125, -7.7633056640625, -7.451904296875, -7.1405029296875, -6.8291015625, -6.5177001953125, -6.206298828125, -5.8948974609375, -5.58349609375, -5.2720947265625, -4.960693359375, -4.6492919921875, -4.337890625, -4.0264892578125, -3.715087890625, -3.4036865234375, -3.09228515625, -2.7808837890625, -2.469482421875, -2.1580810546875, -1.8466796875, -1.5352783203125, -1.223876953125, -0.9124755859375, -0.60107421875, -0.2896728515625, 0.021728515625, 0.3331298828125, 0.64453125, 0.9559326171875, 1.267333984375, 1.5787353515625, 1.89013671875, 2.2015380859375, 2.512939453125, 2.8243408203125, 3.1357421875, 3.4471435546875, 3.758544921875, 4.0699462890625, 4.38134765625, 4.6927490234375, 5.004150390625, 5.3155517578125, 5.626953125, 5.9383544921875, 6.249755859375, 6.5611572265625, 6.87255859375, 7.1839599609375, 7.495361328125, 7.8067626953125, 8.1181640625, 8.4295654296875, 8.740966796875, 9.0523681640625, 9.36376953125, 9.6751708984375, 9.986572265625, 10.2979736328125, 10.609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 7.0, 7.0, 11.0, 22.0, 22.0, 46.0, 54.0, 76.0, 95.0, 137.0, 224.0, 304.0, 410.0, 666.0, 957.0, 1567.0, 2429.0, 3845.0, 6200.0, 10393.0, 17582.0, 30467.0, 51236.0, 83823.0, 124740.0, 159503.0, 166247.0, 139122.0, 97363.0, 60941.0, 36443.0, 21142.0, 12530.0, 7464.0, 4558.0, 2720.0, 1761.0, 1109.0, 721.0, 496.0, 351.0, 226.0, 155.0, 114.0, 84.0, 64.0, 37.0, 36.0, 21.0, 10.0, 7.0, 13.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.6328125, -6.4266357421875, -6.220458984375, -6.0142822265625, -5.80810546875, -5.6019287109375, -5.395751953125, -5.1895751953125, -4.9833984375, -4.7772216796875, -4.571044921875, -4.3648681640625, -4.15869140625, -3.9525146484375, -3.746337890625, -3.5401611328125, -3.333984375, -3.1278076171875, -2.921630859375, -2.7154541015625, -2.50927734375, -2.3031005859375, -2.096923828125, -1.8907470703125, -1.6845703125, -1.4783935546875, -1.272216796875, -1.0660400390625, -0.85986328125, -0.6536865234375, -0.447509765625, -0.2413330078125, -0.03515625, 0.1710205078125, 0.377197265625, 0.5833740234375, 0.78955078125, 0.9957275390625, 1.201904296875, 1.4080810546875, 1.6142578125, 1.8204345703125, 2.026611328125, 2.2327880859375, 2.43896484375, 2.6451416015625, 2.851318359375, 3.0574951171875, 3.263671875, 3.4698486328125, 3.676025390625, 3.8822021484375, 4.08837890625, 4.2945556640625, 4.500732421875, 4.7069091796875, 4.9130859375, 5.1192626953125, 5.325439453125, 5.5316162109375, 5.73779296875, 5.9439697265625, 6.150146484375, 6.3563232421875, 6.5625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 13.0, 21.0, 15.0, 28.0, 34.0, 45.0, 44.0, 53.0, 67.0, 89.0, 81.0, 82.0, 74.0, 74.0, 62.0, 48.0, 47.0, 35.0, 21.0, 19.0, 10.0, 11.0, 7.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008153915405273438, -0.0007837414741516113, -0.0007520914077758789, -0.0007204413414001465, -0.0006887912750244141, -0.0006571412086486816, -0.0006254911422729492, -0.0005938410758972168, -0.0005621910095214844, -0.000530540943145752, -0.0004988908767700195, -0.0004672408103942871, -0.0004355907440185547, -0.00040394067764282227, -0.00037229061126708984, -0.0003406405448913574, -0.000308990478515625, -0.0002773404121398926, -0.00024569034576416016, -0.00021404027938842773, -0.0001823902130126953, -0.0001507401466369629, -0.00011909008026123047, -8.744001388549805e-05, -5.5789947509765625e-05, -2.4139881134033203e-05, 7.510185241699219e-06, 3.916025161743164e-05, 7.081031799316406e-05, 0.00010246038436889648, 0.0001341104507446289, 0.00016576051712036133, 0.00019741058349609375, 0.00022906064987182617, 0.0002607107162475586, 0.000292360782623291, 0.00032401084899902344, 0.00035566091537475586, 0.0003873109817504883, 0.0004189610481262207, 0.0004506111145019531, 0.00048226118087768555, 0.000513911247253418, 0.0005455613136291504, 0.0005772113800048828, 0.0006088614463806152, 0.0006405115127563477, 0.0006721615791320801, 0.0007038116455078125, 0.0007354617118835449, 0.0007671117782592773, 0.0007987618446350098, 0.0008304119110107422, 0.0008620619773864746, 0.000893712043762207, 0.0009253621101379395, 0.0009570121765136719, 0.0009886622428894043, 0.0010203123092651367, 0.0010519623756408691, 0.0010836124420166016, 0.001115262508392334, 0.0011469125747680664, 0.0011785626411437988, 0.0012102127075195312]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 6.0, 11.0, 14.0, 23.0, 33.0, 59.0, 79.0, 118.0, 174.0, 255.0, 389.0, 553.0, 834.0, 1377.0, 2241.0, 3503.0, 5777.0, 9845.0, 16963.0, 29772.0, 52271.0, 87794.0, 134667.0, 170555.0, 174080.0, 136972.0, 91267.0, 54278.0, 30891.0, 17753.0, 10075.0, 5992.0, 3616.0, 2208.0, 1464.0, 926.0, 531.0, 391.0, 280.0, 152.0, 123.0, 82.0, 58.0, 36.0, 20.0, 19.0, 11.0, 9.0, 2.0, 4.0, 6.0, 2.0], "bins": [-8.390625, -8.15777587890625, -7.9249267578125, -7.69207763671875, -7.459228515625, -7.22637939453125, -6.9935302734375, -6.76068115234375, -6.52783203125, -6.29498291015625, -6.0621337890625, -5.82928466796875, -5.596435546875, -5.36358642578125, -5.1307373046875, -4.89788818359375, -4.6650390625, -4.43218994140625, -4.1993408203125, -3.96649169921875, -3.733642578125, -3.50079345703125, -3.2679443359375, -3.03509521484375, -2.80224609375, -2.56939697265625, -2.3365478515625, -2.10369873046875, -1.870849609375, -1.63800048828125, -1.4051513671875, -1.17230224609375, -0.939453125, -0.70660400390625, -0.4737548828125, -0.24090576171875, -0.008056640625, 0.22479248046875, 0.4576416015625, 0.69049072265625, 0.92333984375, 1.15618896484375, 1.3890380859375, 1.62188720703125, 1.854736328125, 2.08758544921875, 2.3204345703125, 2.55328369140625, 2.7861328125, 3.01898193359375, 3.2518310546875, 3.48468017578125, 3.717529296875, 3.95037841796875, 4.1832275390625, 4.41607666015625, 4.64892578125, 4.88177490234375, 5.1146240234375, 5.34747314453125, 5.580322265625, 5.81317138671875, 6.0460205078125, 6.27886962890625, 6.51171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 3.0, 2.0, 7.0, 11.0, 14.0, 17.0, 22.0, 23.0, 25.0, 27.0, 30.0, 33.0, 29.0, 45.0, 43.0, 44.0, 57.0, 46.0, 56.0, 46.0, 49.0, 49.0, 52.0, 37.0, 22.0, 35.0, 32.0, 23.0, 23.0, 21.0, 17.0, 11.0, 8.0, 10.0, 3.0, 2.0, 7.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.619140625, -2.54010009765625, -2.4610595703125, -2.38201904296875, -2.302978515625, -2.22393798828125, -2.1448974609375, -2.06585693359375, -1.98681640625, -1.90777587890625, -1.8287353515625, -1.74969482421875, -1.670654296875, -1.59161376953125, -1.5125732421875, -1.43353271484375, -1.3544921875, -1.27545166015625, -1.1964111328125, -1.11737060546875, -1.038330078125, -0.95928955078125, -0.8802490234375, -0.80120849609375, -0.72216796875, -0.64312744140625, -0.5640869140625, -0.48504638671875, -0.406005859375, -0.32696533203125, -0.2479248046875, -0.16888427734375, -0.08984375, -0.01080322265625, 0.0682373046875, 0.14727783203125, 0.226318359375, 0.30535888671875, 0.3843994140625, 0.46343994140625, 0.54248046875, 0.62152099609375, 0.7005615234375, 0.77960205078125, 0.858642578125, 0.93768310546875, 1.0167236328125, 1.09576416015625, 1.1748046875, 1.25384521484375, 1.3328857421875, 1.41192626953125, 1.490966796875, 1.57000732421875, 1.6490478515625, 1.72808837890625, 1.80712890625, 1.88616943359375, 1.9652099609375, 2.04425048828125, 2.123291015625, 2.20233154296875, 2.2813720703125, 2.36041259765625, 2.439453125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 6.0, 6.0, 4.0, 6.0, 8.0, 9.0, 15.0, 13.0, 11.0, 25.0, 13.0, 37.0, 23.0, 25.0, 28.0, 35.0, 46.0, 48.0, 52.0, 43.0, 38.0, 52.0, 51.0, 50.0, 47.0, 41.0, 33.0, 31.0, 27.0, 31.0, 30.0, 9.0, 17.0, 26.0, 17.0, 11.0, 1.0, 6.0, 6.0, 5.0, 5.0, 1.0, 9.0, 0.0, 3.0, 4.0, 1.0, 3.0, 1.0], "bins": [-19.92853355407715, -19.375043869018555, -18.821556091308594, -18.26806640625, -17.714576721191406, -17.161087036132812, -16.60759925842285, -16.054109573364258, -15.500619888305664, -14.947131156921387, -14.393641471862793, -13.840152740478516, -13.286663055419922, -12.733174324035645, -12.179685592651367, -11.626195907592773, -11.072707176208496, -10.519218444824219, -9.965728759765625, -9.412240028381348, -8.858750343322754, -8.305261611938477, -7.751772403717041, -7.1982831954956055, -6.64479398727417, -6.091304779052734, -5.537815570831299, -4.984326362609863, -4.430837631225586, -3.8773481845855713, -3.323859214782715, -2.7703700065612793, -2.2168807983398438, -1.6633915901184082, -1.1099025011062622, -0.5564134120941162, -0.002924203872680664, 0.5505650043487549, 1.1040539741516113, 1.6575431823730469, 2.2110323905944824, 2.764521598815918, 3.3180108070373535, 3.87149977684021, 4.424988746643066, 4.97847843170166, 5.5319671630859375, 6.085456371307373, 6.638945579528809, 7.192434787750244, 7.74592399597168, 8.299412727355957, 8.85290241241455, 9.406391143798828, 9.959880828857422, 10.5133695602417, 11.066858291625977, 11.620347023010254, 12.173836708068848, 12.727325439453125, 13.280815124511719, 13.834303855895996, 14.387792587280273, 14.941282272338867, 15.494771957397461]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 4.0, 10.0, 8.0, 14.0, 11.0, 19.0, 10.0, 19.0, 11.0, 28.0, 26.0, 28.0, 26.0, 37.0, 28.0, 36.0, 32.0, 28.0, 37.0, 39.0, 41.0, 32.0, 50.0, 43.0, 28.0, 23.0, 46.0, 30.0, 28.0, 29.0, 29.0, 16.0, 16.0, 17.0, 14.0, 23.0, 17.0, 10.0, 10.0, 9.0, 4.0, 4.0, 8.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-14.991277694702148, -14.489485740661621, -13.987693786621094, -13.485901832580566, -12.984109878540039, -12.482318878173828, -11.9805269241333, -11.478734970092773, -10.976943016052246, -10.475151062011719, -9.973359107971191, -9.471567153930664, -8.969776153564453, -8.46798324584961, -7.966192245483398, -7.464400291442871, -6.962608337402344, -6.460816383361816, -5.959024429321289, -5.45723295211792, -4.955440998077393, -4.453649044036865, -3.951857328414917, -3.4500656127929688, -2.9482736587524414, -2.446481704711914, -1.9446899890899658, -1.442898154258728, -0.9411063194274902, -0.4393143653869629, 0.06247735023498535, 0.5642690658569336, 1.0660591125488281, 1.567850947380066, 2.0696427822113037, 2.571434497833252, 3.0732264518737793, 3.5750184059143066, 4.076809883117676, 4.578601837158203, 5.0803937911987305, 5.582185745239258, 6.083977699279785, 6.585769176483154, 7.087561130523682, 7.589353084564209, 8.091144561767578, 8.592936515808105, 9.094728469848633, 9.59652042388916, 10.098312377929688, 10.600104331970215, 11.101896286010742, 11.603687286376953, 12.10547924041748, 12.607271194458008, 13.109063148498535, 13.610855102539062, 14.11264705657959, 14.614439010620117, 15.116230010986328, 15.618022918701172, 16.119813919067383, 16.621604919433594, 17.123397827148438]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 10.0, 10.0, 17.0, 32.0, 47.0, 64.0, 102.0, 182.0, 195.0, 390.0, 586.0, 865.0, 1405.0, 2198.0, 3631.0, 5606.0, 9228.0, 15276.0, 25292.0, 43179.0, 73530.0, 127043.0, 216126.0, 352708.0, 519330.0, 649089.0, 659019.0, 542114.0, 377116.0, 234385.0, 138404.0, 80785.0, 46706.0, 27413.0, 16171.0, 9939.0, 6081.0, 3702.0, 2306.0, 1471.0, 928.0, 551.0, 371.0, 243.0, 175.0, 90.0, 63.0, 35.0, 29.0, 25.0, 4.0, 13.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-16.828125, -16.3193359375, -15.810546875, -15.3017578125, -14.79296875, -14.2841796875, -13.775390625, -13.2666015625, -12.7578125, -12.2490234375, -11.740234375, -11.2314453125, -10.72265625, -10.2138671875, -9.705078125, -9.1962890625, -8.6875, -8.1787109375, -7.669921875, -7.1611328125, -6.65234375, -6.1435546875, -5.634765625, -5.1259765625, -4.6171875, -4.1083984375, -3.599609375, -3.0908203125, -2.58203125, -2.0732421875, -1.564453125, -1.0556640625, -0.546875, -0.0380859375, 0.470703125, 0.9794921875, 1.48828125, 1.9970703125, 2.505859375, 3.0146484375, 3.5234375, 4.0322265625, 4.541015625, 5.0498046875, 5.55859375, 6.0673828125, 6.576171875, 7.0849609375, 7.59375, 8.1025390625, 8.611328125, 9.1201171875, 9.62890625, 10.1376953125, 10.646484375, 11.1552734375, 11.6640625, 12.1728515625, 12.681640625, 13.1904296875, 13.69921875, 14.2080078125, 14.716796875, 15.2255859375, 15.734375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 7.0, 6.0, 7.0, 16.0, 14.0, 15.0, 10.0, 19.0, 19.0, 24.0, 26.0, 20.0, 30.0, 33.0, 32.0, 38.0, 24.0, 34.0, 43.0, 35.0, 40.0, 41.0, 36.0, 42.0, 38.0, 27.0, 40.0, 33.0, 21.0, 32.0, 28.0, 23.0, 19.0, 13.0, 15.0, 18.0, 11.0, 16.0, 12.0, 8.0, 6.0, 2.0, 7.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.796875, -12.3558349609375, -11.914794921875, -11.4737548828125, -11.03271484375, -10.5916748046875, -10.150634765625, -9.7095947265625, -9.2685546875, -8.8275146484375, -8.386474609375, -7.9454345703125, -7.50439453125, -7.0633544921875, -6.622314453125, -6.1812744140625, -5.740234375, -5.2991943359375, -4.858154296875, -4.4171142578125, -3.97607421875, -3.5350341796875, -3.093994140625, -2.6529541015625, -2.2119140625, -1.7708740234375, -1.329833984375, -0.8887939453125, -0.44775390625, -0.0067138671875, 0.434326171875, 0.8753662109375, 1.31640625, 1.7574462890625, 2.198486328125, 2.6395263671875, 3.08056640625, 3.5216064453125, 3.962646484375, 4.4036865234375, 4.8447265625, 5.2857666015625, 5.726806640625, 6.1678466796875, 6.60888671875, 7.0499267578125, 7.490966796875, 7.9320068359375, 8.373046875, 8.8140869140625, 9.255126953125, 9.6961669921875, 10.13720703125, 10.5782470703125, 11.019287109375, 11.4603271484375, 11.9013671875, 12.3424072265625, 12.783447265625, 13.2244873046875, 13.66552734375, 14.1065673828125, 14.547607421875, 14.9886474609375, 15.4296875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 5.0, 8.0, 9.0, 10.0, 19.0, 27.0, 50.0, 59.0, 135.0, 181.0, 281.0, 416.0, 675.0, 1021.0, 1577.0, 2374.0, 3709.0, 5747.0, 9020.0, 14345.0, 23171.0, 36682.0, 58229.0, 92301.0, 144130.0, 218827.0, 317519.0, 427718.0, 519981.0, 552900.0, 504110.0, 405549.0, 294484.0, 200967.0, 131265.0, 83926.0, 53030.0, 33369.0, 20637.0, 12965.0, 8235.0, 5113.0, 3394.0, 2137.0, 1379.0, 906.0, 600.0, 388.0, 236.0, 139.0, 113.0, 72.0, 56.0, 39.0, 23.0, 10.0, 13.0, 4.0, 6.0, 4.0, 2.0], "bins": [-15.453125, -14.97607421875, -14.4990234375, -14.02197265625, -13.544921875, -13.06787109375, -12.5908203125, -12.11376953125, -11.63671875, -11.15966796875, -10.6826171875, -10.20556640625, -9.728515625, -9.25146484375, -8.7744140625, -8.29736328125, -7.8203125, -7.34326171875, -6.8662109375, -6.38916015625, -5.912109375, -5.43505859375, -4.9580078125, -4.48095703125, -4.00390625, -3.52685546875, -3.0498046875, -2.57275390625, -2.095703125, -1.61865234375, -1.1416015625, -0.66455078125, -0.1875, 0.28955078125, 0.7666015625, 1.24365234375, 1.720703125, 2.19775390625, 2.6748046875, 3.15185546875, 3.62890625, 4.10595703125, 4.5830078125, 5.06005859375, 5.537109375, 6.01416015625, 6.4912109375, 6.96826171875, 7.4453125, 7.92236328125, 8.3994140625, 8.87646484375, 9.353515625, 9.83056640625, 10.3076171875, 10.78466796875, 11.26171875, 11.73876953125, 12.2158203125, 12.69287109375, 13.169921875, 13.64697265625, 14.1240234375, 14.60107421875, 15.078125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 6.0, 3.0, 2.0, 6.0, 6.0, 10.0, 8.0, 23.0, 13.0, 19.0, 24.0, 44.0, 41.0, 61.0, 46.0, 74.0, 95.0, 98.0, 80.0, 122.0, 138.0, 154.0, 150.0, 191.0, 202.0, 199.0, 217.0, 211.0, 219.0, 181.0, 168.0, 152.0, 153.0, 125.0, 129.0, 117.0, 89.0, 88.0, 77.0, 68.0, 51.0, 37.0, 32.0, 22.0, 23.0, 30.0, 22.0, 15.0, 13.0, 13.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-6.265625, -6.06707763671875, -5.8685302734375, -5.66998291015625, -5.471435546875, -5.27288818359375, -5.0743408203125, -4.87579345703125, -4.67724609375, -4.47869873046875, -4.2801513671875, -4.08160400390625, -3.883056640625, -3.68450927734375, -3.4859619140625, -3.28741455078125, -3.0888671875, -2.89031982421875, -2.6917724609375, -2.49322509765625, -2.294677734375, -2.09613037109375, -1.8975830078125, -1.69903564453125, -1.50048828125, -1.30194091796875, -1.1033935546875, -0.90484619140625, -0.706298828125, -0.50775146484375, -0.3092041015625, -0.11065673828125, 0.087890625, 0.28643798828125, 0.4849853515625, 0.68353271484375, 0.882080078125, 1.08062744140625, 1.2791748046875, 1.47772216796875, 1.67626953125, 1.87481689453125, 2.0733642578125, 2.27191162109375, 2.470458984375, 2.66900634765625, 2.8675537109375, 3.06610107421875, 3.2646484375, 3.46319580078125, 3.6617431640625, 3.86029052734375, 4.058837890625, 4.25738525390625, 4.4559326171875, 4.65447998046875, 4.85302734375, 5.05157470703125, 5.2501220703125, 5.44866943359375, 5.647216796875, 5.84576416015625, 6.0443115234375, 6.24285888671875, 6.44140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 1.0, 7.0, 7.0, 4.0, 9.0, 14.0, 16.0, 18.0, 15.0, 11.0, 27.0, 25.0, 34.0, 37.0, 52.0, 45.0, 48.0, 49.0, 60.0, 57.0, 46.0, 68.0, 53.0, 45.0, 37.0, 35.0, 37.0, 21.0, 27.0, 22.0, 13.0, 17.0, 9.0, 10.0, 3.0, 6.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.549909591674805, -21.91442108154297, -21.278934478759766, -20.64344596862793, -20.007957458496094, -19.37247085571289, -18.736982345581055, -18.10149383544922, -17.466007232666016, -16.83051872253418, -16.195032119750977, -15.55954360961914, -14.924055099487305, -14.288567543029785, -13.653079986572266, -13.01759147644043, -12.382102966308594, -11.746615409851074, -11.111126899719238, -10.475639343261719, -9.840150833129883, -9.204663276672363, -8.569175720214844, -7.933687686920166, -7.298199653625488, -6.6627116203308105, -6.027223587036133, -5.391736030578613, -4.7562479972839355, -4.120759963989258, -3.485272169113159, -2.8497843742370605, -2.21429443359375, -1.5788065195083618, -0.9433186054229736, -0.30783069133758545, 0.32765722274780273, 0.9631452560424805, 1.598633050918579, 2.2341208457946777, 2.8696088790893555, 3.505096912384033, 4.140584945678711, 4.7760725021362305, 5.411560535430908, 6.047048568725586, 6.6825361251831055, 7.318024158477783, 7.953512191772461, 8.58899974822998, 9.224488258361816, 9.859975814819336, 10.495464324951172, 11.130951881408691, 11.766439437866211, 12.401927947998047, 13.037415504455566, 13.672903060913086, 14.308391571044922, 14.943879127502441, 15.579366683959961, 16.214855194091797, 16.850343704223633, 17.485830307006836, 18.121318817138672]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 4.0, 6.0, 8.0, 5.0, 6.0, 7.0, 11.0, 12.0, 14.0, 9.0, 15.0, 23.0, 26.0, 29.0, 25.0, 30.0, 36.0, 33.0, 40.0, 33.0, 32.0, 35.0, 42.0, 46.0, 42.0, 37.0, 29.0, 35.0, 28.0, 32.0, 35.0, 27.0, 22.0, 33.0, 28.0, 24.0, 11.0, 19.0, 15.0, 11.0, 12.0, 7.0, 4.0, 8.0, 6.0, 2.0, 3.0, 2.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0], "bins": [-16.6811466217041, -16.18553924560547, -15.689933776855469, -15.194326400756836, -14.69871997833252, -14.203113555908203, -13.707507133483887, -13.21190071105957, -12.716293334960938, -12.220686912536621, -11.725080490112305, -11.229473114013672, -10.733866691589355, -10.238260269165039, -9.742653846740723, -9.247047424316406, -8.75144100189209, -8.255834579467773, -7.760227680206299, -7.264621257781982, -6.769014358520508, -6.273407936096191, -5.777801513671875, -5.282195091247559, -4.786588191986084, -4.290981769561768, -3.795374870300293, -3.2997684478759766, -2.804161787033081, -2.3085551261901855, -1.8129487037658691, -1.3173420429229736, -0.8217363357543945, -0.3261297345161438, 0.16947686672210693, 0.6650834083557129, 1.1606900691986084, 1.656296730041504, 2.1519031524658203, 2.647509813308716, 3.1431164741516113, 3.638723134994507, 4.134329795837402, 4.629936218261719, 5.125542640686035, 5.62114953994751, 6.116755962371826, 6.612362861633301, 7.107969284057617, 7.603575706481934, 8.09918212890625, 8.594789505004883, 9.0903959274292, 9.586002349853516, 10.081608772277832, 10.577215194702148, 11.072822570800781, 11.568428993225098, 12.064035415649414, 12.559642791748047, 13.055249214172363, 13.55085563659668, 14.046462059020996, 14.542068481445312, 15.037674903869629]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 3.0, 7.0, 6.0, 9.0, 8.0, 15.0, 21.0, 27.0, 57.0, 73.0, 108.0, 174.0, 273.0, 435.0, 685.0, 1134.0, 1871.0, 2984.0, 5087.0, 8387.0, 13579.0, 21903.0, 35126.0, 53589.0, 78417.0, 105274.0, 128774.0, 137491.0, 127945.0, 104704.0, 77275.0, 52625.0, 34315.0, 21924.0, 13222.0, 8233.0, 5020.0, 2982.0, 1833.0, 1132.0, 673.0, 434.0, 247.0, 139.0, 124.0, 63.0, 48.0, 29.0, 29.0, 14.0, 16.0, 8.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-6.75390625, -6.53936767578125, -6.3248291015625, -6.11029052734375, -5.895751953125, -5.68121337890625, -5.4666748046875, -5.25213623046875, -5.03759765625, -4.82305908203125, -4.6085205078125, -4.39398193359375, -4.179443359375, -3.96490478515625, -3.7503662109375, -3.53582763671875, -3.3212890625, -3.10675048828125, -2.8922119140625, -2.67767333984375, -2.463134765625, -2.24859619140625, -2.0340576171875, -1.81951904296875, -1.60498046875, -1.39044189453125, -1.1759033203125, -0.96136474609375, -0.746826171875, -0.53228759765625, -0.3177490234375, -0.10321044921875, 0.111328125, 0.32586669921875, 0.5404052734375, 0.75494384765625, 0.969482421875, 1.18402099609375, 1.3985595703125, 1.61309814453125, 1.82763671875, 2.04217529296875, 2.2567138671875, 2.47125244140625, 2.685791015625, 2.90032958984375, 3.1148681640625, 3.32940673828125, 3.5439453125, 3.75848388671875, 3.9730224609375, 4.18756103515625, 4.402099609375, 4.61663818359375, 4.8311767578125, 5.04571533203125, 5.26025390625, 5.47479248046875, 5.6893310546875, 5.90386962890625, 6.118408203125, 6.33294677734375, 6.5474853515625, 6.76202392578125, 6.9765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 7.0, 8.0, 5.0, 5.0, 8.0, 11.0, 12.0, 15.0, 8.0, 16.0, 23.0, 27.0, 25.0, 28.0, 33.0, 34.0, 33.0, 33.0, 34.0, 37.0, 34.0, 41.0, 44.0, 42.0, 35.0, 30.0, 37.0, 28.0, 30.0, 36.0, 25.0, 25.0, 29.0, 32.0, 18.0, 14.0, 22.0, 16.0, 12.0, 9.0, 9.0, 4.0, 8.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-16.640625, -16.1446533203125, -15.648681640625, -15.1527099609375, -14.65673828125, -14.1607666015625, -13.664794921875, -13.1688232421875, -12.6728515625, -12.1768798828125, -11.680908203125, -11.1849365234375, -10.68896484375, -10.1929931640625, -9.697021484375, -9.2010498046875, -8.705078125, -8.2091064453125, -7.713134765625, -7.2171630859375, -6.72119140625, -6.2252197265625, -5.729248046875, -5.2332763671875, -4.7373046875, -4.2413330078125, -3.745361328125, -3.2493896484375, -2.75341796875, -2.2574462890625, -1.761474609375, -1.2655029296875, -0.76953125, -0.2735595703125, 0.222412109375, 0.7183837890625, 1.21435546875, 1.7103271484375, 2.206298828125, 2.7022705078125, 3.1982421875, 3.6942138671875, 4.190185546875, 4.6861572265625, 5.18212890625, 5.6781005859375, 6.174072265625, 6.6700439453125, 7.166015625, 7.6619873046875, 8.157958984375, 8.6539306640625, 9.14990234375, 9.6458740234375, 10.141845703125, 10.6378173828125, 11.1337890625, 11.6297607421875, 12.125732421875, 12.6217041015625, 13.11767578125, 13.6136474609375, 14.109619140625, 14.6055908203125, 15.1015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 9.0, 14.0, 13.0, 12.0, 24.0, 44.0, 45.0, 75.0, 122.0, 208.0, 319.0, 520.0, 885.0, 1575.0, 2887.0, 5336.0, 9895.0, 18874.0, 38503.0, 793631.0, 118256.0, 27021.0, 13791.0, 7293.0, 4008.0, 2217.0, 1174.0, 690.0, 407.0, 242.0, 160.0, 94.0, 64.0, 34.0, 41.0, 20.0, 17.0, 9.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.46875, -18.8359375, -18.203125, -17.5703125, -16.9375, -16.3046875, -15.671875, -15.0390625, -14.40625, -13.7734375, -13.140625, -12.5078125, -11.875, -11.2421875, -10.609375, -9.9765625, -9.34375, -8.7109375, -8.078125, -7.4453125, -6.8125, -6.1796875, -5.546875, -4.9140625, -4.28125, -3.6484375, -3.015625, -2.3828125, -1.75, -1.1171875, -0.484375, 0.1484375, 0.78125, 1.4140625, 2.046875, 2.6796875, 3.3125, 3.9453125, 4.578125, 5.2109375, 5.84375, 6.4765625, 7.109375, 7.7421875, 8.375, 9.0078125, 9.640625, 10.2734375, 10.90625, 11.5390625, 12.171875, 12.8046875, 13.4375, 14.0703125, 14.703125, 15.3359375, 15.96875, 16.6015625, 17.234375, 17.8671875, 18.5, 19.1328125, 19.765625, 20.3984375, 21.03125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 2.0, 5.0, 7.0, 11.0, 18.0, 21.0, 18.0, 19.0, 21.0, 39.0, 33.0, 27.0, 37.0, 39.0, 42.0, 48.0, 52.0, 44.0, 36.0, 41.0, 43.0, 49.0, 49.0, 37.0, 30.0, 31.0, 34.0, 23.0, 20.0, 28.0, 19.0, 16.0, 8.0, 10.0, 7.0, 6.0, 5.0, 7.0, 6.0, 6.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9921875, -11.5811767578125, -11.170166015625, -10.7591552734375, -10.34814453125, -9.9371337890625, -9.526123046875, -9.1151123046875, -8.7041015625, -8.2930908203125, -7.882080078125, -7.4710693359375, -7.06005859375, -6.6490478515625, -6.238037109375, -5.8270263671875, -5.416015625, -5.0050048828125, -4.593994140625, -4.1829833984375, -3.77197265625, -3.3609619140625, -2.949951171875, -2.5389404296875, -2.1279296875, -1.7169189453125, -1.305908203125, -0.8948974609375, -0.48388671875, -0.0728759765625, 0.338134765625, 0.7491455078125, 1.16015625, 1.5711669921875, 1.982177734375, 2.3931884765625, 2.80419921875, 3.2152099609375, 3.626220703125, 4.0372314453125, 4.4482421875, 4.8592529296875, 5.270263671875, 5.6812744140625, 6.09228515625, 6.5032958984375, 6.914306640625, 7.3253173828125, 7.736328125, 8.1473388671875, 8.558349609375, 8.9693603515625, 9.38037109375, 9.7913818359375, 10.202392578125, 10.6134033203125, 11.0244140625, 11.4354248046875, 11.846435546875, 12.2574462890625, 12.66845703125, 13.0794677734375, 13.490478515625, 13.9014892578125, 14.3125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 11.0, 14.0, 14.0, 22.0, 46.0, 41.0, 60.0, 94.0, 139.0, 191.0, 351.0, 541.0, 969.0, 1992.0, 4254.0, 10378.0, 29779.0, 781047.0, 180566.0, 22304.0, 8289.0, 3525.0, 1645.0, 906.0, 500.0, 273.0, 174.0, 134.0, 75.0, 58.0, 31.0, 22.0, 15.0, 18.0, 14.0, 16.0, 4.0, 6.0, 10.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.404296875, -2.3311767578125, -2.258056640625, -2.1849365234375, -2.11181640625, -2.0386962890625, -1.965576171875, -1.8924560546875, -1.8193359375, -1.7462158203125, -1.673095703125, -1.5999755859375, -1.52685546875, -1.4537353515625, -1.380615234375, -1.3074951171875, -1.234375, -1.1612548828125, -1.088134765625, -1.0150146484375, -0.94189453125, -0.8687744140625, -0.795654296875, -0.7225341796875, -0.6494140625, -0.5762939453125, -0.503173828125, -0.4300537109375, -0.35693359375, -0.2838134765625, -0.210693359375, -0.1375732421875, -0.064453125, 0.0086669921875, 0.081787109375, 0.1549072265625, 0.22802734375, 0.3011474609375, 0.374267578125, 0.4473876953125, 0.5205078125, 0.5936279296875, 0.666748046875, 0.7398681640625, 0.81298828125, 0.8861083984375, 0.959228515625, 1.0323486328125, 1.10546875, 1.1785888671875, 1.251708984375, 1.3248291015625, 1.39794921875, 1.4710693359375, 1.544189453125, 1.6173095703125, 1.6904296875, 1.7635498046875, 1.836669921875, 1.9097900390625, 1.98291015625, 2.0560302734375, 2.129150390625, 2.2022705078125, 2.275390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 6.0, 3.0, 6.0, 5.0, 8.0, 15.0, 15.0, 13.0, 15.0, 13.0, 20.0, 28.0, 36.0, 28.0, 44.0, 69.0, 52.0, 60.0, 59.0, 66.0, 59.0, 51.0, 50.0, 32.0, 47.0, 44.0, 26.0, 25.0, 18.0, 9.0, 12.0, 12.0, 13.0, 9.0, 7.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.00018978118896484375, -0.000184500589966774, -0.00017921999096870422, -0.00017393939197063446, -0.0001686587929725647, -0.00016337819397449493, -0.00015809759497642517, -0.0001528169959783554, -0.00014753639698028564, -0.00014225579798221588, -0.00013697519898414612, -0.00013169459998607635, -0.0001264140009880066, -0.00012113340198993683, -0.00011585280299186707, -0.0001105722039937973, -0.00010529160499572754, -0.00010001100599765778, -9.473040699958801e-05, -8.944980800151825e-05, -8.416920900344849e-05, -7.888861000537872e-05, -7.360801100730896e-05, -6.83274120092392e-05, -6.304681301116943e-05, -5.776621401309967e-05, -5.248561501502991e-05, -4.7205016016960144e-05, -4.192441701889038e-05, -3.664381802082062e-05, -3.1363219022750854e-05, -2.608262002468109e-05, -2.0802021026611328e-05, -1.5521422028541565e-05, -1.0240823030471802e-05, -4.9602240324020386e-06, 3.203749656677246e-07, 5.600973963737488e-06, 1.0881572961807251e-05, 1.6162171959877014e-05, 2.1442770957946777e-05, 2.672336995601654e-05, 3.2003968954086304e-05, 3.728456795215607e-05, 4.256516695022583e-05, 4.784576594829559e-05, 5.3126364946365356e-05, 5.840696394443512e-05, 6.368756294250488e-05, 6.896816194057465e-05, 7.424876093864441e-05, 7.952935993671417e-05, 8.480995893478394e-05, 9.00905579328537e-05, 9.537115693092346e-05, 0.00010065175592899323, 0.00010593235492706299, 0.00011121295392513275, 0.00011649355292320251, 0.00012177415192127228, 0.00012705475091934204, 0.0001323353499174118, 0.00013761594891548157, 0.00014289654791355133, 0.0001481771469116211]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 9.0, 10.0, 15.0, 23.0, 24.0, 31.0, 47.0, 77.0, 91.0, 120.0, 160.0, 259.0, 322.0, 446.0, 631.0, 902.0, 1235.0, 1797.0, 2650.0, 4159.0, 6686.0, 12521.0, 26132.0, 61765.0, 146102.0, 258523.0, 257651.0, 145916.0, 61961.0, 26078.0, 12415.0, 6864.0, 4008.0, 2700.0, 1759.0, 1275.0, 903.0, 597.0, 453.0, 321.0, 266.0, 202.0, 113.0, 95.0, 70.0, 37.0, 45.0, 31.0, 26.0, 14.0, 10.0, 3.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.435546875, -1.39068603515625, -1.3458251953125, -1.30096435546875, -1.256103515625, -1.21124267578125, -1.1663818359375, -1.12152099609375, -1.07666015625, -1.03179931640625, -0.9869384765625, -0.94207763671875, -0.897216796875, -0.85235595703125, -0.8074951171875, -0.76263427734375, -0.7177734375, -0.67291259765625, -0.6280517578125, -0.58319091796875, -0.538330078125, -0.49346923828125, -0.4486083984375, -0.40374755859375, -0.35888671875, -0.31402587890625, -0.2691650390625, -0.22430419921875, -0.179443359375, -0.13458251953125, -0.0897216796875, -0.04486083984375, 0.0, 0.04486083984375, 0.0897216796875, 0.13458251953125, 0.179443359375, 0.22430419921875, 0.2691650390625, 0.31402587890625, 0.35888671875, 0.40374755859375, 0.4486083984375, 0.49346923828125, 0.538330078125, 0.58319091796875, 0.6280517578125, 0.67291259765625, 0.7177734375, 0.76263427734375, 0.8074951171875, 0.85235595703125, 0.897216796875, 0.94207763671875, 0.9869384765625, 1.03179931640625, 1.07666015625, 1.12152099609375, 1.1663818359375, 1.21124267578125, 1.256103515625, 1.30096435546875, 1.3458251953125, 1.39068603515625, 1.435546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 8.0, 10.0, 13.0, 12.0, 25.0, 19.0, 27.0, 37.0, 43.0, 53.0, 57.0, 73.0, 85.0, 69.0, 66.0, 66.0, 67.0, 46.0, 50.0, 34.0, 18.0, 19.0, 13.0, 16.0, 13.0, 9.0, 9.0, 7.0, 3.0, 3.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.46630859375, -0.4535064697265625, -0.440704345703125, -0.4279022216796875, -0.41510009765625, -0.4022979736328125, -0.389495849609375, -0.3766937255859375, -0.3638916015625, -0.3510894775390625, -0.338287353515625, -0.3254852294921875, -0.31268310546875, -0.2998809814453125, -0.287078857421875, -0.2742767333984375, -0.261474609375, -0.2486724853515625, -0.235870361328125, -0.2230682373046875, -0.21026611328125, -0.1974639892578125, -0.184661865234375, -0.1718597412109375, -0.1590576171875, -0.1462554931640625, -0.133453369140625, -0.1206512451171875, -0.10784912109375, -0.0950469970703125, -0.082244873046875, -0.0694427490234375, -0.056640625, -0.0438385009765625, -0.031036376953125, -0.0182342529296875, -0.00543212890625, 0.0073699951171875, 0.020172119140625, 0.0329742431640625, 0.0457763671875, 0.0585784912109375, 0.071380615234375, 0.0841827392578125, 0.09698486328125, 0.1097869873046875, 0.122589111328125, 0.1353912353515625, 0.148193359375, 0.1609954833984375, 0.173797607421875, 0.1865997314453125, 0.19940185546875, 0.2122039794921875, 0.225006103515625, 0.2378082275390625, 0.2506103515625, 0.2634124755859375, 0.276214599609375, 0.2890167236328125, 0.30181884765625, 0.3146209716796875, 0.327423095703125, 0.3402252197265625, 0.35302734375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 14.0, 7.0, 10.0, 8.0, 7.0, 23.0, 16.0, 20.0, 30.0, 38.0, 30.0, 40.0, 39.0, 40.0, 53.0, 61.0, 53.0, 50.0, 61.0, 44.0, 59.0, 39.0, 37.0, 31.0, 41.0, 28.0, 17.0, 19.0, 18.0, 14.0, 11.0, 5.0, 9.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-22.50246810913086, -21.878021240234375, -21.25357437133789, -20.62912940979004, -20.004682540893555, -19.38023567199707, -18.755788803100586, -18.131343841552734, -17.50689697265625, -16.882450103759766, -16.25800323486328, -15.633557319641113, -15.009111404418945, -14.384664535522461, -13.760217666625977, -13.135771751403809, -12.511324882507324, -11.88687801361084, -11.262432098388672, -10.637985229492188, -10.01353931427002, -9.389092445373535, -8.764646530151367, -8.140199661254883, -7.515753269195557, -6.8913068771362305, -6.266860485076904, -5.642414093017578, -5.017967224121094, -4.393521308898926, -3.7690744400024414, -3.1446280479431152, -2.520181655883789, -1.895735263824463, -1.2712887525558472, -0.6468422412872314, -0.022395849227905273, 0.6020505428314209, 1.2264971733093262, 1.8509435653686523, 2.4753899574279785, 3.0998363494873047, 3.724282741546631, 4.348729133605957, 4.973176002502441, 5.597621917724609, 6.222068786621094, 6.84651517868042, 7.470961570739746, 8.09540843963623, 8.719854354858398, 9.344301223754883, 9.96874713897705, 10.593194007873535, 11.217639923095703, 11.842086791992188, 12.466533660888672, 13.090980529785156, 13.715426445007324, 14.339873313903809, 14.964319229125977, 15.588766098022461, 16.213212966918945, 16.837657928466797, 17.46210479736328]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 4.0, 7.0, 11.0, 11.0, 11.0, 12.0, 13.0, 20.0, 21.0, 28.0, 21.0, 25.0, 36.0, 30.0, 32.0, 36.0, 35.0, 34.0, 35.0, 47.0, 36.0, 44.0, 35.0, 35.0, 32.0, 29.0, 27.0, 33.0, 28.0, 22.0, 27.0, 33.0, 24.0, 12.0, 20.0, 15.0, 13.0, 12.0, 8.0, 3.0, 5.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0], "bins": [-16.397401809692383, -15.907699584960938, -15.417997360229492, -14.928296089172363, -14.438593864440918, -13.948891639709473, -13.459190368652344, -12.969488143920898, -12.479785919189453, -11.990083694458008, -11.500381469726562, -11.010680198669434, -10.520977973937988, -10.031275749206543, -9.541574478149414, -9.051872253417969, -8.562170028686523, -8.072467803955078, -7.582766056060791, -7.093064308166504, -6.603362083435059, -6.113659858703613, -5.623958110809326, -5.134256362915039, -4.644554138183594, -4.154851913452148, -3.6651501655578613, -3.175448179244995, -2.685746192932129, -2.1960442066192627, -1.7063422203063965, -1.2166402339935303, -0.7269392013549805, -0.23723721504211426, 0.25246477127075195, 0.7421667575836182, 1.2318687438964844, 1.7215707302093506, 2.211272716522217, 2.700974702835083, 3.190676689147949, 3.6803786754608154, 4.170080661773682, 4.659782409667969, 5.149484634399414, 5.639186859130859, 6.1288886070251465, 6.618590354919434, 7.108292579650879, 7.597994804382324, 8.087696075439453, 8.577398300170898, 9.067100524902344, 9.556802749633789, 10.046504974365234, 10.536206245422363, 11.025908470153809, 11.515610694885254, 12.005311965942383, 12.495014190673828, 12.984716415405273, 13.474418640136719, 13.964120864868164, 14.453822135925293, 14.943524360656738]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 11.0, 16.0, 33.0, 34.0, 58.0, 90.0, 134.0, 248.0, 357.0, 601.0, 961.0, 1633.0, 2382.0, 3941.0, 6262.0, 9619.0, 15173.0, 23643.0, 35746.0, 51521.0, 70706.0, 91636.0, 109447.0, 119570.0, 117140.0, 104669.0, 85282.0, 63499.0, 46308.0, 30977.0, 20858.0, 13259.0, 8456.0, 5296.0, 3271.0, 2115.0, 1321.0, 842.0, 539.0, 322.0, 208.0, 142.0, 91.0, 47.0, 41.0, 15.0, 7.0, 12.0, 2.0, 8.0, 1.0, 3.0, 1.0, 1.0], "bins": [-15.671875, -15.208740234375, -14.74560546875, -14.282470703125, -13.8193359375, -13.356201171875, -12.89306640625, -12.429931640625, -11.966796875, -11.503662109375, -11.04052734375, -10.577392578125, -10.1142578125, -9.651123046875, -9.18798828125, -8.724853515625, -8.26171875, -7.798583984375, -7.33544921875, -6.872314453125, -6.4091796875, -5.946044921875, -5.48291015625, -5.019775390625, -4.556640625, -4.093505859375, -3.63037109375, -3.167236328125, -2.7041015625, -2.240966796875, -1.77783203125, -1.314697265625, -0.8515625, -0.388427734375, 0.07470703125, 0.537841796875, 1.0009765625, 1.464111328125, 1.92724609375, 2.390380859375, 2.853515625, 3.316650390625, 3.77978515625, 4.242919921875, 4.7060546875, 5.169189453125, 5.63232421875, 6.095458984375, 6.55859375, 7.021728515625, 7.48486328125, 7.947998046875, 8.4111328125, 8.874267578125, 9.33740234375, 9.800537109375, 10.263671875, 10.726806640625, 11.18994140625, 11.653076171875, 12.1162109375, 12.579345703125, 13.04248046875, 13.505615234375, 13.96875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 3.0, 7.0, 8.0, 12.0, 11.0, 13.0, 10.0, 17.0, 20.0, 30.0, 25.0, 26.0, 32.0, 33.0, 28.0, 44.0, 29.0, 31.0, 35.0, 42.0, 52.0, 37.0, 40.0, 33.0, 33.0, 29.0, 25.0, 33.0, 29.0, 24.0, 27.0, 31.0, 23.0, 17.0, 20.0, 15.0, 13.0, 11.0, 6.0, 6.0, 3.0, 7.0, 4.0, 2.0, 2.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0], "bins": [-15.921875, -15.4483642578125, -14.974853515625, -14.5013427734375, -14.02783203125, -13.5543212890625, -13.080810546875, -12.6072998046875, -12.1337890625, -11.6602783203125, -11.186767578125, -10.7132568359375, -10.23974609375, -9.7662353515625, -9.292724609375, -8.8192138671875, -8.345703125, -7.8721923828125, -7.398681640625, -6.9251708984375, -6.45166015625, -5.9781494140625, -5.504638671875, -5.0311279296875, -4.5576171875, -4.0841064453125, -3.610595703125, -3.1370849609375, -2.66357421875, -2.1900634765625, -1.716552734375, -1.2430419921875, -0.76953125, -0.2960205078125, 0.177490234375, 0.6510009765625, 1.12451171875, 1.5980224609375, 2.071533203125, 2.5450439453125, 3.0185546875, 3.4920654296875, 3.965576171875, 4.4390869140625, 4.91259765625, 5.3861083984375, 5.859619140625, 6.3331298828125, 6.806640625, 7.2801513671875, 7.753662109375, 8.2271728515625, 8.70068359375, 9.1741943359375, 9.647705078125, 10.1212158203125, 10.5947265625, 11.0682373046875, 11.541748046875, 12.0152587890625, 12.48876953125, 12.9622802734375, 13.435791015625, 13.9093017578125, 14.3828125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 9.0, 2.0, 10.0, 29.0, 41.0, 62.0, 102.0, 149.0, 253.0, 389.0, 622.0, 1052.0, 1660.0, 2878.0, 4560.0, 7514.0, 12332.0, 20129.0, 31619.0, 49214.0, 71503.0, 97323.0, 120811.0, 132918.0, 129766.0, 111049.0, 85150.0, 60507.0, 39964.0, 25693.0, 16029.0, 9833.0, 5935.0, 3684.0, 2247.0, 1352.0, 854.0, 504.0, 288.0, 185.0, 119.0, 85.0, 60.0, 33.0, 13.0, 8.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-16.796875, -16.2994384765625, -15.802001953125, -15.3045654296875, -14.80712890625, -14.3096923828125, -13.812255859375, -13.3148193359375, -12.8173828125, -12.3199462890625, -11.822509765625, -11.3250732421875, -10.82763671875, -10.3302001953125, -9.832763671875, -9.3353271484375, -8.837890625, -8.3404541015625, -7.843017578125, -7.3455810546875, -6.84814453125, -6.3507080078125, -5.853271484375, -5.3558349609375, -4.8583984375, -4.3609619140625, -3.863525390625, -3.3660888671875, -2.86865234375, -2.3712158203125, -1.873779296875, -1.3763427734375, -0.87890625, -0.3814697265625, 0.115966796875, 0.6134033203125, 1.11083984375, 1.6082763671875, 2.105712890625, 2.6031494140625, 3.1005859375, 3.5980224609375, 4.095458984375, 4.5928955078125, 5.09033203125, 5.5877685546875, 6.085205078125, 6.5826416015625, 7.080078125, 7.5775146484375, 8.074951171875, 8.5723876953125, 9.06982421875, 9.5672607421875, 10.064697265625, 10.5621337890625, 11.0595703125, 11.5570068359375, 12.054443359375, 12.5518798828125, 13.04931640625, 13.5467529296875, 14.044189453125, 14.5416259765625, 15.0390625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 4.0, 8.0, 12.0, 10.0, 17.0, 24.0, 16.0, 18.0, 23.0, 28.0, 26.0, 24.0, 30.0, 39.0, 39.0, 37.0, 48.0, 38.0, 57.0, 43.0, 45.0, 45.0, 41.0, 44.0, 44.0, 27.0, 29.0, 33.0, 25.0, 20.0, 16.0, 15.0, 16.0, 18.0, 8.0, 12.0, 4.0, 3.0, 2.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.984375, -9.623779296875, -9.26318359375, -8.902587890625, -8.5419921875, -8.181396484375, -7.82080078125, -7.460205078125, -7.099609375, -6.739013671875, -6.37841796875, -6.017822265625, -5.6572265625, -5.296630859375, -4.93603515625, -4.575439453125, -4.21484375, -3.854248046875, -3.49365234375, -3.133056640625, -2.7724609375, -2.411865234375, -2.05126953125, -1.690673828125, -1.330078125, -0.969482421875, -0.60888671875, -0.248291015625, 0.1123046875, 0.472900390625, 0.83349609375, 1.194091796875, 1.5546875, 1.915283203125, 2.27587890625, 2.636474609375, 2.9970703125, 3.357666015625, 3.71826171875, 4.078857421875, 4.439453125, 4.800048828125, 5.16064453125, 5.521240234375, 5.8818359375, 6.242431640625, 6.60302734375, 6.963623046875, 7.32421875, 7.684814453125, 8.04541015625, 8.406005859375, 8.7666015625, 9.127197265625, 9.48779296875, 9.848388671875, 10.208984375, 10.569580078125, 10.93017578125, 11.290771484375, 11.6513671875, 12.011962890625, 12.37255859375, 12.733154296875, 13.09375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 11.0, 13.0, 27.0, 35.0, 39.0, 81.0, 119.0, 184.0, 406.0, 679.0, 1614.0, 4335.0, 14057.0, 52391.0, 192113.0, 396462.0, 270869.0, 82699.0, 21812.0, 6349.0, 2266.0, 911.0, 437.0, 224.0, 140.0, 109.0, 56.0, 33.0, 25.0, 21.0, 12.0, 6.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.6932373046875, -17.167724609375, -16.6422119140625, -16.11669921875, -15.5911865234375, -15.065673828125, -14.5401611328125, -14.0146484375, -13.4891357421875, -12.963623046875, -12.4381103515625, -11.91259765625, -11.3870849609375, -10.861572265625, -10.3360595703125, -9.810546875, -9.2850341796875, -8.759521484375, -8.2340087890625, -7.70849609375, -7.1829833984375, -6.657470703125, -6.1319580078125, -5.6064453125, -5.0809326171875, -4.555419921875, -4.0299072265625, -3.50439453125, -2.9788818359375, -2.453369140625, -1.9278564453125, -1.40234375, -0.8768310546875, -0.351318359375, 0.1741943359375, 0.69970703125, 1.2252197265625, 1.750732421875, 2.2762451171875, 2.8017578125, 3.3272705078125, 3.852783203125, 4.3782958984375, 4.90380859375, 5.4293212890625, 5.954833984375, 6.4803466796875, 7.005859375, 7.5313720703125, 8.056884765625, 8.5823974609375, 9.10791015625, 9.6334228515625, 10.158935546875, 10.6844482421875, 11.2099609375, 11.7354736328125, 12.260986328125, 12.7864990234375, 13.31201171875, 13.8375244140625, 14.363037109375, 14.8885498046875, 15.4140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 3.0, 9.0, 9.0, 13.0, 13.0, 22.0, 32.0, 27.0, 29.0, 34.0, 40.0, 47.0, 56.0, 57.0, 59.0, 51.0, 47.0, 51.0, 67.0, 46.0, 53.0, 43.0, 37.0, 21.0, 24.0, 14.0, 23.0, 16.0, 12.0, 8.0, 7.0, 2.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007190704345703125, -0.0006963014602661133, -0.0006735324859619141, -0.0006507635116577148, -0.0006279945373535156, -0.0006052255630493164, -0.0005824565887451172, -0.000559687614440918, -0.0005369186401367188, -0.0005141496658325195, -0.0004913806915283203, -0.0004686117172241211, -0.0004458427429199219, -0.00042307376861572266, -0.00040030479431152344, -0.0003775358200073242, -0.000354766845703125, -0.0003319978713989258, -0.00030922889709472656, -0.00028645992279052734, -0.0002636909484863281, -0.0002409219741821289, -0.0002181529998779297, -0.00019538402557373047, -0.00017261505126953125, -0.00014984607696533203, -0.0001270771026611328, -0.0001043081283569336, -8.153915405273438e-05, -5.8770179748535156e-05, -3.600120544433594e-05, -1.3232231140136719e-05, 9.5367431640625e-06, 3.230571746826172e-05, 5.507469177246094e-05, 7.784366607666016e-05, 0.00010061264038085938, 0.0001233816146850586, 0.0001461505889892578, 0.00016891956329345703, 0.00019168853759765625, 0.00021445751190185547, 0.0002372264862060547, 0.0002599954605102539, 0.0002827644348144531, 0.00030553340911865234, 0.00032830238342285156, 0.0003510713577270508, 0.00037384033203125, 0.0003966093063354492, 0.00041937828063964844, 0.00044214725494384766, 0.0004649162292480469, 0.0004876852035522461, 0.0005104541778564453, 0.0005332231521606445, 0.0005559921264648438, 0.000578761100769043, 0.0006015300750732422, 0.0006242990493774414, 0.0006470680236816406, 0.0006698369979858398, 0.0006926059722900391, 0.0007153749465942383, 0.0007381439208984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 6.0, 5.0, 7.0, 15.0, 21.0, 21.0, 41.0, 32.0, 58.0, 83.0, 91.0, 161.0, 229.0, 346.0, 519.0, 947.0, 1568.0, 2856.0, 5785.0, 11895.0, 25205.0, 55294.0, 114009.0, 192926.0, 234606.0, 189525.0, 110551.0, 53319.0, 24577.0, 11433.0, 5385.0, 2750.0, 1586.0, 936.0, 559.0, 386.0, 249.0, 162.0, 111.0, 92.0, 62.0, 46.0, 33.0, 23.0, 11.0, 10.0, 12.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0], "bins": [-10.3828125, -10.0816650390625, -9.780517578125, -9.4793701171875, -9.17822265625, -8.8770751953125, -8.575927734375, -8.2747802734375, -7.9736328125, -7.6724853515625, -7.371337890625, -7.0701904296875, -6.76904296875, -6.4678955078125, -6.166748046875, -5.8656005859375, -5.564453125, -5.2633056640625, -4.962158203125, -4.6610107421875, -4.35986328125, -4.0587158203125, -3.757568359375, -3.4564208984375, -3.1552734375, -2.8541259765625, -2.552978515625, -2.2518310546875, -1.95068359375, -1.6495361328125, -1.348388671875, -1.0472412109375, -0.74609375, -0.4449462890625, -0.143798828125, 0.1573486328125, 0.45849609375, 0.7596435546875, 1.060791015625, 1.3619384765625, 1.6630859375, 1.9642333984375, 2.265380859375, 2.5665283203125, 2.86767578125, 3.1688232421875, 3.469970703125, 3.7711181640625, 4.072265625, 4.3734130859375, 4.674560546875, 4.9757080078125, 5.27685546875, 5.5780029296875, 5.879150390625, 6.1802978515625, 6.4814453125, 6.7825927734375, 7.083740234375, 7.3848876953125, 7.68603515625, 7.9871826171875, 8.288330078125, 8.5894775390625, 8.890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 11.0, 13.0, 14.0, 15.0, 26.0, 21.0, 47.0, 52.0, 35.0, 60.0, 82.0, 62.0, 82.0, 82.0, 64.0, 63.0, 62.0, 38.0, 40.0, 28.0, 23.0, 16.0, 11.0, 9.0, 10.0, 6.0, 8.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.78515625, -3.680908203125, -3.57666015625, -3.472412109375, -3.3681640625, -3.263916015625, -3.15966796875, -3.055419921875, -2.951171875, -2.846923828125, -2.74267578125, -2.638427734375, -2.5341796875, -2.429931640625, -2.32568359375, -2.221435546875, -2.1171875, -2.012939453125, -1.90869140625, -1.804443359375, -1.7001953125, -1.595947265625, -1.49169921875, -1.387451171875, -1.283203125, -1.178955078125, -1.07470703125, -0.970458984375, -0.8662109375, -0.761962890625, -0.65771484375, -0.553466796875, -0.44921875, -0.344970703125, -0.24072265625, -0.136474609375, -0.0322265625, 0.072021484375, 0.17626953125, 0.280517578125, 0.384765625, 0.489013671875, 0.59326171875, 0.697509765625, 0.8017578125, 0.906005859375, 1.01025390625, 1.114501953125, 1.21875, 1.322998046875, 1.42724609375, 1.531494140625, 1.6357421875, 1.739990234375, 1.84423828125, 1.948486328125, 2.052734375, 2.156982421875, 2.26123046875, 2.365478515625, 2.4697265625, 2.573974609375, 2.67822265625, 2.782470703125, 2.88671875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 9.0, 9.0, 12.0, 11.0, 19.0, 14.0, 22.0, 38.0, 27.0, 44.0, 44.0, 50.0, 61.0, 60.0, 73.0, 73.0, 61.0, 59.0, 44.0, 49.0, 35.0, 25.0, 35.0, 30.0, 18.0, 26.0, 10.0, 11.0, 7.0, 6.0, 6.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.60324478149414, -21.90143585205078, -21.199628829956055, -20.497819900512695, -19.79601287841797, -19.09420394897461, -18.392396926879883, -17.690587997436523, -16.988780975341797, -16.286972045898438, -15.585165023803711, -14.883357048034668, -14.181549072265625, -13.479741096496582, -12.777933120727539, -12.07612419128418, -11.374316215515137, -10.672508239746094, -9.97070026397705, -9.268892288208008, -8.567084312438965, -7.865276336669922, -7.163467884063721, -6.461659908294678, -5.759851932525635, -5.058043956756592, -4.356235980987549, -3.6544277667999268, -2.952619791030884, -2.250811815261841, -1.5490036010742188, -0.8471956253051758, -0.1453876495361328, 0.5564203858375549, 1.2582284212112427, 1.9600365161895752, 2.661844491958618, 3.363652467727661, 4.065460681915283, 4.767268657684326, 5.469076633453369, 6.170884609222412, 6.872692584991455, 7.574501037597656, 8.2763090133667, 8.978116989135742, 9.679924964904785, 10.381732940673828, 11.083540916442871, 11.785348892211914, 12.487156867980957, 13.18896484375, 13.890772819519043, 14.592580795288086, 15.294389724731445, 15.996196746826172, 16.69800567626953, 17.39981460571289, 18.101621627807617, 18.803430557250977, 19.505237579345703, 20.207046508789062, 20.90885353088379, 21.61066246032715, 22.312469482421875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 2.0, 3.0, 4.0, 4.0, 3.0, 8.0, 9.0, 10.0, 14.0, 8.0, 9.0, 19.0, 26.0, 29.0, 28.0, 33.0, 26.0, 30.0, 32.0, 21.0, 36.0, 35.0, 41.0, 26.0, 38.0, 36.0, 36.0, 40.0, 38.0, 37.0, 28.0, 26.0, 41.0, 32.0, 36.0, 14.0, 18.0, 21.0, 11.0, 15.0, 14.0, 12.0, 6.0, 5.0, 7.0, 5.0, 4.0, 7.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.458547592163086, -13.98674201965332, -13.514936447143555, -13.043129920959473, -12.571324348449707, -12.099518775939941, -11.62771224975586, -11.155906677246094, -10.684101104736328, -10.212295532226562, -9.740489959716797, -9.268683433532715, -8.79687786102295, -8.325072288513184, -7.85326623916626, -7.381460189819336, -6.90965461730957, -6.437849044799805, -5.966042995452881, -5.494236946105957, -5.022431373596191, -4.550625801086426, -4.078819751739502, -3.6070139408111572, -3.1352081298828125, -2.6634023189544678, -2.191596508026123, -1.7197906970977783, -1.2479848861694336, -0.7761790752410889, -0.30437326431274414, 0.16743254661560059, 0.6392393112182617, 1.1110451221466064, 1.5828509330749512, 2.054656744003296, 2.5264625549316406, 2.9982683658599854, 3.47007417678833, 3.941879987716675, 4.4136857986450195, 4.885491371154785, 5.357297420501709, 5.829103469848633, 6.300909042358398, 6.772714614868164, 7.244520664215088, 7.716326713562012, 8.188132286071777, 8.659937858581543, 9.131744384765625, 9.60354995727539, 10.075355529785156, 10.547161102294922, 11.018966674804688, 11.49077320098877, 11.962578773498535, 12.4343843460083, 12.906190872192383, 13.377996444702148, 13.849802017211914, 14.32160758972168, 14.793413162231445, 15.265219688415527, 15.737025260925293]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 2.0, 4.0, 11.0, 16.0, 20.0, 39.0, 57.0, 88.0, 140.0, 228.0, 310.0, 496.0, 789.0, 1248.0, 2121.0, 3385.0, 5542.0, 9091.0, 15171.0, 25820.0, 44833.0, 77748.0, 137315.0, 234872.0, 382726.0, 557524.0, 677968.0, 659385.0, 518410.0, 345413.0, 209379.0, 120248.0, 68883.0, 39388.0, 22705.0, 13197.0, 7818.0, 4640.0, 2802.0, 1664.0, 1058.0, 652.0, 397.0, 261.0, 145.0, 107.0, 75.0, 38.0, 21.0, 20.0, 10.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.85986328125, -15.3291015625, -14.79833984375, -14.267578125, -13.73681640625, -13.2060546875, -12.67529296875, -12.14453125, -11.61376953125, -11.0830078125, -10.55224609375, -10.021484375, -9.49072265625, -8.9599609375, -8.42919921875, -7.8984375, -7.36767578125, -6.8369140625, -6.30615234375, -5.775390625, -5.24462890625, -4.7138671875, -4.18310546875, -3.65234375, -3.12158203125, -2.5908203125, -2.06005859375, -1.529296875, -0.99853515625, -0.4677734375, 0.06298828125, 0.59375, 1.12451171875, 1.6552734375, 2.18603515625, 2.716796875, 3.24755859375, 3.7783203125, 4.30908203125, 4.83984375, 5.37060546875, 5.9013671875, 6.43212890625, 6.962890625, 7.49365234375, 8.0244140625, 8.55517578125, 9.0859375, 9.61669921875, 10.1474609375, 10.67822265625, 11.208984375, 11.73974609375, 12.2705078125, 12.80126953125, 13.33203125, 13.86279296875, 14.3935546875, 14.92431640625, 15.455078125, 15.98583984375, 16.5166015625, 17.04736328125, 17.578125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [5.0, 4.0, 3.0, 5.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 10.0, 4.0, 10.0, 16.0, 7.0, 8.0, 21.0, 23.0, 25.0, 35.0, 29.0, 27.0, 26.0, 25.0, 29.0, 44.0, 35.0, 30.0, 29.0, 36.0, 41.0, 27.0, 38.0, 33.0, 46.0, 29.0, 26.0, 30.0, 38.0, 29.0, 23.0, 17.0, 17.0, 16.0, 19.0, 15.0, 11.0, 5.0, 8.0, 6.0, 4.0, 6.0, 8.0, 3.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-12.09375, -11.690185546875, -11.28662109375, -10.883056640625, -10.4794921875, -10.075927734375, -9.67236328125, -9.268798828125, -8.865234375, -8.461669921875, -8.05810546875, -7.654541015625, -7.2509765625, -6.847412109375, -6.44384765625, -6.040283203125, -5.63671875, -5.233154296875, -4.82958984375, -4.426025390625, -4.0224609375, -3.618896484375, -3.21533203125, -2.811767578125, -2.408203125, -2.004638671875, -1.60107421875, -1.197509765625, -0.7939453125, -0.390380859375, 0.01318359375, 0.416748046875, 0.8203125, 1.223876953125, 1.62744140625, 2.031005859375, 2.4345703125, 2.838134765625, 3.24169921875, 3.645263671875, 4.048828125, 4.452392578125, 4.85595703125, 5.259521484375, 5.6630859375, 6.066650390625, 6.47021484375, 6.873779296875, 7.27734375, 7.680908203125, 8.08447265625, 8.488037109375, 8.8916015625, 9.295166015625, 9.69873046875, 10.102294921875, 10.505859375, 10.909423828125, 11.31298828125, 11.716552734375, 12.1201171875, 12.523681640625, 12.92724609375, 13.330810546875, 13.734375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 10.0, 11.0, 21.0, 31.0, 60.0, 107.0, 151.0, 221.0, 383.0, 634.0, 1005.0, 1647.0, 2754.0, 4331.0, 7362.0, 12546.0, 20359.0, 33762.0, 56243.0, 92689.0, 149945.0, 235292.0, 350121.0, 475838.0, 569847.0, 583676.0, 506067.0, 385036.0, 264482.0, 170672.0, 106874.0, 64664.0, 38487.0, 23201.0, 14082.0, 8570.0, 5006.0, 3216.0, 1902.0, 1173.0, 709.0, 440.0, 244.0, 164.0, 114.0, 61.0, 29.0, 19.0, 10.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-17.65625, -17.1390380859375, -16.621826171875, -16.1046142578125, -15.58740234375, -15.0701904296875, -14.552978515625, -14.0357666015625, -13.5185546875, -13.0013427734375, -12.484130859375, -11.9669189453125, -11.44970703125, -10.9324951171875, -10.415283203125, -9.8980712890625, -9.380859375, -8.8636474609375, -8.346435546875, -7.8292236328125, -7.31201171875, -6.7947998046875, -6.277587890625, -5.7603759765625, -5.2431640625, -4.7259521484375, -4.208740234375, -3.6915283203125, -3.17431640625, -2.6571044921875, -2.139892578125, -1.6226806640625, -1.10546875, -0.5882568359375, -0.071044921875, 0.4461669921875, 0.96337890625, 1.4805908203125, 1.997802734375, 2.5150146484375, 3.0322265625, 3.5494384765625, 4.066650390625, 4.5838623046875, 5.10107421875, 5.6182861328125, 6.135498046875, 6.6527099609375, 7.169921875, 7.6871337890625, 8.204345703125, 8.7215576171875, 9.23876953125, 9.7559814453125, 10.273193359375, 10.7904052734375, 11.3076171875, 11.8248291015625, 12.342041015625, 12.8592529296875, 13.37646484375, 13.8936767578125, 14.410888671875, 14.9281005859375, 15.4453125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 2.0, 11.0, 10.0, 12.0, 20.0, 23.0, 33.0, 41.0, 44.0, 56.0, 69.0, 87.0, 103.0, 124.0, 123.0, 141.0, 164.0, 159.0, 186.0, 180.0, 191.0, 202.0, 219.0, 192.0, 212.0, 195.0, 164.0, 167.0, 142.0, 139.0, 116.0, 109.0, 83.0, 53.0, 65.0, 55.0, 40.0, 34.0, 25.0, 21.0, 19.0, 12.0, 10.0, 9.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.86328125, -5.6546630859375, -5.446044921875, -5.2374267578125, -5.02880859375, -4.8201904296875, -4.611572265625, -4.4029541015625, -4.1943359375, -3.9857177734375, -3.777099609375, -3.5684814453125, -3.35986328125, -3.1512451171875, -2.942626953125, -2.7340087890625, -2.525390625, -2.3167724609375, -2.108154296875, -1.8995361328125, -1.69091796875, -1.4822998046875, -1.273681640625, -1.0650634765625, -0.8564453125, -0.6478271484375, -0.439208984375, -0.2305908203125, -0.02197265625, 0.1866455078125, 0.395263671875, 0.6038818359375, 0.8125, 1.0211181640625, 1.229736328125, 1.4383544921875, 1.64697265625, 1.8555908203125, 2.064208984375, 2.2728271484375, 2.4814453125, 2.6900634765625, 2.898681640625, 3.1072998046875, 3.31591796875, 3.5245361328125, 3.733154296875, 3.9417724609375, 4.150390625, 4.3590087890625, 4.567626953125, 4.7762451171875, 4.98486328125, 5.1934814453125, 5.402099609375, 5.6107177734375, 5.8193359375, 6.0279541015625, 6.236572265625, 6.4451904296875, 6.65380859375, 6.8624267578125, 7.071044921875, 7.2796630859375, 7.48828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 9.0, 10.0, 10.0, 12.0, 13.0, 19.0, 17.0, 24.0, 16.0, 24.0, 38.0, 37.0, 37.0, 42.0, 42.0, 45.0, 39.0, 48.0, 56.0, 45.0, 40.0, 54.0, 52.0, 39.0, 38.0, 26.0, 21.0, 28.0, 21.0, 17.0, 9.0, 12.0, 15.0, 10.0, 6.0, 9.0, 5.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.023977279663086, -18.460514068603516, -17.897050857543945, -17.333587646484375, -16.770122528076172, -16.2066593170166, -15.643196105957031, -15.079732894897461, -14.51626968383789, -13.95280647277832, -13.38934326171875, -12.825879096984863, -12.262415885925293, -11.698952674865723, -11.135488510131836, -10.572025299072266, -10.008562088012695, -9.445098876953125, -8.881635665893555, -8.318171501159668, -7.754708290100098, -7.191245079040527, -6.627781391143799, -6.06431770324707, -5.5008544921875, -4.93739128112793, -4.373927593231201, -3.8104641437530518, -3.2470006942749023, -2.683537244796753, -2.1200737953186035, -1.556610345840454, -0.9931449890136719, -0.42968153953552246, 0.13378190994262695, 0.6972453594207764, 1.2607088088989258, 1.8241722583770752, 2.3876357078552246, 2.951099157333374, 3.5145626068115234, 4.078025817871094, 4.641489505767822, 5.204953193664551, 5.768416404724121, 6.331879615783691, 6.89534330368042, 7.458806991577148, 8.022270202636719, 8.585733413696289, 9.14919662475586, 9.712660789489746, 10.276124000549316, 10.839587211608887, 11.403051376342773, 11.966514587402344, 12.529977798461914, 13.093441009521484, 13.656904220581055, 14.220368385314941, 14.783831596374512, 15.347294807434082, 15.910758972167969, 16.47422218322754, 17.03768539428711]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 3.0, 0.0, 6.0, 5.0, 4.0, 18.0, 13.0, 14.0, 16.0, 19.0, 17.0, 17.0, 27.0, 28.0, 34.0, 29.0, 39.0, 31.0, 44.0, 36.0, 43.0, 29.0, 30.0, 37.0, 48.0, 28.0, 52.0, 49.0, 31.0, 27.0, 31.0, 21.0, 29.0, 30.0, 19.0, 20.0, 15.0, 17.0, 12.0, 10.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.063995361328125, -15.55224609375, -15.040496826171875, -14.52874755859375, -14.016997337341309, -13.505248069763184, -12.993498802185059, -12.481749534606934, -11.969999313354492, -11.458250045776367, -10.946500778198242, -10.434751510620117, -9.923001289367676, -9.41125202178955, -8.899502754211426, -8.3877534866333, -7.876004219055176, -7.364254951477051, -6.852505207061768, -6.340755939483643, -5.829006195068359, -5.317256927490234, -4.805507659912109, -4.293758392333984, -3.782008647918701, -3.270259141921997, -2.758509635925293, -2.246760368347168, -1.7350108623504639, -1.2232613563537598, -0.7115120887756348, -0.19976258277893066, 0.31198692321777344, 0.8237363696098328, 1.335485816001892, 1.8472352027893066, 2.3589847087860107, 2.870734214782715, 3.38248348236084, 3.894232988357544, 4.405982494354248, 4.917731761932373, 5.429481506347656, 5.941230773925781, 6.452980041503906, 6.9647297859191895, 7.4764790534973145, 7.988228797912598, 8.499978065490723, 9.011727333068848, 9.523476600646973, 10.035226821899414, 10.546976089477539, 11.058725357055664, 11.570474624633789, 12.082223892211914, 12.593973159790039, 13.105722427368164, 13.617471694946289, 14.129220962524414, 14.640971183776855, 15.15272045135498, 15.664469718933105, 16.176219940185547, 16.687969207763672]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 9.0, 11.0, 17.0, 23.0, 41.0, 59.0, 96.0, 153.0, 222.0, 389.0, 550.0, 777.0, 1295.0, 1889.0, 2921.0, 4461.0, 6301.0, 9243.0, 13621.0, 19382.0, 27045.0, 37338.0, 49335.0, 63444.0, 77593.0, 90373.0, 97928.0, 99175.0, 93690.0, 82764.0, 69304.0, 55081.0, 41819.0, 30902.0, 22062.0, 15432.0, 11044.0, 7479.0, 5049.0, 3511.0, 2325.0, 1546.0, 996.0, 621.0, 429.0, 280.0, 170.0, 125.0, 93.0, 57.0, 34.0, 16.0, 17.0, 12.0, 9.0, 9.0, 1.0, 0.0, 3.0], "bins": [-4.6640625, -4.51922607421875, -4.3743896484375, -4.22955322265625, -4.084716796875, -3.93988037109375, -3.7950439453125, -3.65020751953125, -3.50537109375, -3.36053466796875, -3.2156982421875, -3.07086181640625, -2.926025390625, -2.78118896484375, -2.6363525390625, -2.49151611328125, -2.3466796875, -2.20184326171875, -2.0570068359375, -1.91217041015625, -1.767333984375, -1.62249755859375, -1.4776611328125, -1.33282470703125, -1.18798828125, -1.04315185546875, -0.8983154296875, -0.75347900390625, -0.608642578125, -0.46380615234375, -0.3189697265625, -0.17413330078125, -0.029296875, 0.11553955078125, 0.2603759765625, 0.40521240234375, 0.550048828125, 0.69488525390625, 0.8397216796875, 0.98455810546875, 1.12939453125, 1.27423095703125, 1.4190673828125, 1.56390380859375, 1.708740234375, 1.85357666015625, 1.9984130859375, 2.14324951171875, 2.2880859375, 2.43292236328125, 2.5777587890625, 2.72259521484375, 2.867431640625, 3.01226806640625, 3.1571044921875, 3.30194091796875, 3.44677734375, 3.59161376953125, 3.7364501953125, 3.88128662109375, 4.026123046875, 4.17095947265625, 4.3157958984375, 4.46063232421875, 4.60546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 0.0, 6.0, 5.0, 5.0, 17.0, 14.0, 11.0, 18.0, 20.0, 16.0, 20.0, 21.0, 32.0, 33.0, 32.0, 34.0, 33.0, 44.0, 38.0, 40.0, 31.0, 30.0, 37.0, 47.0, 30.0, 49.0, 44.0, 32.0, 32.0, 31.0, 21.0, 31.0, 29.0, 17.0, 21.0, 13.0, 20.0, 12.0, 8.0, 6.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.171875, -15.656982421875, -15.14208984375, -14.627197265625, -14.1123046875, -13.597412109375, -13.08251953125, -12.567626953125, -12.052734375, -11.537841796875, -11.02294921875, -10.508056640625, -9.9931640625, -9.478271484375, -8.96337890625, -8.448486328125, -7.93359375, -7.418701171875, -6.90380859375, -6.388916015625, -5.8740234375, -5.359130859375, -4.84423828125, -4.329345703125, -3.814453125, -3.299560546875, -2.78466796875, -2.269775390625, -1.7548828125, -1.239990234375, -0.72509765625, -0.210205078125, 0.3046875, 0.819580078125, 1.33447265625, 1.849365234375, 2.3642578125, 2.879150390625, 3.39404296875, 3.908935546875, 4.423828125, 4.938720703125, 5.45361328125, 5.968505859375, 6.4833984375, 6.998291015625, 7.51318359375, 8.028076171875, 8.54296875, 9.057861328125, 9.57275390625, 10.087646484375, 10.6025390625, 11.117431640625, 11.63232421875, 12.147216796875, 12.662109375, 13.177001953125, 13.69189453125, 14.206787109375, 14.7216796875, 15.236572265625, 15.75146484375, 16.266357421875, 16.78125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 8.0, 17.0, 28.0, 37.0, 66.0, 85.0, 155.0, 284.0, 518.0, 968.0, 1943.0, 4035.0, 7929.0, 16254.0, 35686.0, 750460.0, 175384.0, 28261.0, 13204.0, 6515.0, 3228.0, 1572.0, 809.0, 470.0, 243.0, 149.0, 81.0, 53.0, 32.0, 18.0, 20.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-23.671875, -22.951416015625, -22.23095703125, -21.510498046875, -20.7900390625, -20.069580078125, -19.34912109375, -18.628662109375, -17.908203125, -17.187744140625, -16.46728515625, -15.746826171875, -15.0263671875, -14.305908203125, -13.58544921875, -12.864990234375, -12.14453125, -11.424072265625, -10.70361328125, -9.983154296875, -9.2626953125, -8.542236328125, -7.82177734375, -7.101318359375, -6.380859375, -5.660400390625, -4.93994140625, -4.219482421875, -3.4990234375, -2.778564453125, -2.05810546875, -1.337646484375, -0.6171875, 0.103271484375, 0.82373046875, 1.544189453125, 2.2646484375, 2.985107421875, 3.70556640625, 4.426025390625, 5.146484375, 5.866943359375, 6.58740234375, 7.307861328125, 8.0283203125, 8.748779296875, 9.46923828125, 10.189697265625, 10.91015625, 11.630615234375, 12.35107421875, 13.071533203125, 13.7919921875, 14.512451171875, 15.23291015625, 15.953369140625, 16.673828125, 17.394287109375, 18.11474609375, 18.835205078125, 19.5556640625, 20.276123046875, 20.99658203125, 21.717041015625, 22.4375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 7.0, 9.0, 5.0, 10.0, 8.0, 18.0, 14.0, 17.0, 19.0, 11.0, 24.0, 24.0, 28.0, 28.0, 38.0, 24.0, 34.0, 34.0, 42.0, 40.0, 43.0, 36.0, 40.0, 29.0, 37.0, 35.0, 39.0, 33.0, 34.0, 34.0, 17.0, 18.0, 31.0, 17.0, 22.0, 15.0, 15.0, 19.0, 13.0, 12.0, 7.0, 9.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.78125, -10.4539794921875, -10.126708984375, -9.7994384765625, -9.47216796875, -9.1448974609375, -8.817626953125, -8.4903564453125, -8.1630859375, -7.8358154296875, -7.508544921875, -7.1812744140625, -6.85400390625, -6.5267333984375, -6.199462890625, -5.8721923828125, -5.544921875, -5.2176513671875, -4.890380859375, -4.5631103515625, -4.23583984375, -3.9085693359375, -3.581298828125, -3.2540283203125, -2.9267578125, -2.5994873046875, -2.272216796875, -1.9449462890625, -1.61767578125, -1.2904052734375, -0.963134765625, -0.6358642578125, -0.30859375, 0.0186767578125, 0.345947265625, 0.6732177734375, 1.00048828125, 1.3277587890625, 1.655029296875, 1.9822998046875, 2.3095703125, 2.6368408203125, 2.964111328125, 3.2913818359375, 3.61865234375, 3.9459228515625, 4.273193359375, 4.6004638671875, 4.927734375, 5.2550048828125, 5.582275390625, 5.9095458984375, 6.23681640625, 6.5640869140625, 6.891357421875, 7.2186279296875, 7.5458984375, 7.8731689453125, 8.200439453125, 8.5277099609375, 8.85498046875, 9.1822509765625, 9.509521484375, 9.8367919921875, 10.1640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 4.0, 3.0, 8.0, 11.0, 15.0, 18.0, 23.0, 38.0, 53.0, 70.0, 115.0, 143.0, 188.0, 276.0, 407.0, 655.0, 962.0, 1571.0, 2488.0, 4240.0, 7146.0, 12855.0, 25106.0, 92749.0, 804474.0, 47792.0, 20306.0, 10771.0, 6077.0, 3668.0, 2277.0, 1375.0, 867.0, 538.0, 372.0, 262.0, 173.0, 127.0, 96.0, 52.0, 48.0, 33.0, 25.0, 20.0, 11.0, 10.0, 10.0, 8.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.97802734375, -0.9468307495117188, -0.9156341552734375, -0.8844375610351562, -0.853240966796875, -0.8220443725585938, -0.7908477783203125, -0.7596511840820312, -0.72845458984375, -0.6972579956054688, -0.6660614013671875, -0.6348648071289062, -0.603668212890625, -0.5724716186523438, -0.5412750244140625, -0.5100784301757812, -0.4788818359375, -0.44768524169921875, -0.4164886474609375, -0.38529205322265625, -0.354095458984375, -0.32289886474609375, -0.2917022705078125, -0.26050567626953125, -0.22930908203125, -0.19811248779296875, -0.1669158935546875, -0.13571929931640625, -0.104522705078125, -0.07332611083984375, -0.0421295166015625, -0.01093292236328125, 0.020263671875, 0.05146026611328125, 0.0826568603515625, 0.11385345458984375, 0.145050048828125, 0.17624664306640625, 0.2074432373046875, 0.23863983154296875, 0.26983642578125, 0.30103302001953125, 0.3322296142578125, 0.36342620849609375, 0.394622802734375, 0.42581939697265625, 0.4570159912109375, 0.48821258544921875, 0.5194091796875, 0.5506057739257812, 0.5818023681640625, 0.6129989624023438, 0.644195556640625, 0.6753921508789062, 0.7065887451171875, 0.7377853393554688, 0.76898193359375, 0.8001785278320312, 0.8313751220703125, 0.8625717163085938, 0.893768310546875, 0.9249649047851562, 0.9561614990234375, 0.9873580932617188, 1.0185546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 7.0, 7.0, 4.0, 9.0, 10.0, 19.0, 26.0, 35.0, 33.0, 56.0, 60.0, 102.0, 101.0, 84.0, 94.0, 72.0, 58.0, 57.0, 40.0, 34.0, 23.0, 22.0, 13.0, 10.0, 5.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021910667419433594, -0.00021193921566009521, -0.0002047717571258545, -0.00019760429859161377, -0.00019043684005737305, -0.00018326938152313232, -0.0001761019229888916, -0.00016893446445465088, -0.00016176700592041016, -0.00015459954738616943, -0.0001474320888519287, -0.000140264630317688, -0.00013309717178344727, -0.00012592971324920654, -0.00011876225471496582, -0.0001115947961807251, -0.00010442733764648438, -9.725987911224365e-05, -9.009242057800293e-05, -8.292496204376221e-05, -7.575750350952148e-05, -6.859004497528076e-05, -6.142258644104004e-05, -5.4255127906799316e-05, -4.7087669372558594e-05, -3.992021083831787e-05, -3.275275230407715e-05, -2.5585293769836426e-05, -1.8417835235595703e-05, -1.125037670135498e-05, -4.082918167114258e-06, 3.084540367126465e-06, 1.0251998901367188e-05, 1.741945743560791e-05, 2.4586915969848633e-05, 3.1754374504089355e-05, 3.892183303833008e-05, 4.60892915725708e-05, 5.3256750106811523e-05, 6.0424208641052246e-05, 6.759166717529297e-05, 7.475912570953369e-05, 8.192658424377441e-05, 8.909404277801514e-05, 9.626150131225586e-05, 0.00010342895984649658, 0.0001105964183807373, 0.00011776387691497803, 0.00012493133544921875, 0.00013209879398345947, 0.0001392662525177002, 0.00014643371105194092, 0.00015360116958618164, 0.00016076862812042236, 0.00016793608665466309, 0.0001751035451889038, 0.00018227100372314453, 0.00018943846225738525, 0.00019660592079162598, 0.0002037733793258667, 0.00021094083786010742, 0.00021810829639434814, 0.00022527575492858887, 0.0002324432134628296, 0.0002396106719970703]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 4.0, 10.0, 10.0, 13.0, 31.0, 33.0, 34.0, 48.0, 77.0, 102.0, 144.0, 181.0, 290.0, 382.0, 559.0, 810.0, 1402.0, 2237.0, 3910.0, 6982.0, 13569.0, 25767.0, 48526.0, 86517.0, 136475.0, 179999.0, 183399.0, 145286.0, 94333.0, 54310.0, 29001.0, 15143.0, 7851.0, 4389.0, 2332.0, 1429.0, 938.0, 600.0, 436.0, 284.0, 171.0, 157.0, 107.0, 76.0, 56.0, 41.0, 21.0, 29.0, 16.0, 11.0, 9.0, 8.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.81787109375, -0.7923812866210938, -0.7668914794921875, -0.7414016723632812, -0.715911865234375, -0.6904220581054688, -0.6649322509765625, -0.6394424438476562, -0.61395263671875, -0.5884628295898438, -0.5629730224609375, -0.5374832153320312, -0.511993408203125, -0.48650360107421875, -0.4610137939453125, -0.43552398681640625, -0.4100341796875, -0.38454437255859375, -0.3590545654296875, -0.33356475830078125, -0.308074951171875, -0.28258514404296875, -0.2570953369140625, -0.23160552978515625, -0.20611572265625, -0.18062591552734375, -0.1551361083984375, -0.12964630126953125, -0.104156494140625, -0.07866668701171875, -0.0531768798828125, -0.02768707275390625, -0.002197265625, 0.02329254150390625, 0.0487823486328125, 0.07427215576171875, 0.099761962890625, 0.12525177001953125, 0.1507415771484375, 0.17623138427734375, 0.20172119140625, 0.22721099853515625, 0.2527008056640625, 0.27819061279296875, 0.303680419921875, 0.32917022705078125, 0.3546600341796875, 0.38014984130859375, 0.4056396484375, 0.43112945556640625, 0.4566192626953125, 0.48210906982421875, 0.507598876953125, 0.5330886840820312, 0.5585784912109375, 0.5840682983398438, 0.60955810546875, 0.6350479125976562, 0.6605377197265625, 0.6860275268554688, 0.711517333984375, 0.7370071411132812, 0.7624969482421875, 0.7879867553710938, 0.8134765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 7.0, 7.0, 9.0, 7.0, 17.0, 11.0, 23.0, 21.0, 32.0, 38.0, 46.0, 42.0, 51.0, 52.0, 65.0, 47.0, 51.0, 52.0, 53.0, 35.0, 51.0, 39.0, 41.0, 35.0, 36.0, 27.0, 24.0, 18.0, 19.0, 12.0, 12.0, 8.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.29443359375, -0.2855873107910156, -0.27674102783203125, -0.2678947448730469, -0.2590484619140625, -0.2502021789550781, -0.24135589599609375, -0.23250961303710938, -0.223663330078125, -0.21481704711914062, -0.20597076416015625, -0.19712448120117188, -0.1882781982421875, -0.17943191528320312, -0.17058563232421875, -0.16173934936523438, -0.15289306640625, -0.14404678344726562, -0.13520050048828125, -0.12635421752929688, -0.1175079345703125, -0.10866165161132812, -0.09981536865234375, -0.09096908569335938, -0.082122802734375, -0.07327651977539062, -0.06443023681640625, -0.055583953857421875, -0.0467376708984375, -0.037891387939453125, -0.02904510498046875, -0.020198822021484375, -0.0113525390625, -0.002506256103515625, 0.00634002685546875, 0.015186309814453125, 0.0240325927734375, 0.032878875732421875, 0.04172515869140625, 0.050571441650390625, 0.059417724609375, 0.06826400756835938, 0.07711029052734375, 0.08595657348632812, 0.0948028564453125, 0.10364913940429688, 0.11249542236328125, 0.12134170532226562, 0.13018798828125, 0.13903427124023438, 0.14788055419921875, 0.15672683715820312, 0.1655731201171875, 0.17441940307617188, 0.18326568603515625, 0.19211196899414062, 0.200958251953125, 0.20980453491210938, 0.21865081787109375, 0.22749710083007812, 0.2363433837890625, 0.24518966674804688, 0.25403594970703125, 0.2628822326660156, 0.271728515625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 6.0, 3.0, 8.0, 14.0, 13.0, 13.0, 10.0, 27.0, 20.0, 18.0, 27.0, 30.0, 32.0, 47.0, 51.0, 38.0, 55.0, 35.0, 50.0, 45.0, 60.0, 58.0, 44.0, 55.0, 36.0, 32.0, 24.0, 28.0, 23.0, 23.0, 9.0, 13.0, 11.0, 14.0, 7.0, 6.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.3533992767334, -20.755352020263672, -20.157302856445312, -19.559255599975586, -18.96120834350586, -18.3631591796875, -17.765111923217773, -17.167064666748047, -16.569015502929688, -15.970967292785645, -15.372920036315918, -14.774871826171875, -14.176823616027832, -13.578775405883789, -12.980728149414062, -12.38267993927002, -11.784632682800293, -11.18658447265625, -10.588537216186523, -9.99048900604248, -9.392440795898438, -8.794393539428711, -8.196345329284668, -7.598297119140625, -7.00024938583374, -6.4022016525268555, -5.8041534423828125, -5.206105709075928, -4.608057975769043, -4.010009765625, -3.4119620323181152, -2.8139138221740723, -2.2158660888671875, -1.6178181171417236, -1.0197702646255493, -0.421722412109375, 0.17632555961608887, 0.7743735313415527, 1.3724212646484375, 1.9704694747924805, 2.5685172080993652, 3.166565179824829, 3.764613151550293, 4.362660884857178, 4.9607086181640625, 5.5587568283081055, 6.15680456161499, 6.754852771759033, 7.352900505065918, 7.950948238372803, 8.548995971679688, 9.14704418182373, 9.745092391967773, 10.3431396484375, 10.941187858581543, 11.539236068725586, 12.137283325195312, 12.735331535339355, 13.333378791809082, 13.931427001953125, 14.529475212097168, 15.127523422241211, 15.725570678710938, 16.323619842529297, 16.921667098999023]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 7.0, 2.0, 1.0, 6.0, 4.0, 6.0, 18.0, 14.0, 8.0, 20.0, 21.0, 14.0, 15.0, 24.0, 34.0, 33.0, 28.0, 35.0, 34.0, 44.0, 36.0, 37.0, 39.0, 28.0, 37.0, 46.0, 31.0, 44.0, 47.0, 33.0, 33.0, 31.0, 20.0, 28.0, 30.0, 22.0, 19.0, 10.0, 23.0, 13.0, 9.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.204660415649414, -15.690380096435547, -15.17609977722168, -14.661819458007812, -14.147539138793945, -13.633258819580078, -13.118978500366211, -12.604698181152344, -12.090417861938477, -11.57613754272461, -11.061857223510742, -10.547576904296875, -10.033296585083008, -9.51901626586914, -9.004735946655273, -8.490455627441406, -7.976175308227539, -7.461894989013672, -6.947614669799805, -6.4333343505859375, -5.91905403137207, -5.404773712158203, -4.890493392944336, -4.376213073730469, -3.8619327545166016, -3.3476524353027344, -2.833372116088867, -2.319091796875, -1.8048114776611328, -1.2905311584472656, -0.7762508392333984, -0.26197052001953125, 0.25230979919433594, 0.7665901184082031, 1.2808704376220703, 1.7951507568359375, 2.3094310760498047, 2.823711395263672, 3.337991714477539, 3.8522720336914062, 4.366552352905273, 4.880832672119141, 5.395112991333008, 5.909393310546875, 6.423673629760742, 6.937953948974609, 7.452234268188477, 7.966514587402344, 8.480794906616211, 8.995075225830078, 9.509355545043945, 10.023635864257812, 10.53791618347168, 11.052196502685547, 11.566476821899414, 12.080757141113281, 12.595037460327148, 13.109317779541016, 13.623598098754883, 14.13787841796875, 14.652158737182617, 15.166439056396484, 15.680719375610352, 16.19499969482422, 16.709280014038086]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 11.0, 9.0, 22.0, 33.0, 53.0, 81.0, 117.0, 215.0, 383.0, 537.0, 950.0, 1502.0, 2551.0, 4239.0, 6698.0, 11146.0, 17785.0, 27206.0, 40594.0, 58267.0, 78402.0, 98621.0, 113396.0, 119100.0, 113651.0, 99319.0, 78884.0, 58459.0, 41349.0, 27661.0, 18069.0, 11292.0, 7009.0, 4202.0, 2679.0, 1595.0, 956.0, 564.0, 351.0, 224.0, 152.0, 89.0, 38.0, 31.0, 23.0, 10.0, 7.0, 9.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-15.5234375, -15.060302734375, -14.59716796875, -14.134033203125, -13.6708984375, -13.207763671875, -12.74462890625, -12.281494140625, -11.818359375, -11.355224609375, -10.89208984375, -10.428955078125, -9.9658203125, -9.502685546875, -9.03955078125, -8.576416015625, -8.11328125, -7.650146484375, -7.18701171875, -6.723876953125, -6.2607421875, -5.797607421875, -5.33447265625, -4.871337890625, -4.408203125, -3.945068359375, -3.48193359375, -3.018798828125, -2.5556640625, -2.092529296875, -1.62939453125, -1.166259765625, -0.703125, -0.239990234375, 0.22314453125, 0.686279296875, 1.1494140625, 1.612548828125, 2.07568359375, 2.538818359375, 3.001953125, 3.465087890625, 3.92822265625, 4.391357421875, 4.8544921875, 5.317626953125, 5.78076171875, 6.243896484375, 6.70703125, 7.170166015625, 7.63330078125, 8.096435546875, 8.5595703125, 9.022705078125, 9.48583984375, 9.948974609375, 10.412109375, 10.875244140625, 11.33837890625, 11.801513671875, 12.2646484375, 12.727783203125, 13.19091796875, 13.654052734375, 14.1171875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 0.0, 7.0, 4.0, 5.0, 20.0, 13.0, 6.0, 24.0, 19.0, 16.0, 14.0, 27.0, 30.0, 32.0, 31.0, 29.0, 39.0, 45.0, 37.0, 35.0, 39.0, 28.0, 36.0, 44.0, 32.0, 45.0, 47.0, 36.0, 29.0, 31.0, 17.0, 28.0, 34.0, 20.0, 20.0, 12.0, 17.0, 15.0, 10.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.421875, -14.93212890625, -14.4423828125, -13.95263671875, -13.462890625, -12.97314453125, -12.4833984375, -11.99365234375, -11.50390625, -11.01416015625, -10.5244140625, -10.03466796875, -9.544921875, -9.05517578125, -8.5654296875, -8.07568359375, -7.5859375, -7.09619140625, -6.6064453125, -6.11669921875, -5.626953125, -5.13720703125, -4.6474609375, -4.15771484375, -3.66796875, -3.17822265625, -2.6884765625, -2.19873046875, -1.708984375, -1.21923828125, -0.7294921875, -0.23974609375, 0.25, 0.73974609375, 1.2294921875, 1.71923828125, 2.208984375, 2.69873046875, 3.1884765625, 3.67822265625, 4.16796875, 4.65771484375, 5.1474609375, 5.63720703125, 6.126953125, 6.61669921875, 7.1064453125, 7.59619140625, 8.0859375, 8.57568359375, 9.0654296875, 9.55517578125, 10.044921875, 10.53466796875, 11.0244140625, 11.51416015625, 12.00390625, 12.49365234375, 12.9833984375, 13.47314453125, 13.962890625, 14.45263671875, 14.9423828125, 15.43212890625, 15.921875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 6.0, 10.0, 17.0, 18.0, 22.0, 49.0, 91.0, 122.0, 223.0, 316.0, 483.0, 763.0, 1211.0, 1841.0, 3014.0, 4571.0, 6878.0, 10774.0, 16021.0, 23547.0, 33993.0, 47444.0, 62228.0, 78737.0, 92586.0, 102971.0, 105551.0, 100995.0, 88504.0, 73181.0, 57056.0, 42618.0, 30872.0, 21105.0, 14290.0, 9276.0, 6110.0, 4039.0, 2498.0, 1657.0, 1057.0, 643.0, 404.0, 288.0, 190.0, 94.0, 70.0, 58.0, 26.0, 26.0, 11.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.296875, -11.8916015625, -11.486328125, -11.0810546875, -10.67578125, -10.2705078125, -9.865234375, -9.4599609375, -9.0546875, -8.6494140625, -8.244140625, -7.8388671875, -7.43359375, -7.0283203125, -6.623046875, -6.2177734375, -5.8125, -5.4072265625, -5.001953125, -4.5966796875, -4.19140625, -3.7861328125, -3.380859375, -2.9755859375, -2.5703125, -2.1650390625, -1.759765625, -1.3544921875, -0.94921875, -0.5439453125, -0.138671875, 0.2666015625, 0.671875, 1.0771484375, 1.482421875, 1.8876953125, 2.29296875, 2.6982421875, 3.103515625, 3.5087890625, 3.9140625, 4.3193359375, 4.724609375, 5.1298828125, 5.53515625, 5.9404296875, 6.345703125, 6.7509765625, 7.15625, 7.5615234375, 7.966796875, 8.3720703125, 8.77734375, 9.1826171875, 9.587890625, 9.9931640625, 10.3984375, 10.8037109375, 11.208984375, 11.6142578125, 12.01953125, 12.4248046875, 12.830078125, 13.2353515625, 13.640625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 9.0, 6.0, 10.0, 14.0, 6.0, 8.0, 14.0, 12.0, 23.0, 23.0, 29.0, 27.0, 27.0, 24.0, 23.0, 28.0, 41.0, 39.0, 32.0, 35.0, 35.0, 51.0, 45.0, 36.0, 41.0, 47.0, 28.0, 37.0, 33.0, 33.0, 28.0, 22.0, 26.0, 22.0, 18.0, 13.0, 10.0, 11.0, 14.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3984375, -10.0777587890625, -9.757080078125, -9.4364013671875, -9.11572265625, -8.7950439453125, -8.474365234375, -8.1536865234375, -7.8330078125, -7.5123291015625, -7.191650390625, -6.8709716796875, -6.55029296875, -6.2296142578125, -5.908935546875, -5.5882568359375, -5.267578125, -4.9468994140625, -4.626220703125, -4.3055419921875, -3.98486328125, -3.6641845703125, -3.343505859375, -3.0228271484375, -2.7021484375, -2.3814697265625, -2.060791015625, -1.7401123046875, -1.41943359375, -1.0987548828125, -0.778076171875, -0.4573974609375, -0.13671875, 0.1839599609375, 0.504638671875, 0.8253173828125, 1.14599609375, 1.4666748046875, 1.787353515625, 2.1080322265625, 2.4287109375, 2.7493896484375, 3.070068359375, 3.3907470703125, 3.71142578125, 4.0321044921875, 4.352783203125, 4.6734619140625, 4.994140625, 5.3148193359375, 5.635498046875, 5.9561767578125, 6.27685546875, 6.5975341796875, 6.918212890625, 7.2388916015625, 7.5595703125, 7.8802490234375, 8.200927734375, 8.5216064453125, 8.84228515625, 9.1629638671875, 9.483642578125, 9.8043212890625, 10.125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 4.0, 9.0, 9.0, 12.0, 20.0, 36.0, 48.0, 78.0, 124.0, 198.0, 323.0, 547.0, 916.0, 1552.0, 2789.0, 5175.0, 10570.0, 21912.0, 46586.0, 94500.0, 165161.0, 218825.0, 202794.0, 135553.0, 72269.0, 34867.0, 16409.0, 7733.0, 4135.0, 2221.0, 1228.0, 801.0, 445.0, 252.0, 152.0, 112.0, 66.0, 40.0, 34.0, 18.0, 13.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.8203125, -9.52978515625, -9.2392578125, -8.94873046875, -8.658203125, -8.36767578125, -8.0771484375, -7.78662109375, -7.49609375, -7.20556640625, -6.9150390625, -6.62451171875, -6.333984375, -6.04345703125, -5.7529296875, -5.46240234375, -5.171875, -4.88134765625, -4.5908203125, -4.30029296875, -4.009765625, -3.71923828125, -3.4287109375, -3.13818359375, -2.84765625, -2.55712890625, -2.2666015625, -1.97607421875, -1.685546875, -1.39501953125, -1.1044921875, -0.81396484375, -0.5234375, -0.23291015625, 0.0576171875, 0.34814453125, 0.638671875, 0.92919921875, 1.2197265625, 1.51025390625, 1.80078125, 2.09130859375, 2.3818359375, 2.67236328125, 2.962890625, 3.25341796875, 3.5439453125, 3.83447265625, 4.125, 4.41552734375, 4.7060546875, 4.99658203125, 5.287109375, 5.57763671875, 5.8681640625, 6.15869140625, 6.44921875, 6.73974609375, 7.0302734375, 7.32080078125, 7.611328125, 7.90185546875, 8.1923828125, 8.48291015625, 8.7734375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 15.0, 12.0, 21.0, 30.0, 28.0, 58.0, 40.0, 53.0, 58.0, 79.0, 83.0, 93.0, 75.0, 69.0, 46.0, 48.0, 48.0, 28.0, 20.0, 26.0, 18.0, 12.0, 14.0, 4.0, 7.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011987686157226562, -0.0011665523052215576, -0.001134335994720459, -0.0011021196842193604, -0.0010699033737182617, -0.001037687063217163, -0.0010054707527160645, -0.0009732544422149658, -0.0009410381317138672, -0.0009088218212127686, -0.0008766055107116699, -0.0008443892002105713, -0.0008121728897094727, -0.000779956579208374, -0.0007477402687072754, -0.0007155239582061768, -0.0006833076477050781, -0.0006510913372039795, -0.0006188750267028809, -0.0005866587162017822, -0.0005544424057006836, -0.000522226095199585, -0.0004900097846984863, -0.0004577934741973877, -0.00042557716369628906, -0.00039336085319519043, -0.0003611445426940918, -0.00032892823219299316, -0.00029671192169189453, -0.0002644956111907959, -0.00023227930068969727, -0.00020006299018859863, -0.0001678466796875, -0.00013563036918640137, -0.00010341405868530273, -7.11977481842041e-05, -3.898143768310547e-05, -6.765127182006836e-06, 2.5451183319091797e-05, 5.766749382019043e-05, 8.988380432128906e-05, 0.0001221001148223877, 0.00015431642532348633, 0.00018653273582458496, 0.0002187490463256836, 0.0002509653568267822, 0.00028318166732788086, 0.0003153979778289795, 0.0003476142883300781, 0.00037983059883117676, 0.0004120469093322754, 0.000444263219833374, 0.00047647953033447266, 0.0005086958408355713, 0.0005409121513366699, 0.0005731284618377686, 0.0006053447723388672, 0.0006375610828399658, 0.0006697773933410645, 0.0007019937038421631, 0.0007342100143432617, 0.0007664263248443604, 0.000798642635345459, 0.0008308589458465576, 0.0008630752563476562]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 15.0, 11.0, 16.0, 30.0, 33.0, 52.0, 86.0, 119.0, 177.0, 232.0, 343.0, 513.0, 706.0, 1012.0, 1581.0, 2564.0, 4054.0, 6531.0, 10848.0, 18289.0, 32014.0, 55131.0, 90143.0, 133934.0, 166406.0, 166935.0, 132907.0, 90051.0, 55296.0, 31455.0, 18209.0, 10875.0, 6478.0, 3946.0, 2515.0, 1585.0, 1070.0, 742.0, 519.0, 360.0, 251.0, 163.0, 107.0, 86.0, 42.0, 53.0, 21.0, 16.0, 9.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0], "bins": [-7.76953125, -7.5340576171875, -7.298583984375, -7.0631103515625, -6.82763671875, -6.5921630859375, -6.356689453125, -6.1212158203125, -5.8857421875, -5.6502685546875, -5.414794921875, -5.1793212890625, -4.94384765625, -4.7083740234375, -4.472900390625, -4.2374267578125, -4.001953125, -3.7664794921875, -3.531005859375, -3.2955322265625, -3.06005859375, -2.8245849609375, -2.589111328125, -2.3536376953125, -2.1181640625, -1.8826904296875, -1.647216796875, -1.4117431640625, -1.17626953125, -0.9407958984375, -0.705322265625, -0.4698486328125, -0.234375, 0.0010986328125, 0.236572265625, 0.4720458984375, 0.70751953125, 0.9429931640625, 1.178466796875, 1.4139404296875, 1.6494140625, 1.8848876953125, 2.120361328125, 2.3558349609375, 2.59130859375, 2.8267822265625, 3.062255859375, 3.2977294921875, 3.533203125, 3.7686767578125, 4.004150390625, 4.2396240234375, 4.47509765625, 4.7105712890625, 4.946044921875, 5.1815185546875, 5.4169921875, 5.6524658203125, 5.887939453125, 6.1234130859375, 6.35888671875, 6.5943603515625, 6.829833984375, 7.0653076171875, 7.30078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 4.0, 6.0, 10.0, 12.0, 5.0, 10.0, 14.0, 12.0, 23.0, 23.0, 25.0, 48.0, 52.0, 54.0, 53.0, 49.0, 60.0, 48.0, 51.0, 64.0, 49.0, 53.0, 49.0, 38.0, 39.0, 26.0, 26.0, 21.0, 24.0, 10.0, 9.0, 10.0, 5.0, 7.0, 7.0, 1.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.435546875, -3.34283447265625, -3.2501220703125, -3.15740966796875, -3.064697265625, -2.97198486328125, -2.8792724609375, -2.78656005859375, -2.69384765625, -2.60113525390625, -2.5084228515625, -2.41571044921875, -2.322998046875, -2.23028564453125, -2.1375732421875, -2.04486083984375, -1.9521484375, -1.85943603515625, -1.7667236328125, -1.67401123046875, -1.581298828125, -1.48858642578125, -1.3958740234375, -1.30316162109375, -1.21044921875, -1.11773681640625, -1.0250244140625, -0.93231201171875, -0.839599609375, -0.74688720703125, -0.6541748046875, -0.56146240234375, -0.46875, -0.37603759765625, -0.2833251953125, -0.19061279296875, -0.097900390625, -0.00518798828125, 0.0875244140625, 0.18023681640625, 0.27294921875, 0.36566162109375, 0.4583740234375, 0.55108642578125, 0.643798828125, 0.73651123046875, 0.8292236328125, 0.92193603515625, 1.0146484375, 1.10736083984375, 1.2000732421875, 1.29278564453125, 1.385498046875, 1.47821044921875, 1.5709228515625, 1.66363525390625, 1.75634765625, 1.84906005859375, 1.9417724609375, 2.03448486328125, 2.127197265625, 2.21990966796875, 2.3126220703125, 2.40533447265625, 2.498046875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 11.0, 6.0, 12.0, 8.0, 16.0, 17.0, 11.0, 19.0, 23.0, 28.0, 32.0, 28.0, 44.0, 31.0, 35.0, 38.0, 45.0, 48.0, 34.0, 68.0, 49.0, 56.0, 40.0, 44.0, 25.0, 32.0, 26.0, 29.0, 18.0, 25.0, 16.0, 16.0, 10.0, 10.0, 9.0, 8.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0], "bins": [-19.33016014099121, -18.796630859375, -18.26310157775879, -17.729572296142578, -17.196041107177734, -16.662511825561523, -16.128982543945312, -15.595453262329102, -15.06192398071289, -14.52839469909668, -13.994865417480469, -13.461335182189941, -12.92780590057373, -12.39427661895752, -11.860746383666992, -11.327217102050781, -10.79368782043457, -10.26015853881836, -9.726629257202148, -9.193099021911621, -8.65956974029541, -8.1260404586792, -7.59251070022583, -7.058980941772461, -6.52545166015625, -5.991922378540039, -5.45839262008667, -4.924862861633301, -4.39133358001709, -3.8578040599823, -3.3242745399475098, -2.7907450199127197, -2.2572174072265625, -1.7236878871917725, -1.1901583671569824, -0.6566288471221924, -0.12309932708740234, 0.4104301929473877, 0.9439597129821777, 1.4774892330169678, 2.011018753051758, 2.544548273086548, 3.078077793121338, 3.611607313156128, 4.145136833190918, 4.678666114807129, 5.212195873260498, 5.745725631713867, 6.279254913330078, 6.812784194946289, 7.346313953399658, 7.879843711853027, 8.413372993469238, 8.94690227508545, 9.480432510375977, 10.013961791992188, 10.547491073608398, 11.08102035522461, 11.61454963684082, 12.148079872131348, 12.681609153747559, 13.21513843536377, 13.748668670654297, 14.282197952270508, 14.815727233886719]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 5.0, 5.0, 5.0, 6.0, 8.0, 9.0, 10.0, 12.0, 20.0, 20.0, 22.0, 14.0, 27.0, 21.0, 29.0, 29.0, 28.0, 36.0, 34.0, 44.0, 39.0, 47.0, 33.0, 38.0, 35.0, 38.0, 30.0, 47.0, 35.0, 28.0, 40.0, 36.0, 38.0, 32.0, 12.0, 20.0, 12.0, 8.0, 12.0, 12.0, 7.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.04225730895996, -16.521116256713867, -15.999974250793457, -15.478833198547363, -14.95769214630127, -14.43655014038086, -13.915409088134766, -13.394268035888672, -12.873126983642578, -12.351985931396484, -11.830843925476074, -11.30970287322998, -10.788561820983887, -10.267419815063477, -9.746278762817383, -9.225137710571289, -8.703995704650879, -8.182854652404785, -7.661713123321533, -7.140571594238281, -6.6194305419921875, -6.0982890129089355, -5.577147483825684, -5.05600643157959, -4.534864902496338, -4.013723373413086, -3.492582321166992, -2.9714407920837402, -2.4502995014190674, -1.9291582107543945, -1.4080166816711426, -0.8868753910064697, -0.3657341003417969, 0.15540724992752075, 0.6765486001968384, 1.1976900100708008, 1.7188313007354736, 2.2399725914001465, 2.7611141204833984, 3.2822554111480713, 3.803396701812744, 4.324538230895996, 4.84567928314209, 5.366820812225342, 5.887962341308594, 6.4091033935546875, 6.9302449226379395, 7.451386451721191, 7.972527503967285, 8.493668556213379, 9.014810562133789, 9.535951614379883, 10.057092666625977, 10.57823371887207, 11.09937572479248, 11.620516777038574, 12.141658782958984, 12.662799835205078, 13.183941841125488, 13.705082893371582, 14.226223945617676, 14.747365951538086, 15.26850700378418, 15.789648056030273, 16.310789108276367]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 9.0, 13.0, 30.0, 35.0, 53.0, 83.0, 106.0, 182.0, 295.0, 439.0, 715.0, 1197.0, 1930.0, 3210.0, 5222.0, 8721.0, 14763.0, 25444.0, 44534.0, 77614.0, 134849.0, 232610.0, 375754.0, 543356.0, 664508.0, 657022.0, 525941.0, 357943.0, 219142.0, 127717.0, 72774.0, 41187.0, 23795.0, 13744.0, 7870.0, 4497.0, 2761.0, 1602.0, 1014.0, 620.0, 363.0, 220.0, 136.0, 100.0, 52.0, 38.0, 27.0, 12.0, 16.0, 9.0, 3.0, 2.0, 2.0, 5.0], "bins": [-18.53125, -18.0008544921875, -17.470458984375, -16.9400634765625, -16.40966796875, -15.8792724609375, -15.348876953125, -14.8184814453125, -14.2880859375, -13.7576904296875, -13.227294921875, -12.6968994140625, -12.16650390625, -11.6361083984375, -11.105712890625, -10.5753173828125, -10.044921875, -9.5145263671875, -8.984130859375, -8.4537353515625, -7.92333984375, -7.3929443359375, -6.862548828125, -6.3321533203125, -5.8017578125, -5.2713623046875, -4.740966796875, -4.2105712890625, -3.68017578125, -3.1497802734375, -2.619384765625, -2.0889892578125, -1.55859375, -1.0281982421875, -0.497802734375, 0.0325927734375, 0.56298828125, 1.0933837890625, 1.623779296875, 2.1541748046875, 2.6845703125, 3.2149658203125, 3.745361328125, 4.2757568359375, 4.80615234375, 5.3365478515625, 5.866943359375, 6.3973388671875, 6.927734375, 7.4581298828125, 7.988525390625, 8.5189208984375, 9.04931640625, 9.5797119140625, 10.110107421875, 10.6405029296875, 11.1708984375, 11.7012939453125, 12.231689453125, 12.7620849609375, 13.29248046875, 13.8228759765625, 14.353271484375, 14.8836669921875, 15.4140625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 2.0, 6.0, 5.0, 5.0, 11.0, 9.0, 5.0, 19.0, 18.0, 23.0, 14.0, 23.0, 25.0, 25.0, 25.0, 31.0, 34.0, 30.0, 37.0, 41.0, 45.0, 44.0, 29.0, 38.0, 38.0, 31.0, 38.0, 35.0, 39.0, 32.0, 42.0, 38.0, 33.0, 23.0, 18.0, 17.0, 13.0, 4.0, 13.0, 9.0, 8.0, 4.0, 3.0, 6.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.734375, -14.2796630859375, -13.824951171875, -13.3702392578125, -12.91552734375, -12.4608154296875, -12.006103515625, -11.5513916015625, -11.0966796875, -10.6419677734375, -10.187255859375, -9.7325439453125, -9.27783203125, -8.8231201171875, -8.368408203125, -7.9136962890625, -7.458984375, -7.0042724609375, -6.549560546875, -6.0948486328125, -5.64013671875, -5.1854248046875, -4.730712890625, -4.2760009765625, -3.8212890625, -3.3665771484375, -2.911865234375, -2.4571533203125, -2.00244140625, -1.5477294921875, -1.093017578125, -0.6383056640625, -0.18359375, 0.2711181640625, 0.725830078125, 1.1805419921875, 1.63525390625, 2.0899658203125, 2.544677734375, 2.9993896484375, 3.4541015625, 3.9088134765625, 4.363525390625, 4.8182373046875, 5.27294921875, 5.7276611328125, 6.182373046875, 6.6370849609375, 7.091796875, 7.5465087890625, 8.001220703125, 8.4559326171875, 8.91064453125, 9.3653564453125, 9.820068359375, 10.2747802734375, 10.7294921875, 11.1842041015625, 11.638916015625, 12.0936279296875, 12.54833984375, 13.0030517578125, 13.457763671875, 13.9124755859375, 14.3671875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 4.0, 6.0, 14.0, 15.0, 31.0, 42.0, 69.0, 111.0, 172.0, 291.0, 428.0, 676.0, 1131.0, 1708.0, 2850.0, 4401.0, 7189.0, 11674.0, 18923.0, 30652.0, 49281.0, 78871.0, 123327.0, 189698.0, 278984.0, 382191.0, 481555.0, 535924.0, 522133.0, 446247.0, 341766.0, 242477.0, 162541.0, 104933.0, 65959.0, 40962.0, 25330.0, 16035.0, 9682.0, 5894.0, 3712.0, 2364.0, 1478.0, 919.0, 621.0, 393.0, 226.0, 108.0, 116.0, 63.0, 39.0, 38.0, 17.0, 14.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.1171875, -14.6419677734375, -14.166748046875, -13.6915283203125, -13.21630859375, -12.7410888671875, -12.265869140625, -11.7906494140625, -11.3154296875, -10.8402099609375, -10.364990234375, -9.8897705078125, -9.41455078125, -8.9393310546875, -8.464111328125, -7.9888916015625, -7.513671875, -7.0384521484375, -6.563232421875, -6.0880126953125, -5.61279296875, -5.1375732421875, -4.662353515625, -4.1871337890625, -3.7119140625, -3.2366943359375, -2.761474609375, -2.2862548828125, -1.81103515625, -1.3358154296875, -0.860595703125, -0.3853759765625, 0.08984375, 0.5650634765625, 1.040283203125, 1.5155029296875, 1.99072265625, 2.4659423828125, 2.941162109375, 3.4163818359375, 3.8916015625, 4.3668212890625, 4.842041015625, 5.3172607421875, 5.79248046875, 6.2677001953125, 6.742919921875, 7.2181396484375, 7.693359375, 8.1685791015625, 8.643798828125, 9.1190185546875, 9.59423828125, 10.0694580078125, 10.544677734375, 11.0198974609375, 11.4951171875, 11.9703369140625, 12.445556640625, 12.9207763671875, 13.39599609375, 13.8712158203125, 14.346435546875, 14.8216552734375, 15.296875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 7.0, 9.0, 10.0, 12.0, 23.0, 27.0, 35.0, 44.0, 52.0, 73.0, 99.0, 96.0, 120.0, 172.0, 173.0, 197.0, 222.0, 240.0, 257.0, 235.0, 239.0, 242.0, 250.0, 215.0, 186.0, 169.0, 119.0, 104.0, 96.0, 88.0, 61.0, 54.0, 35.0, 28.0, 16.0, 18.0, 14.0, 14.0, 8.0, 8.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.41015625, -7.16107177734375, -6.9119873046875, -6.66290283203125, -6.413818359375, -6.16473388671875, -5.9156494140625, -5.66656494140625, -5.41748046875, -5.16839599609375, -4.9193115234375, -4.67022705078125, -4.421142578125, -4.17205810546875, -3.9229736328125, -3.67388916015625, -3.4248046875, -3.17572021484375, -2.9266357421875, -2.67755126953125, -2.428466796875, -2.17938232421875, -1.9302978515625, -1.68121337890625, -1.43212890625, -1.18304443359375, -0.9339599609375, -0.68487548828125, -0.435791015625, -0.18670654296875, 0.0623779296875, 0.31146240234375, 0.560546875, 0.80963134765625, 1.0587158203125, 1.30780029296875, 1.556884765625, 1.80596923828125, 2.0550537109375, 2.30413818359375, 2.55322265625, 2.80230712890625, 3.0513916015625, 3.30047607421875, 3.549560546875, 3.79864501953125, 4.0477294921875, 4.29681396484375, 4.5458984375, 4.79498291015625, 5.0440673828125, 5.29315185546875, 5.542236328125, 5.79132080078125, 6.0404052734375, 6.28948974609375, 6.53857421875, 6.78765869140625, 7.0367431640625, 7.28582763671875, 7.534912109375, 7.78399658203125, 8.0330810546875, 8.28216552734375, 8.53125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 4.0, 6.0, 4.0, 12.0, 10.0, 15.0, 15.0, 14.0, 27.0, 24.0, 34.0, 32.0, 41.0, 46.0, 64.0, 34.0, 51.0, 41.0, 56.0, 45.0, 54.0, 49.0, 49.0, 53.0, 34.0, 25.0, 31.0, 26.0, 19.0, 19.0, 17.0, 13.0, 9.0, 8.0, 4.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.411867141723633, -16.836896896362305, -16.26192855834961, -15.686959266662598, -15.111989974975586, -14.537019729614258, -13.962050437927246, -13.387081146240234, -12.812111854553223, -12.237142562866211, -11.6621732711792, -11.087203979492188, -10.51223373413086, -9.937265396118164, -9.362295150756836, -8.787325859069824, -8.212356567382812, -7.637387275695801, -7.062417984008789, -6.487448215484619, -5.912478923797607, -5.337509632110596, -4.762539863586426, -4.187570571899414, -3.6126012802124023, -3.0376319885253906, -2.4626624584198, -1.8876930475234985, -1.3127236366271973, -0.7377543449401855, -0.16278481483459473, 0.4121847152709961, 0.9871559143066406, 1.562125325202942, 2.137094736099243, 2.712064266204834, 3.2870335578918457, 3.8620028495788574, 4.436972618103027, 5.011941909790039, 5.586911201477051, 6.1618804931640625, 6.736849784851074, 7.311819553375244, 7.886788845062256, 8.46175765991211, 9.036727905273438, 9.61169719696045, 10.186666488647461, 10.761635780334473, 11.336605072021484, 11.911574363708496, 12.486543655395508, 13.061513900756836, 13.636483192443848, 14.21145248413086, 14.786421775817871, 15.361391067504883, 15.936360359191895, 16.511329650878906, 17.086299896240234, 17.66126823425293, 18.236238479614258, 18.811206817626953, 19.38617706298828]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 6.0, 7.0, 3.0, 5.0, 11.0, 9.0, 9.0, 13.0, 19.0, 25.0, 20.0, 21.0, 42.0, 24.0, 30.0, 38.0, 37.0, 46.0, 39.0, 39.0, 41.0, 40.0, 50.0, 37.0, 42.0, 38.0, 38.0, 36.0, 30.0, 27.0, 30.0, 24.0, 26.0, 21.0, 21.0, 12.0, 4.0, 8.0, 13.0, 5.0, 7.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-19.561710357666016, -19.025951385498047, -18.490190505981445, -17.954431533813477, -17.418670654296875, -16.882911682128906, -16.347150802612305, -15.811391830444336, -15.275630950927734, -14.73987102508545, -14.204111099243164, -13.668351173400879, -13.132591247558594, -12.596831321716309, -12.061071395874023, -11.525312423706055, -10.98955249786377, -10.453792572021484, -9.9180326461792, -9.382272720336914, -8.846512794494629, -8.310752868652344, -7.774993419647217, -7.239233493804932, -6.7034735679626465, -6.167713642120361, -5.631953716278076, -5.096194267272949, -4.560434341430664, -4.024674415588379, -3.4889144897460938, -2.9531545639038086, -2.417393684387207, -1.8816337585449219, -1.3458739519119263, -0.8101141452789307, -0.2743542194366455, 0.26140570640563965, 0.7971653938293457, 1.3329253196716309, 1.868685245513916, 2.404445171356201, 2.9402050971984863, 3.4759647846221924, 4.011724472045898, 4.547484397888184, 5.083244323730469, 5.619004249572754, 6.154764175415039, 6.690524101257324, 7.226284027099609, 7.7620439529418945, 8.29780387878418, 8.833563804626465, 9.36932373046875, 9.905082702636719, 10.44084358215332, 10.976603507995605, 11.51236343383789, 12.048123359680176, 12.583883285522461, 13.119643211364746, 13.655403137207031, 14.191162109375, 14.726922035217285]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 15.0, 15.0, 27.0, 44.0, 68.0, 119.0, 161.0, 302.0, 484.0, 837.0, 1351.0, 2189.0, 3743.0, 6019.0, 9935.0, 15733.0, 24415.0, 37926.0, 54863.0, 77045.0, 99707.0, 118235.0, 125733.0, 119720.0, 102111.0, 79606.0, 58080.0, 39507.0, 26296.0, 16785.0, 10649.0, 6494.0, 4087.0, 2495.0, 1546.0, 823.0, 553.0, 292.0, 213.0, 118.0, 75.0, 51.0, 33.0, 25.0, 14.0, 6.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.1484375, -4.99951171875, -4.8505859375, -4.70166015625, -4.552734375, -4.40380859375, -4.2548828125, -4.10595703125, -3.95703125, -3.80810546875, -3.6591796875, -3.51025390625, -3.361328125, -3.21240234375, -3.0634765625, -2.91455078125, -2.765625, -2.61669921875, -2.4677734375, -2.31884765625, -2.169921875, -2.02099609375, -1.8720703125, -1.72314453125, -1.57421875, -1.42529296875, -1.2763671875, -1.12744140625, -0.978515625, -0.82958984375, -0.6806640625, -0.53173828125, -0.3828125, -0.23388671875, -0.0849609375, 0.06396484375, 0.212890625, 0.36181640625, 0.5107421875, 0.65966796875, 0.80859375, 0.95751953125, 1.1064453125, 1.25537109375, 1.404296875, 1.55322265625, 1.7021484375, 1.85107421875, 2.0, 2.14892578125, 2.2978515625, 2.44677734375, 2.595703125, 2.74462890625, 2.8935546875, 3.04248046875, 3.19140625, 3.34033203125, 3.4892578125, 3.63818359375, 3.787109375, 3.93603515625, 4.0849609375, 4.23388671875, 4.3828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 8.0, 3.0, 3.0, 12.0, 10.0, 9.0, 13.0, 19.0, 22.0, 22.0, 23.0, 39.0, 29.0, 26.0, 37.0, 36.0, 48.0, 38.0, 37.0, 44.0, 39.0, 51.0, 36.0, 40.0, 38.0, 42.0, 35.0, 28.0, 25.0, 32.0, 23.0, 25.0, 26.0, 19.0, 12.0, 4.0, 10.0, 13.0, 5.0, 7.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-19.578125, -19.0416259765625, -18.505126953125, -17.9686279296875, -17.43212890625, -16.8956298828125, -16.359130859375, -15.8226318359375, -15.2861328125, -14.7496337890625, -14.213134765625, -13.6766357421875, -13.14013671875, -12.6036376953125, -12.067138671875, -11.5306396484375, -10.994140625, -10.4576416015625, -9.921142578125, -9.3846435546875, -8.84814453125, -8.3116455078125, -7.775146484375, -7.2386474609375, -6.7021484375, -6.1656494140625, -5.629150390625, -5.0926513671875, -4.55615234375, -4.0196533203125, -3.483154296875, -2.9466552734375, -2.41015625, -1.8736572265625, -1.337158203125, -0.8006591796875, -0.26416015625, 0.2723388671875, 0.808837890625, 1.3453369140625, 1.8818359375, 2.4183349609375, 2.954833984375, 3.4913330078125, 4.02783203125, 4.5643310546875, 5.100830078125, 5.6373291015625, 6.173828125, 6.7103271484375, 7.246826171875, 7.7833251953125, 8.31982421875, 8.8563232421875, 9.392822265625, 9.9293212890625, 10.4658203125, 11.0023193359375, 11.538818359375, 12.0753173828125, 12.61181640625, 13.1483154296875, 13.684814453125, 14.2213134765625, 14.7578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 9.0, 6.0, 17.0, 11.0, 14.0, 25.0, 43.0, 56.0, 95.0, 136.0, 210.0, 378.0, 522.0, 953.0, 1445.0, 2464.0, 4117.0, 6904.0, 11730.0, 21013.0, 41091.0, 820811.0, 76760.0, 25269.0, 14069.0, 8109.0, 4905.0, 2838.0, 1735.0, 1031.0, 603.0, 405.0, 247.0, 178.0, 96.0, 78.0, 49.0, 30.0, 25.0, 16.0, 13.0, 14.0, 9.0, 4.0, 5.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0], "bins": [-15.28125, -14.8133544921875, -14.345458984375, -13.8775634765625, -13.40966796875, -12.9417724609375, -12.473876953125, -12.0059814453125, -11.5380859375, -11.0701904296875, -10.602294921875, -10.1343994140625, -9.66650390625, -9.1986083984375, -8.730712890625, -8.2628173828125, -7.794921875, -7.3270263671875, -6.859130859375, -6.3912353515625, -5.92333984375, -5.4554443359375, -4.987548828125, -4.5196533203125, -4.0517578125, -3.5838623046875, -3.115966796875, -2.6480712890625, -2.18017578125, -1.7122802734375, -1.244384765625, -0.7764892578125, -0.30859375, 0.1593017578125, 0.627197265625, 1.0950927734375, 1.56298828125, 2.0308837890625, 2.498779296875, 2.9666748046875, 3.4345703125, 3.9024658203125, 4.370361328125, 4.8382568359375, 5.30615234375, 5.7740478515625, 6.241943359375, 6.7098388671875, 7.177734375, 7.6456298828125, 8.113525390625, 8.5814208984375, 9.04931640625, 9.5172119140625, 9.985107421875, 10.4530029296875, 10.9208984375, 11.3887939453125, 11.856689453125, 12.3245849609375, 12.79248046875, 13.2603759765625, 13.728271484375, 14.1961669921875, 14.6640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 6.0, 13.0, 8.0, 8.0, 13.0, 14.0, 17.0, 19.0, 25.0, 24.0, 34.0, 24.0, 39.0, 38.0, 38.0, 40.0, 42.0, 39.0, 40.0, 36.0, 37.0, 38.0, 27.0, 36.0, 30.0, 41.0, 31.0, 29.0, 30.0, 24.0, 19.0, 15.0, 18.0, 26.0, 10.0, 10.0, 12.0, 13.0, 7.0, 3.0, 5.0, 3.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8984375, -8.5606689453125, -8.222900390625, -7.8851318359375, -7.54736328125, -7.2095947265625, -6.871826171875, -6.5340576171875, -6.1962890625, -5.8585205078125, -5.520751953125, -5.1829833984375, -4.84521484375, -4.5074462890625, -4.169677734375, -3.8319091796875, -3.494140625, -3.1563720703125, -2.818603515625, -2.4808349609375, -2.14306640625, -1.8052978515625, -1.467529296875, -1.1297607421875, -0.7919921875, -0.4542236328125, -0.116455078125, 0.2213134765625, 0.55908203125, 0.8968505859375, 1.234619140625, 1.5723876953125, 1.91015625, 2.2479248046875, 2.585693359375, 2.9234619140625, 3.26123046875, 3.5989990234375, 3.936767578125, 4.2745361328125, 4.6123046875, 4.9500732421875, 5.287841796875, 5.6256103515625, 5.96337890625, 6.3011474609375, 6.638916015625, 6.9766845703125, 7.314453125, 7.6522216796875, 7.989990234375, 8.3277587890625, 8.66552734375, 9.0032958984375, 9.341064453125, 9.6788330078125, 10.0166015625, 10.3543701171875, 10.692138671875, 11.0299072265625, 11.36767578125, 11.7054443359375, 12.043212890625, 12.3809814453125, 12.71875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 6.0, 13.0, 14.0, 26.0, 20.0, 39.0, 63.0, 96.0, 120.0, 186.0, 272.0, 406.0, 612.0, 962.0, 1635.0, 2519.0, 4280.0, 7135.0, 12626.0, 23838.0, 71413.0, 824973.0, 48374.0, 21006.0, 11217.0, 6509.0, 3817.0, 2310.0, 1445.0, 866.0, 598.0, 357.0, 274.0, 146.0, 95.0, 97.0, 47.0, 47.0, 14.0, 18.0, 18.0, 11.0, 8.0, 5.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81640625, -0.7886428833007812, -0.7608795166015625, -0.7331161499023438, -0.705352783203125, -0.6775894165039062, -0.6498260498046875, -0.6220626831054688, -0.59429931640625, -0.5665359497070312, -0.5387725830078125, -0.5110092163085938, -0.483245849609375, -0.45548248291015625, -0.4277191162109375, -0.39995574951171875, -0.3721923828125, -0.34442901611328125, -0.3166656494140625, -0.28890228271484375, -0.261138916015625, -0.23337554931640625, -0.2056121826171875, -0.17784881591796875, -0.15008544921875, -0.12232208251953125, -0.0945587158203125, -0.06679534912109375, -0.039031982421875, -0.01126861572265625, 0.0164947509765625, 0.04425811767578125, 0.072021484375, 0.09978485107421875, 0.1275482177734375, 0.15531158447265625, 0.183074951171875, 0.21083831787109375, 0.2386016845703125, 0.26636505126953125, 0.29412841796875, 0.32189178466796875, 0.3496551513671875, 0.37741851806640625, 0.405181884765625, 0.43294525146484375, 0.4607086181640625, 0.48847198486328125, 0.5162353515625, 0.5439987182617188, 0.5717620849609375, 0.5995254516601562, 0.627288818359375, 0.6550521850585938, 0.6828155517578125, 0.7105789184570312, 0.73834228515625, 0.7661056518554688, 0.7938690185546875, 0.8216323852539062, 0.849395751953125, 0.8771591186523438, 0.9049224853515625, 0.9326858520507812, 0.96044921875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 11.0, 7.0, 11.0, 12.0, 11.0, 17.0, 13.0, 23.0, 29.0, 39.0, 40.0, 38.0, 54.0, 57.0, 65.0, 67.0, 62.0, 64.0, 50.0, 48.0, 44.0, 45.0, 27.0, 35.0, 15.0, 24.0, 16.0, 12.0, 15.0, 7.0, 4.0, 10.0, 5.0, 1.0, 7.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-8.499622344970703e-05, -8.279364556074142e-05, -8.059106767177582e-05, -7.838848978281021e-05, -7.61859118938446e-05, -7.3983334004879e-05, -7.178075611591339e-05, -6.957817822694778e-05, -6.737560033798218e-05, -6.517302244901657e-05, -6.297044456005096e-05, -6.076786667108536e-05, -5.856528878211975e-05, -5.6362710893154144e-05, -5.416013300418854e-05, -5.195755511522293e-05, -4.9754977226257324e-05, -4.755239933729172e-05, -4.534982144832611e-05, -4.3147243559360504e-05, -4.09446656703949e-05, -3.874208778142929e-05, -3.6539509892463684e-05, -3.433693200349808e-05, -3.213435411453247e-05, -2.9931776225566864e-05, -2.7729198336601257e-05, -2.552662044763565e-05, -2.3324042558670044e-05, -2.1121464669704437e-05, -1.891888678073883e-05, -1.6716308891773224e-05, -1.4513731002807617e-05, -1.231115311384201e-05, -1.0108575224876404e-05, -7.905997335910797e-06, -5.7034194469451904e-06, -3.5008415579795837e-06, -1.298263669013977e-06, 9.043142199516296e-07, 3.1068921089172363e-06, 5.309469997882843e-06, 7.51204788684845e-06, 9.714625775814056e-06, 1.1917203664779663e-05, 1.411978155374527e-05, 1.6322359442710876e-05, 1.8524937331676483e-05, 2.072751522064209e-05, 2.2930093109607697e-05, 2.5132670998573303e-05, 2.733524888753891e-05, 2.9537826776504517e-05, 3.174040466547012e-05, 3.394298255443573e-05, 3.614556044340134e-05, 3.834813833236694e-05, 4.055071622133255e-05, 4.275329411029816e-05, 4.4955871999263763e-05, 4.715844988822937e-05, 4.936102777719498e-05, 5.1563605666160583e-05, 5.376618355512619e-05, 5.59687614440918e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 9.0, 14.0, 11.0, 17.0, 39.0, 61.0, 105.0, 141.0, 249.0, 367.0, 631.0, 1077.0, 1657.0, 2765.0, 4339.0, 6979.0, 11102.0, 17576.0, 26967.0, 40755.0, 59006.0, 81850.0, 104069.0, 121312.0, 125876.0, 116213.0, 97663.0, 74391.0, 52850.0, 36010.0, 23583.0, 15170.0, 9781.0, 6060.0, 3777.0, 2377.0, 1412.0, 850.0, 540.0, 331.0, 205.0, 133.0, 79.0, 60.0, 30.0, 31.0, 16.0, 14.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.67626953125, -0.654693603515625, -0.63311767578125, -0.611541748046875, -0.5899658203125, -0.568389892578125, -0.54681396484375, -0.525238037109375, -0.503662109375, -0.482086181640625, -0.46051025390625, -0.438934326171875, -0.4173583984375, -0.395782470703125, -0.37420654296875, -0.352630615234375, -0.3310546875, -0.309478759765625, -0.28790283203125, -0.266326904296875, -0.2447509765625, -0.223175048828125, -0.20159912109375, -0.180023193359375, -0.158447265625, -0.136871337890625, -0.11529541015625, -0.093719482421875, -0.0721435546875, -0.050567626953125, -0.02899169921875, -0.007415771484375, 0.01416015625, 0.035736083984375, 0.05731201171875, 0.078887939453125, 0.1004638671875, 0.122039794921875, 0.14361572265625, 0.165191650390625, 0.186767578125, 0.208343505859375, 0.22991943359375, 0.251495361328125, 0.2730712890625, 0.294647216796875, 0.31622314453125, 0.337799072265625, 0.359375, 0.380950927734375, 0.40252685546875, 0.424102783203125, 0.4456787109375, 0.467254638671875, 0.48883056640625, 0.510406494140625, 0.531982421875, 0.553558349609375, 0.57513427734375, 0.596710205078125, 0.6182861328125, 0.639862060546875, 0.66143798828125, 0.683013916015625, 0.70458984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 7.0, 6.0, 9.0, 11.0, 13.0, 13.0, 15.0, 18.0, 24.0, 32.0, 28.0, 26.0, 33.0, 40.0, 38.0, 46.0, 42.0, 43.0, 51.0, 38.0, 45.0, 44.0, 39.0, 37.0, 36.0, 36.0, 38.0, 34.0, 25.0, 17.0, 12.0, 17.0, 16.0, 16.0, 7.0, 12.0, 6.0, 5.0, 8.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.268310546875, -0.2587890625, -0.249267578125, -0.23974609375, -0.230224609375, -0.220703125, -0.211181640625, -0.20166015625, -0.192138671875, -0.1826171875, -0.173095703125, -0.16357421875, -0.154052734375, -0.14453125, -0.135009765625, -0.12548828125, -0.115966796875, -0.1064453125, -0.096923828125, -0.08740234375, -0.077880859375, -0.068359375, -0.058837890625, -0.04931640625, -0.039794921875, -0.0302734375, -0.020751953125, -0.01123046875, -0.001708984375, 0.0078125, 0.017333984375, 0.02685546875, 0.036376953125, 0.0458984375, 0.055419921875, 0.06494140625, 0.074462890625, 0.083984375, 0.093505859375, 0.10302734375, 0.112548828125, 0.1220703125, 0.131591796875, 0.14111328125, 0.150634765625, 0.16015625, 0.169677734375, 0.17919921875, 0.188720703125, 0.1982421875, 0.207763671875, 0.21728515625, 0.226806640625, 0.236328125, 0.245849609375, 0.25537109375, 0.264892578125, 0.2744140625, 0.283935546875, 0.29345703125, 0.302978515625, 0.3125, 0.322021484375, 0.33154296875, 0.341064453125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 4.0, 15.0, 8.0, 12.0, 11.0, 16.0, 22.0, 24.0, 31.0, 38.0, 35.0, 45.0, 56.0, 42.0, 47.0, 42.0, 47.0, 56.0, 43.0, 60.0, 43.0, 49.0, 38.0, 28.0, 36.0, 35.0, 15.0, 17.0, 21.0, 12.0, 6.0, 14.0, 10.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.721406936645508, -17.143901824951172, -16.566396713256836, -15.9888916015625, -15.411385536193848, -14.833880424499512, -14.256375312805176, -13.678869247436523, -13.101364135742188, -12.523859024047852, -11.946353912353516, -11.36884880065918, -10.791342735290527, -10.213837623596191, -9.636332511901855, -9.058826446533203, -8.481322288513184, -7.903817176818848, -7.3263115882873535, -6.748806476593018, -6.171300888061523, -5.5937957763671875, -5.016290664672852, -4.438785076141357, -3.8612799644470215, -3.2837746143341064, -2.7062692642211914, -2.1287641525268555, -1.5512588024139404, -0.9737534523010254, -0.39624834060668945, 0.1812572479248047, 0.7587623596191406, 1.3362677097320557, 1.9137729406356812, 2.4912781715393066, 3.0687835216522217, 3.6462888717651367, 4.223793983459473, 4.801299571990967, 5.378804683685303, 5.956309795379639, 6.533815383911133, 7.111320495605469, 7.688825607299805, 8.26633071899414, 8.843835830688477, 9.421341896057129, 9.998847007751465, 10.5763521194458, 11.153857231140137, 11.731363296508789, 12.308868408203125, 12.886373519897461, 13.463878631591797, 14.041383743286133, 14.618888854980469, 15.196393966674805, 15.77389907836914, 16.351404190063477, 16.928909301757812, 17.50641632080078, 18.083919525146484, 18.661426544189453, 19.23893165588379]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 8.0, 3.0, 2.0, 12.0, 9.0, 11.0, 14.0, 15.0, 24.0, 20.0, 24.0, 41.0, 27.0, 27.0, 40.0, 31.0, 51.0, 33.0, 47.0, 40.0, 35.0, 54.0, 35.0, 41.0, 40.0, 39.0, 37.0, 26.0, 32.0, 29.0, 23.0, 23.0, 25.0, 23.0, 8.0, 7.0, 10.0, 11.0, 4.0, 6.0, 5.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-19.69591522216797, -19.156055450439453, -18.616195678710938, -18.076337814331055, -17.53647804260254, -16.996618270874023, -16.456758499145508, -15.916899681091309, -15.37704086303711, -14.837181091308594, -14.297322273254395, -13.757462501525879, -13.21760368347168, -12.677743911743164, -12.137884140014648, -11.59802532196045, -11.058165550231934, -10.518305778503418, -9.978446960449219, -9.438587188720703, -8.898728370666504, -8.358868598937988, -7.819009304046631, -7.279150009155273, -6.739290714263916, -6.199431419372559, -5.659572124481201, -5.119712829589844, -4.579853057861328, -4.039994239807129, -3.5001344680786133, -2.960275173187256, -2.420414924621582, -1.8805556297302246, -1.3406962156295776, -0.8008368015289307, -0.26097750663757324, 0.2788817882537842, 0.8187413215637207, 1.3586006164550781, 1.8984599113464355, 2.438319206237793, 2.9781785011291504, 3.518038034439087, 4.057897567749023, 4.597756385803223, 5.137616157531738, 5.677475452423096, 6.217334747314453, 6.7571940422058105, 7.297053337097168, 7.836913108825684, 8.376771926879883, 8.916631698608398, 9.456491470336914, 9.996350288391113, 10.536209106445312, 11.076068878173828, 11.615927696228027, 12.155787467956543, 12.695646286010742, 13.235506057739258, 13.775365829467773, 14.315224647521973, 14.855084419250488]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 7.0, 14.0, 17.0, 36.0, 49.0, 71.0, 129.0, 191.0, 318.0, 483.0, 798.0, 1300.0, 2081.0, 3383.0, 5592.0, 8917.0, 14152.0, 21537.0, 32795.0, 46858.0, 64420.0, 82127.0, 98116.0, 110115.0, 112663.0, 105678.0, 91251.0, 74179.0, 55739.0, 39763.0, 27490.0, 17785.0, 11403.0, 7318.0, 4584.0, 2758.0, 1670.0, 1030.0, 693.0, 383.0, 250.0, 151.0, 104.0, 56.0, 41.0, 24.0, 17.0, 10.0, 7.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.203125, -11.771484375, -11.33984375, -10.908203125, -10.4765625, -10.044921875, -9.61328125, -9.181640625, -8.75, -8.318359375, -7.88671875, -7.455078125, -7.0234375, -6.591796875, -6.16015625, -5.728515625, -5.296875, -4.865234375, -4.43359375, -4.001953125, -3.5703125, -3.138671875, -2.70703125, -2.275390625, -1.84375, -1.412109375, -0.98046875, -0.548828125, -0.1171875, 0.314453125, 0.74609375, 1.177734375, 1.609375, 2.041015625, 2.47265625, 2.904296875, 3.3359375, 3.767578125, 4.19921875, 4.630859375, 5.0625, 5.494140625, 5.92578125, 6.357421875, 6.7890625, 7.220703125, 7.65234375, 8.083984375, 8.515625, 8.947265625, 9.37890625, 9.810546875, 10.2421875, 10.673828125, 11.10546875, 11.537109375, 11.96875, 12.400390625, 12.83203125, 13.263671875, 13.6953125, 14.126953125, 14.55859375, 14.990234375, 15.421875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 7.0, 4.0, 2.0, 9.0, 11.0, 10.0, 13.0, 21.0, 19.0, 19.0, 22.0, 39.0, 30.0, 28.0, 37.0, 30.0, 52.0, 33.0, 46.0, 38.0, 39.0, 54.0, 33.0, 41.0, 39.0, 46.0, 34.0, 24.0, 32.0, 30.0, 17.0, 27.0, 27.0, 20.0, 15.0, 6.0, 10.0, 11.0, 6.0, 6.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 3.0], "bins": [-18.9375, -18.4207763671875, -17.904052734375, -17.3873291015625, -16.87060546875, -16.3538818359375, -15.837158203125, -15.3204345703125, -14.8037109375, -14.2869873046875, -13.770263671875, -13.2535400390625, -12.73681640625, -12.2200927734375, -11.703369140625, -11.1866455078125, -10.669921875, -10.1531982421875, -9.636474609375, -9.1197509765625, -8.60302734375, -8.0863037109375, -7.569580078125, -7.0528564453125, -6.5361328125, -6.0194091796875, -5.502685546875, -4.9859619140625, -4.46923828125, -3.9525146484375, -3.435791015625, -2.9190673828125, -2.40234375, -1.8856201171875, -1.368896484375, -0.8521728515625, -0.33544921875, 0.1812744140625, 0.697998046875, 1.2147216796875, 1.7314453125, 2.2481689453125, 2.764892578125, 3.2816162109375, 3.79833984375, 4.3150634765625, 4.831787109375, 5.3485107421875, 5.865234375, 6.3819580078125, 6.898681640625, 7.4154052734375, 7.93212890625, 8.4488525390625, 8.965576171875, 9.4822998046875, 9.9990234375, 10.5157470703125, 11.032470703125, 11.5491943359375, 12.06591796875, 12.5826416015625, 13.099365234375, 13.6160888671875, 14.1328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 11.0, 11.0, 11.0, 24.0, 41.0, 53.0, 80.0, 111.0, 209.0, 282.0, 464.0, 644.0, 1004.0, 1543.0, 2326.0, 3631.0, 5648.0, 8757.0, 13000.0, 19431.0, 28152.0, 40362.0, 54974.0, 71174.0, 87294.0, 99099.0, 105986.0, 104947.0, 95828.0, 81546.0, 64752.0, 48890.0, 35190.0, 24564.0, 16411.0, 11035.0, 7294.0, 4838.0, 3084.0, 1968.0, 1298.0, 917.0, 585.0, 383.0, 227.0, 162.0, 103.0, 83.0, 52.0, 32.0, 20.0, 8.0, 9.0, 3.0, 6.0, 2.0, 4.0], "bins": [-13.1640625, -12.774658203125, -12.38525390625, -11.995849609375, -11.6064453125, -11.217041015625, -10.82763671875, -10.438232421875, -10.048828125, -9.659423828125, -9.27001953125, -8.880615234375, -8.4912109375, -8.101806640625, -7.71240234375, -7.322998046875, -6.93359375, -6.544189453125, -6.15478515625, -5.765380859375, -5.3759765625, -4.986572265625, -4.59716796875, -4.207763671875, -3.818359375, -3.428955078125, -3.03955078125, -2.650146484375, -2.2607421875, -1.871337890625, -1.48193359375, -1.092529296875, -0.703125, -0.313720703125, 0.07568359375, 0.465087890625, 0.8544921875, 1.243896484375, 1.63330078125, 2.022705078125, 2.412109375, 2.801513671875, 3.19091796875, 3.580322265625, 3.9697265625, 4.359130859375, 4.74853515625, 5.137939453125, 5.52734375, 5.916748046875, 6.30615234375, 6.695556640625, 7.0849609375, 7.474365234375, 7.86376953125, 8.253173828125, 8.642578125, 9.031982421875, 9.42138671875, 9.810791015625, 10.2001953125, 10.589599609375, 10.97900390625, 11.368408203125, 11.7578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 8.0, 3.0, 3.0, 8.0, 14.0, 14.0, 18.0, 21.0, 29.0, 30.0, 36.0, 37.0, 38.0, 38.0, 38.0, 52.0, 51.0, 46.0, 45.0, 46.0, 34.0, 39.0, 54.0, 41.0, 42.0, 43.0, 21.0, 25.0, 23.0, 23.0, 17.0, 9.0, 10.0, 11.0, 6.0, 10.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-13.5859375, -13.213623046875, -12.84130859375, -12.468994140625, -12.0966796875, -11.724365234375, -11.35205078125, -10.979736328125, -10.607421875, -10.235107421875, -9.86279296875, -9.490478515625, -9.1181640625, -8.745849609375, -8.37353515625, -8.001220703125, -7.62890625, -7.256591796875, -6.88427734375, -6.511962890625, -6.1396484375, -5.767333984375, -5.39501953125, -5.022705078125, -4.650390625, -4.278076171875, -3.90576171875, -3.533447265625, -3.1611328125, -2.788818359375, -2.41650390625, -2.044189453125, -1.671875, -1.299560546875, -0.92724609375, -0.554931640625, -0.1826171875, 0.189697265625, 0.56201171875, 0.934326171875, 1.306640625, 1.678955078125, 2.05126953125, 2.423583984375, 2.7958984375, 3.168212890625, 3.54052734375, 3.912841796875, 4.28515625, 4.657470703125, 5.02978515625, 5.402099609375, 5.7744140625, 6.146728515625, 6.51904296875, 6.891357421875, 7.263671875, 7.635986328125, 8.00830078125, 8.380615234375, 8.7529296875, 9.125244140625, 9.49755859375, 9.869873046875, 10.2421875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 3.0, 9.0, 11.0, 18.0, 27.0, 52.0, 66.0, 113.0, 173.0, 258.0, 441.0, 858.0, 1480.0, 2636.0, 5189.0, 10235.0, 20605.0, 40899.0, 76879.0, 131091.0, 181637.0, 195770.0, 159186.0, 103548.0, 57493.0, 29232.0, 14850.0, 7361.0, 3861.0, 1955.0, 1061.0, 577.0, 355.0, 218.0, 132.0, 103.0, 69.0, 35.0, 18.0, 17.0, 8.0, 12.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.9453125, -8.6842041015625, -8.423095703125, -8.1619873046875, -7.90087890625, -7.6397705078125, -7.378662109375, -7.1175537109375, -6.8564453125, -6.5953369140625, -6.334228515625, -6.0731201171875, -5.81201171875, -5.5509033203125, -5.289794921875, -5.0286865234375, -4.767578125, -4.5064697265625, -4.245361328125, -3.9842529296875, -3.72314453125, -3.4620361328125, -3.200927734375, -2.9398193359375, -2.6787109375, -2.4176025390625, -2.156494140625, -1.8953857421875, -1.63427734375, -1.3731689453125, -1.112060546875, -0.8509521484375, -0.58984375, -0.3287353515625, -0.067626953125, 0.1934814453125, 0.45458984375, 0.7156982421875, 0.976806640625, 1.2379150390625, 1.4990234375, 1.7601318359375, 2.021240234375, 2.2823486328125, 2.54345703125, 2.8045654296875, 3.065673828125, 3.3267822265625, 3.587890625, 3.8489990234375, 4.110107421875, 4.3712158203125, 4.63232421875, 4.8934326171875, 5.154541015625, 5.4156494140625, 5.6767578125, 5.9378662109375, 6.198974609375, 6.4600830078125, 6.72119140625, 6.9822998046875, 7.243408203125, 7.5045166015625, 7.765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 3.0, 6.0, 12.0, 9.0, 19.0, 9.0, 23.0, 18.0, 29.0, 21.0, 26.0, 37.0, 35.0, 41.0, 35.0, 53.0, 43.0, 52.0, 59.0, 56.0, 33.0, 43.0, 49.0, 42.0, 40.0, 29.0, 31.0, 24.0, 17.0, 17.0, 17.0, 15.0, 8.0, 8.0, 7.0, 7.0, 6.0, 2.0, 6.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005855560302734375, -0.0005657151341438293, -0.0005458742380142212, -0.000526033341884613, -0.0005061924457550049, -0.00048635154962539673, -0.0004665106534957886, -0.0004466697573661804, -0.00042682886123657227, -0.0004069879651069641, -0.00038714706897735596, -0.0003673061728477478, -0.00034746527671813965, -0.0003276243805885315, -0.00030778348445892334, -0.0002879425883293152, -0.00026810169219970703, -0.0002482607960700989, -0.00022841989994049072, -0.00020857900381088257, -0.00018873810768127441, -0.00016889721155166626, -0.0001490563154220581, -0.00012921541929244995, -0.0001093745231628418, -8.953362703323364e-05, -6.969273090362549e-05, -4.9851834774017334e-05, -3.001093864440918e-05, -1.0170042514801025e-05, 9.670853614807129e-06, 2.9511749744415283e-05, 4.935264587402344e-05, 6.919354200363159e-05, 8.903443813323975e-05, 0.0001088753342628479, 0.00012871623039245605, 0.0001485571265220642, 0.00016839802265167236, 0.00018823891878128052, 0.00020807981491088867, 0.00022792071104049683, 0.000247761607170105, 0.00026760250329971313, 0.0002874433994293213, 0.00030728429555892944, 0.0003271251916885376, 0.00034696608781814575, 0.0003668069839477539, 0.00038664788007736206, 0.0004064887762069702, 0.00042632967233657837, 0.0004461705684661865, 0.0004660114645957947, 0.00048585236072540283, 0.000505693256855011, 0.0005255341529846191, 0.0005453750491142273, 0.0005652159452438354, 0.0005850568413734436, 0.0006048977375030518, 0.0006247386336326599, 0.0006445795297622681, 0.0006644204258918762, 0.0006842613220214844]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 12.0, 25.0, 29.0, 66.0, 86.0, 129.0, 196.0, 270.0, 440.0, 719.0, 1089.0, 1743.0, 2838.0, 5035.0, 8844.0, 15357.0, 28082.0, 49293.0, 82607.0, 126366.0, 164051.0, 171663.0, 144224.0, 100673.0, 61705.0, 35881.0, 19986.0, 11242.0, 6442.0, 3640.0, 2119.0, 1292.0, 858.0, 496.0, 344.0, 228.0, 181.0, 103.0, 72.0, 41.0, 33.0, 22.0, 11.0, 7.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30078125, -7.05914306640625, -6.8175048828125, -6.57586669921875, -6.334228515625, -6.09259033203125, -5.8509521484375, -5.60931396484375, -5.36767578125, -5.12603759765625, -4.8843994140625, -4.64276123046875, -4.401123046875, -4.15948486328125, -3.9178466796875, -3.67620849609375, -3.4345703125, -3.19293212890625, -2.9512939453125, -2.70965576171875, -2.468017578125, -2.22637939453125, -1.9847412109375, -1.74310302734375, -1.50146484375, -1.25982666015625, -1.0181884765625, -0.77655029296875, -0.534912109375, -0.29327392578125, -0.0516357421875, 0.19000244140625, 0.431640625, 0.67327880859375, 0.9149169921875, 1.15655517578125, 1.398193359375, 1.63983154296875, 1.8814697265625, 2.12310791015625, 2.36474609375, 2.60638427734375, 2.8480224609375, 3.08966064453125, 3.331298828125, 3.57293701171875, 3.8145751953125, 4.05621337890625, 4.2978515625, 4.53948974609375, 4.7811279296875, 5.02276611328125, 5.264404296875, 5.50604248046875, 5.7476806640625, 5.98931884765625, 6.23095703125, 6.47259521484375, 6.7142333984375, 6.95587158203125, 7.197509765625, 7.43914794921875, 7.6807861328125, 7.92242431640625, 8.1640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 8.0, 6.0, 8.0, 14.0, 25.0, 15.0, 25.0, 39.0, 50.0, 53.0, 54.0, 51.0, 58.0, 64.0, 52.0, 43.0, 51.0, 42.0, 60.0, 50.0, 34.0, 36.0, 46.0, 24.0, 11.0, 14.0, 11.0, 11.0, 6.0, 8.0, 9.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.224609375, -3.134552001953125, -3.04449462890625, -2.954437255859375, -2.8643798828125, -2.774322509765625, -2.68426513671875, -2.594207763671875, -2.504150390625, -2.414093017578125, -2.32403564453125, -2.233978271484375, -2.1439208984375, -2.053863525390625, -1.96380615234375, -1.873748779296875, -1.78369140625, -1.693634033203125, -1.60357666015625, -1.513519287109375, -1.4234619140625, -1.333404541015625, -1.24334716796875, -1.153289794921875, -1.063232421875, -0.973175048828125, -0.88311767578125, -0.793060302734375, -0.7030029296875, -0.612945556640625, -0.52288818359375, -0.432830810546875, -0.3427734375, -0.252716064453125, -0.16265869140625, -0.072601318359375, 0.0174560546875, 0.107513427734375, 0.19757080078125, 0.287628173828125, 0.377685546875, 0.467742919921875, 0.55780029296875, 0.647857666015625, 0.7379150390625, 0.827972412109375, 0.91802978515625, 1.008087158203125, 1.09814453125, 1.188201904296875, 1.27825927734375, 1.368316650390625, 1.4583740234375, 1.548431396484375, 1.63848876953125, 1.728546142578125, 1.818603515625, 1.908660888671875, 1.99871826171875, 2.088775634765625, 2.1788330078125, 2.268890380859375, 2.35894775390625, 2.449005126953125, 2.5390625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 6.0, 0.0, 10.0, 4.0, 14.0, 4.0, 21.0, 25.0, 17.0, 17.0, 29.0, 29.0, 35.0, 41.0, 37.0, 43.0, 45.0, 41.0, 52.0, 38.0, 44.0, 53.0, 45.0, 37.0, 49.0, 36.0, 26.0, 37.0, 29.0, 19.0, 14.0, 11.0, 20.0, 18.0, 9.0, 8.0, 13.0, 8.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.019598007202148, -14.498157501220703, -13.976716995239258, -13.455277442932129, -12.933836936950684, -12.412396430969238, -11.89095687866211, -11.369516372680664, -10.848075866699219, -10.326635360717773, -9.805194854736328, -9.2837553024292, -8.762314796447754, -8.240874290466309, -7.7194342613220215, -7.197994232177734, -6.676553726196289, -6.155113220214844, -5.633673191070557, -5.1122331619262695, -4.590792655944824, -4.069352149963379, -3.547912120819092, -3.0264718532562256, -2.5050315856933594, -1.9835913181304932, -1.462151050567627, -0.9407107830047607, -0.41927051544189453, 0.10216975212097168, 0.6236100196838379, 1.145050287246704, 1.6664905548095703, 2.1879308223724365, 2.7093710899353027, 3.230811357498169, 3.752251625061035, 4.2736921310424805, 4.795132160186768, 5.316572189331055, 5.8380126953125, 6.359453201293945, 6.880893230438232, 7.4023332595825195, 7.923773765563965, 8.44521427154541, 8.966653823852539, 9.488094329833984, 10.00953483581543, 10.530975341796875, 11.05241584777832, 11.57385540008545, 12.095295906066895, 12.61673641204834, 13.138175964355469, 13.659616470336914, 14.18105697631836, 14.702497482299805, 15.22393798828125, 15.745377540588379, 16.26681900024414, 16.788257598876953, 17.3096981048584, 17.831138610839844, 18.35257911682129]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 7.0, 8.0, 6.0, 8.0, 4.0, 7.0, 10.0, 15.0, 13.0, 20.0, 16.0, 21.0, 21.0, 28.0, 32.0, 26.0, 37.0, 42.0, 38.0, 29.0, 29.0, 40.0, 43.0, 27.0, 40.0, 32.0, 51.0, 30.0, 34.0, 34.0, 19.0, 25.0, 34.0, 21.0, 19.0, 20.0, 17.0, 23.0, 13.0, 10.0, 10.0, 11.0, 6.0, 6.0, 5.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-14.489995956420898, -14.008938789367676, -13.527880668640137, -13.046823501586914, -12.565766334533691, -12.084709167480469, -11.60365104675293, -11.122593879699707, -10.641536712646484, -10.160479545593262, -9.679421424865723, -9.1983642578125, -8.717307090759277, -8.236249923706055, -7.755191802978516, -7.274134635925293, -6.793076515197754, -6.312018871307373, -5.83096170425415, -5.3499040603637695, -4.868846893310547, -4.387789249420166, -3.906731605529785, -3.4256742000579834, -2.9446167945861816, -2.46355938911438, -1.9825018644332886, -1.5014443397521973, -1.0203869342803955, -0.5393295288085938, -0.05827188491821289, 0.42278552055358887, 0.9038429260253906, 1.3849003314971924, 1.8659578561782837, 2.347015380859375, 2.8280727863311768, 3.3091301918029785, 3.7901878356933594, 4.271245002746582, 4.752302646636963, 5.233360290527344, 5.714417457580566, 6.195475101470947, 6.676532745361328, 7.157589912414551, 7.638647556304932, 8.119705200195312, 8.600762367248535, 9.081819534301758, 9.562877655029297, 10.04393482208252, 10.524991989135742, 11.006050109863281, 11.487107276916504, 11.968164443969727, 12.449222564697266, 12.930279731750488, 13.411337852478027, 13.89239501953125, 14.373452186584473, 14.854509353637695, 15.335567474365234, 15.816624641418457, 16.29768180847168]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 11.0, 17.0, 32.0, 29.0, 52.0, 81.0, 134.0, 198.0, 280.0, 448.0, 680.0, 1012.0, 1685.0, 2677.0, 4401.0, 7209.0, 11761.0, 19451.0, 33003.0, 56196.0, 96301.0, 161772.0, 263419.0, 397278.0, 535010.0, 618217.0, 597751.0, 487061.0, 345780.0, 222250.0, 134153.0, 79799.0, 47082.0, 27954.0, 16128.0, 9781.0, 5703.0, 3601.0, 2175.0, 1328.0, 925.0, 536.0, 328.0, 242.0, 116.0, 91.0, 52.0, 25.0, 23.0, 17.0, 11.0, 9.0, 0.0, 5.0, 3.0], "bins": [-17.375, -16.8759765625, -16.376953125, -15.8779296875, -15.37890625, -14.8798828125, -14.380859375, -13.8818359375, -13.3828125, -12.8837890625, -12.384765625, -11.8857421875, -11.38671875, -10.8876953125, -10.388671875, -9.8896484375, -9.390625, -8.8916015625, -8.392578125, -7.8935546875, -7.39453125, -6.8955078125, -6.396484375, -5.8974609375, -5.3984375, -4.8994140625, -4.400390625, -3.9013671875, -3.40234375, -2.9033203125, -2.404296875, -1.9052734375, -1.40625, -0.9072265625, -0.408203125, 0.0908203125, 0.58984375, 1.0888671875, 1.587890625, 2.0869140625, 2.5859375, 3.0849609375, 3.583984375, 4.0830078125, 4.58203125, 5.0810546875, 5.580078125, 6.0791015625, 6.578125, 7.0771484375, 7.576171875, 8.0751953125, 8.57421875, 9.0732421875, 9.572265625, 10.0712890625, 10.5703125, 11.0693359375, 11.568359375, 12.0673828125, 12.56640625, 13.0654296875, 13.564453125, 14.0634765625, 14.5625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 8.0, 7.0, 11.0, 5.0, 4.0, 7.0, 11.0, 14.0, 19.0, 19.0, 17.0, 27.0, 16.0, 27.0, 28.0, 36.0, 37.0, 33.0, 37.0, 29.0, 31.0, 45.0, 36.0, 38.0, 47.0, 37.0, 37.0, 33.0, 27.0, 33.0, 18.0, 25.0, 30.0, 21.0, 24.0, 20.0, 15.0, 21.0, 15.0, 10.0, 7.0, 9.0, 7.0, 4.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.546875, -12.1260986328125, -11.705322265625, -11.2845458984375, -10.86376953125, -10.4429931640625, -10.022216796875, -9.6014404296875, -9.1806640625, -8.7598876953125, -8.339111328125, -7.9183349609375, -7.49755859375, -7.0767822265625, -6.656005859375, -6.2352294921875, -5.814453125, -5.3936767578125, -4.972900390625, -4.5521240234375, -4.13134765625, -3.7105712890625, -3.289794921875, -2.8690185546875, -2.4482421875, -2.0274658203125, -1.606689453125, -1.1859130859375, -0.76513671875, -0.3443603515625, 0.076416015625, 0.4971923828125, 0.91796875, 1.3387451171875, 1.759521484375, 2.1802978515625, 2.60107421875, 3.0218505859375, 3.442626953125, 3.8634033203125, 4.2841796875, 4.7049560546875, 5.125732421875, 5.5465087890625, 5.96728515625, 6.3880615234375, 6.808837890625, 7.2296142578125, 7.650390625, 8.0711669921875, 8.491943359375, 8.9127197265625, 9.33349609375, 9.7542724609375, 10.175048828125, 10.5958251953125, 11.0166015625, 11.4373779296875, 11.858154296875, 12.2789306640625, 12.69970703125, 13.1204833984375, 13.541259765625, 13.9620361328125, 14.3828125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 8.0, 14.0, 22.0, 25.0, 46.0, 62.0, 89.0, 136.0, 208.0, 332.0, 489.0, 718.0, 1201.0, 1795.0, 2685.0, 4211.0, 6342.0, 9923.0, 15447.0, 24108.0, 36986.0, 57665.0, 87612.0, 131690.0, 190673.0, 264826.0, 347669.0, 421552.0, 469107.0, 470047.0, 428091.0, 354665.0, 272048.0, 196415.0, 136424.0, 91386.0, 60343.0, 38865.0, 25227.0, 15848.0, 10264.0, 6643.0, 4319.0, 2768.0, 1806.0, 1189.0, 800.0, 522.0, 343.0, 227.0, 158.0, 96.0, 54.0, 44.0, 21.0, 14.0, 10.0, 8.0, 5.0, 0.0, 4.0], "bins": [-13.6171875, -13.1922607421875, -12.767333984375, -12.3424072265625, -11.91748046875, -11.4925537109375, -11.067626953125, -10.6427001953125, -10.2177734375, -9.7928466796875, -9.367919921875, -8.9429931640625, -8.51806640625, -8.0931396484375, -7.668212890625, -7.2432861328125, -6.818359375, -6.3934326171875, -5.968505859375, -5.5435791015625, -5.11865234375, -4.6937255859375, -4.268798828125, -3.8438720703125, -3.4189453125, -2.9940185546875, -2.569091796875, -2.1441650390625, -1.71923828125, -1.2943115234375, -0.869384765625, -0.4444580078125, -0.01953125, 0.4053955078125, 0.830322265625, 1.2552490234375, 1.68017578125, 2.1051025390625, 2.530029296875, 2.9549560546875, 3.3798828125, 3.8048095703125, 4.229736328125, 4.6546630859375, 5.07958984375, 5.5045166015625, 5.929443359375, 6.3543701171875, 6.779296875, 7.2042236328125, 7.629150390625, 8.0540771484375, 8.47900390625, 8.9039306640625, 9.328857421875, 9.7537841796875, 10.1787109375, 10.6036376953125, 11.028564453125, 11.4534912109375, 11.87841796875, 12.3033447265625, 12.728271484375, 13.1531982421875, 13.578125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 0.0, 6.0, 4.0, 11.0, 13.0, 18.0, 27.0, 27.0, 41.0, 40.0, 59.0, 62.0, 85.0, 79.0, 89.0, 116.0, 138.0, 155.0, 147.0, 201.0, 194.0, 217.0, 178.0, 207.0, 217.0, 200.0, 216.0, 188.0, 194.0, 162.0, 124.0, 98.0, 107.0, 85.0, 65.0, 66.0, 63.0, 46.0, 28.0, 27.0, 27.0, 11.0, 9.0, 11.0, 4.0, 7.0, 8.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.4296875, -7.2138671875, -6.998046875, -6.7822265625, -6.56640625, -6.3505859375, -6.134765625, -5.9189453125, -5.703125, -5.4873046875, -5.271484375, -5.0556640625, -4.83984375, -4.6240234375, -4.408203125, -4.1923828125, -3.9765625, -3.7607421875, -3.544921875, -3.3291015625, -3.11328125, -2.8974609375, -2.681640625, -2.4658203125, -2.25, -2.0341796875, -1.818359375, -1.6025390625, -1.38671875, -1.1708984375, -0.955078125, -0.7392578125, -0.5234375, -0.3076171875, -0.091796875, 0.1240234375, 0.33984375, 0.5556640625, 0.771484375, 0.9873046875, 1.203125, 1.4189453125, 1.634765625, 1.8505859375, 2.06640625, 2.2822265625, 2.498046875, 2.7138671875, 2.9296875, 3.1455078125, 3.361328125, 3.5771484375, 3.79296875, 4.0087890625, 4.224609375, 4.4404296875, 4.65625, 4.8720703125, 5.087890625, 5.3037109375, 5.51953125, 5.7353515625, 5.951171875, 6.1669921875, 6.3828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 9.0, 5.0, 14.0, 9.0, 24.0, 24.0, 24.0, 33.0, 36.0, 42.0, 41.0, 58.0, 63.0, 45.0, 71.0, 59.0, 48.0, 52.0, 61.0, 44.0, 45.0, 42.0, 26.0, 27.0, 18.0, 20.0, 18.0, 8.0, 5.0, 13.0, 9.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.374731063842773, -19.740201950073242, -19.105670928955078, -18.471141815185547, -17.836610794067383, -17.20208168029785, -16.567550659179688, -15.933021545410156, -15.298492431640625, -14.663962364196777, -14.02943229675293, -13.394903182983398, -12.76037311553955, -12.125843048095703, -11.491312980651855, -10.856782913208008, -10.22225284576416, -9.587722778320312, -8.953192710876465, -8.318662643432617, -7.684133529663086, -7.049603462219238, -6.415073394775391, -5.780543804168701, -5.1460137367248535, -4.511483669281006, -3.8769540786743164, -3.2424240112304688, -2.6078941822052, -1.9733643531799316, -1.338834285736084, -0.7043046951293945, -0.06977462768554688, 0.5647552609443665, 1.1992851495742798, 1.833815097808838, 2.4683449268341064, 3.102874755859375, 3.7374048233032227, 4.371934413909912, 5.00646448135376, 5.640994548797607, 6.275524139404297, 6.9100542068481445, 7.544584274291992, 8.179113388061523, 8.813644409179688, 9.448173522949219, 10.082703590393066, 10.717233657836914, 11.351763725280762, 11.98629379272461, 12.62082290649414, 13.255352973937988, 13.889883041381836, 14.524412155151367, 15.158943176269531, 15.793473243713379, 16.428003311157227, 17.062532424926758, 17.697063446044922, 18.331592559814453, 18.966121673583984, 19.60065269470215, 20.23518180847168]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 8.0, 5.0, 7.0, 6.0, 7.0, 17.0, 13.0, 15.0, 28.0, 28.0, 28.0, 21.0, 34.0, 45.0, 35.0, 41.0, 34.0, 41.0, 46.0, 49.0, 53.0, 34.0, 32.0, 48.0, 36.0, 35.0, 34.0, 31.0, 31.0, 28.0, 18.0, 18.0, 20.0, 14.0, 17.0, 9.0, 7.0, 8.0, 2.0, 3.0, 7.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.138290405273438, -16.615663528442383, -16.093036651611328, -15.57040786743164, -15.047780990600586, -14.525154113769531, -14.00252628326416, -13.479898452758789, -12.957271575927734, -12.43464469909668, -11.912016868591309, -11.389389038085938, -10.866762161254883, -10.344135284423828, -9.821507453918457, -9.298879623413086, -8.776252746582031, -8.253625869750977, -7.7309980392456055, -7.208370685577393, -6.68574333190918, -6.163115978240967, -5.640488624572754, -5.117861270904541, -4.595233917236328, -4.072606563568115, -3.5499792098999023, -3.0273518562316895, -2.5047245025634766, -1.9820971488952637, -1.4594697952270508, -0.9368424415588379, -0.4142169952392578, 0.10841035842895508, 0.631037712097168, 1.1536650657653809, 1.6762924194335938, 2.1989197731018066, 2.7215471267700195, 3.2441744804382324, 3.7668018341064453, 4.289429187774658, 4.812056541442871, 5.334683895111084, 5.857311248779297, 6.37993860244751, 6.902565956115723, 7.4251933097839355, 7.947820663452148, 8.470447540283203, 8.993075370788574, 9.515703201293945, 10.038330078125, 10.560956954956055, 11.083584785461426, 11.606212615966797, 12.128839492797852, 12.651466369628906, 13.174094200134277, 13.696722030639648, 14.219348907470703, 14.741975784301758, 15.264603614807129, 15.7872314453125, 16.309858322143555]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 10.0, 12.0, 29.0, 41.0, 54.0, 124.0, 204.0, 350.0, 608.0, 1037.0, 1866.0, 3303.0, 5476.0, 9675.0, 15770.0, 26117.0, 41374.0, 63190.0, 93087.0, 122856.0, 144924.0, 143643.0, 120910.0, 89960.0, 61974.0, 40062.0, 24939.0, 15170.0, 9180.0, 5229.0, 3173.0, 1788.0, 984.0, 604.0, 348.0, 197.0, 126.0, 62.0, 37.0, 23.0, 16.0, 6.0, 8.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.880859375, -3.746856689453125, -3.61285400390625, -3.478851318359375, -3.3448486328125, -3.210845947265625, -3.07684326171875, -2.942840576171875, -2.808837890625, -2.674835205078125, -2.54083251953125, -2.406829833984375, -2.2728271484375, -2.138824462890625, -2.00482177734375, -1.870819091796875, -1.73681640625, -1.602813720703125, -1.46881103515625, -1.334808349609375, -1.2008056640625, -1.066802978515625, -0.93280029296875, -0.798797607421875, -0.664794921875, -0.530792236328125, -0.39678955078125, -0.262786865234375, -0.1287841796875, 0.005218505859375, 0.13922119140625, 0.273223876953125, 0.4072265625, 0.541229248046875, 0.67523193359375, 0.809234619140625, 0.9432373046875, 1.077239990234375, 1.21124267578125, 1.345245361328125, 1.479248046875, 1.613250732421875, 1.74725341796875, 1.881256103515625, 2.0152587890625, 2.149261474609375, 2.28326416015625, 2.417266845703125, 2.55126953125, 2.685272216796875, 2.81927490234375, 2.953277587890625, 3.0872802734375, 3.221282958984375, 3.35528564453125, 3.489288330078125, 3.623291015625, 3.757293701171875, 3.89129638671875, 4.025299072265625, 4.1593017578125, 4.293304443359375, 4.42730712890625, 4.561309814453125, 4.6953125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 5.0, 8.0, 5.0, 8.0, 16.0, 13.0, 15.0, 29.0, 30.0, 25.0, 21.0, 36.0, 45.0, 35.0, 39.0, 34.0, 42.0, 46.0, 49.0, 53.0, 33.0, 33.0, 46.0, 35.0, 37.0, 32.0, 33.0, 29.0, 29.0, 18.0, 17.0, 21.0, 14.0, 17.0, 10.0, 6.0, 8.0, 3.0, 3.0, 6.0, 8.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.125, -16.60400390625, -16.0830078125, -15.56201171875, -15.041015625, -14.52001953125, -13.9990234375, -13.47802734375, -12.95703125, -12.43603515625, -11.9150390625, -11.39404296875, -10.873046875, -10.35205078125, -9.8310546875, -9.31005859375, -8.7890625, -8.26806640625, -7.7470703125, -7.22607421875, -6.705078125, -6.18408203125, -5.6630859375, -5.14208984375, -4.62109375, -4.10009765625, -3.5791015625, -3.05810546875, -2.537109375, -2.01611328125, -1.4951171875, -0.97412109375, -0.453125, 0.06787109375, 0.5888671875, 1.10986328125, 1.630859375, 2.15185546875, 2.6728515625, 3.19384765625, 3.71484375, 4.23583984375, 4.7568359375, 5.27783203125, 5.798828125, 6.31982421875, 6.8408203125, 7.36181640625, 7.8828125, 8.40380859375, 8.9248046875, 9.44580078125, 9.966796875, 10.48779296875, 11.0087890625, 11.52978515625, 12.05078125, 12.57177734375, 13.0927734375, 13.61376953125, 14.134765625, 14.65576171875, 15.1767578125, 15.69775390625, 16.21875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 7.0, 4.0, 7.0, 5.0, 8.0, 19.0, 29.0, 46.0, 70.0, 71.0, 145.0, 209.0, 310.0, 489.0, 781.0, 1214.0, 2082.0, 3831.0, 6590.0, 12352.0, 23607.0, 71497.0, 843785.0, 39864.0, 18648.0, 9776.0, 5313.0, 3105.0, 1816.0, 1015.0, 608.0, 428.0, 287.0, 172.0, 108.0, 94.0, 34.0, 33.0, 31.0, 23.0, 16.0, 6.0, 8.0, 5.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-14.8359375, -14.3907470703125, -13.945556640625, -13.5003662109375, -13.05517578125, -12.6099853515625, -12.164794921875, -11.7196044921875, -11.2744140625, -10.8292236328125, -10.384033203125, -9.9388427734375, -9.49365234375, -9.0484619140625, -8.603271484375, -8.1580810546875, -7.712890625, -7.2677001953125, -6.822509765625, -6.3773193359375, -5.93212890625, -5.4869384765625, -5.041748046875, -4.5965576171875, -4.1513671875, -3.7061767578125, -3.260986328125, -2.8157958984375, -2.37060546875, -1.9254150390625, -1.480224609375, -1.0350341796875, -0.58984375, -0.1446533203125, 0.300537109375, 0.7457275390625, 1.19091796875, 1.6361083984375, 2.081298828125, 2.5264892578125, 2.9716796875, 3.4168701171875, 3.862060546875, 4.3072509765625, 4.75244140625, 5.1976318359375, 5.642822265625, 6.0880126953125, 6.533203125, 6.9783935546875, 7.423583984375, 7.8687744140625, 8.31396484375, 8.7591552734375, 9.204345703125, 9.6495361328125, 10.0947265625, 10.5399169921875, 10.985107421875, 11.4302978515625, 11.87548828125, 12.3206787109375, 12.765869140625, 13.2110595703125, 13.65625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 9.0, 11.0, 6.0, 7.0, 6.0, 11.0, 21.0, 11.0, 19.0, 18.0, 21.0, 27.0, 28.0, 25.0, 30.0, 30.0, 29.0, 37.0, 33.0, 50.0, 35.0, 45.0, 26.0, 43.0, 36.0, 24.0, 31.0, 38.0, 34.0, 28.0, 30.0, 26.0, 26.0, 22.0, 27.0, 12.0, 18.0, 17.0, 6.0, 9.0, 11.0, 6.0, 8.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0, -9.697021484375, -9.39404296875, -9.091064453125, -8.7880859375, -8.485107421875, -8.18212890625, -7.879150390625, -7.576171875, -7.273193359375, -6.97021484375, -6.667236328125, -6.3642578125, -6.061279296875, -5.75830078125, -5.455322265625, -5.15234375, -4.849365234375, -4.54638671875, -4.243408203125, -3.9404296875, -3.637451171875, -3.33447265625, -3.031494140625, -2.728515625, -2.425537109375, -2.12255859375, -1.819580078125, -1.5166015625, -1.213623046875, -0.91064453125, -0.607666015625, -0.3046875, -0.001708984375, 0.30126953125, 0.604248046875, 0.9072265625, 1.210205078125, 1.51318359375, 1.816162109375, 2.119140625, 2.422119140625, 2.72509765625, 3.028076171875, 3.3310546875, 3.634033203125, 3.93701171875, 4.239990234375, 4.54296875, 4.845947265625, 5.14892578125, 5.451904296875, 5.7548828125, 6.057861328125, 6.36083984375, 6.663818359375, 6.966796875, 7.269775390625, 7.57275390625, 7.875732421875, 8.1787109375, 8.481689453125, 8.78466796875, 9.087646484375, 9.390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 8.0, 7.0, 10.0, 8.0, 14.0, 20.0, 50.0, 72.0, 80.0, 157.0, 209.0, 424.0, 713.0, 1284.0, 2310.0, 4513.0, 8682.0, 17530.0, 40395.0, 839344.0, 83882.0, 24178.0, 11748.0, 6025.0, 3102.0, 1640.0, 862.0, 506.0, 315.0, 168.0, 102.0, 66.0, 43.0, 35.0, 22.0, 12.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8115234375, -0.7859344482421875, -0.760345458984375, -0.7347564697265625, -0.70916748046875, -0.6835784912109375, -0.657989501953125, -0.6324005126953125, -0.6068115234375, -0.5812225341796875, -0.555633544921875, -0.5300445556640625, -0.50445556640625, -0.4788665771484375, -0.453277587890625, -0.4276885986328125, -0.402099609375, -0.3765106201171875, -0.350921630859375, -0.3253326416015625, -0.29974365234375, -0.2741546630859375, -0.248565673828125, -0.2229766845703125, -0.1973876953125, -0.1717987060546875, -0.146209716796875, -0.1206207275390625, -0.09503173828125, -0.0694427490234375, -0.043853759765625, -0.0182647705078125, 0.00732421875, 0.0329132080078125, 0.058502197265625, 0.0840911865234375, 0.10968017578125, 0.1352691650390625, 0.160858154296875, 0.1864471435546875, 0.2120361328125, 0.2376251220703125, 0.263214111328125, 0.2888031005859375, 0.31439208984375, 0.3399810791015625, 0.365570068359375, 0.3911590576171875, 0.416748046875, 0.4423370361328125, 0.467926025390625, 0.4935150146484375, 0.51910400390625, 0.5446929931640625, 0.570281982421875, 0.5958709716796875, 0.6214599609375, 0.6470489501953125, 0.672637939453125, 0.6982269287109375, 0.72381591796875, 0.7494049072265625, 0.774993896484375, 0.8005828857421875, 0.826171875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 5.0, 2.0, 4.0, 9.0, 5.0, 4.0, 9.0, 9.0, 9.0, 27.0, 25.0, 19.0, 32.0, 31.0, 25.0, 44.0, 60.0, 53.0, 52.0, 41.0, 53.0, 54.0, 57.0, 51.0, 42.0, 53.0, 33.0, 29.0, 25.0, 29.0, 22.0, 16.0, 12.0, 19.0, 8.0, 7.0, 7.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.93986701965332e-05, -3.82671132683754e-05, -3.713555634021759e-05, -3.6003999412059784e-05, -3.487244248390198e-05, -3.374088555574417e-05, -3.2609328627586365e-05, -3.147777169942856e-05, -3.0346214771270752e-05, -2.9214657843112946e-05, -2.808310091495514e-05, -2.6951543986797333e-05, -2.5819987058639526e-05, -2.468843013048172e-05, -2.3556873202323914e-05, -2.2425316274166107e-05, -2.12937593460083e-05, -2.0162202417850494e-05, -1.9030645489692688e-05, -1.789908856153488e-05, -1.6767531633377075e-05, -1.563597470521927e-05, -1.4504417777061462e-05, -1.3372860848903656e-05, -1.224130392074585e-05, -1.1109746992588043e-05, -9.978190064430237e-06, -8.84663313627243e-06, -7.715076208114624e-06, -6.583519279956818e-06, -5.451962351799011e-06, -4.320405423641205e-06, -3.1888484954833984e-06, -2.057291567325592e-06, -9.257346391677856e-07, 2.0582228899002075e-07, 1.3373792171478271e-06, 2.4689361453056335e-06, 3.60049307346344e-06, 4.732050001621246e-06, 5.863606929779053e-06, 6.995163857936859e-06, 8.126720786094666e-06, 9.258277714252472e-06, 1.0389834642410278e-05, 1.1521391570568085e-05, 1.2652948498725891e-05, 1.3784505426883698e-05, 1.4916062355041504e-05, 1.604761928319931e-05, 1.7179176211357117e-05, 1.8310733139514923e-05, 1.944229006767273e-05, 2.0573846995830536e-05, 2.1705403923988342e-05, 2.283696085214615e-05, 2.3968517780303955e-05, 2.510007470846176e-05, 2.6231631636619568e-05, 2.7363188564777374e-05, 2.849474549293518e-05, 2.9626302421092987e-05, 3.0757859349250793e-05, 3.18894162774086e-05, 3.3020973205566406e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 10.0, 18.0, 18.0, 36.0, 49.0, 89.0, 151.0, 225.0, 368.0, 553.0, 839.0, 1276.0, 1846.0, 2893.0, 4360.0, 6360.0, 9382.0, 13638.0, 20250.0, 29208.0, 41834.0, 58219.0, 78760.0, 99552.0, 117711.0, 122132.0, 110567.0, 91141.0, 69978.0, 51524.0, 36383.0, 25566.0, 17217.0, 12031.0, 7819.0, 5530.0, 3748.0, 2492.0, 1641.0, 1112.0, 753.0, 466.0, 309.0, 209.0, 108.0, 74.0, 51.0, 21.0, 21.0, 14.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.59521484375, -0.5767898559570312, -0.5583648681640625, -0.5399398803710938, -0.521514892578125, -0.5030899047851562, -0.4846649169921875, -0.46623992919921875, -0.44781494140625, -0.42938995361328125, -0.4109649658203125, -0.39253997802734375, -0.374114990234375, -0.35569000244140625, -0.3372650146484375, -0.31884002685546875, -0.3004150390625, -0.28199005126953125, -0.2635650634765625, -0.24514007568359375, -0.226715087890625, -0.20829010009765625, -0.1898651123046875, -0.17144012451171875, -0.15301513671875, -0.13459014892578125, -0.1161651611328125, -0.09774017333984375, -0.079315185546875, -0.06089019775390625, -0.0424652099609375, -0.02404022216796875, -0.005615234375, 0.01280975341796875, 0.0312347412109375, 0.04965972900390625, 0.068084716796875, 0.08650970458984375, 0.1049346923828125, 0.12335968017578125, 0.14178466796875, 0.16020965576171875, 0.1786346435546875, 0.19705963134765625, 0.215484619140625, 0.23390960693359375, 0.2523345947265625, 0.27075958251953125, 0.2891845703125, 0.30760955810546875, 0.3260345458984375, 0.34445953369140625, 0.362884521484375, 0.38130950927734375, 0.3997344970703125, 0.41815948486328125, 0.43658447265625, 0.45500946044921875, 0.4734344482421875, 0.49185943603515625, 0.510284423828125, 0.5287094116210938, 0.5471343994140625, 0.5655593872070312, 0.583984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 6.0, 8.0, 5.0, 4.0, 10.0, 12.0, 5.0, 4.0, 10.0, 16.0, 21.0, 21.0, 16.0, 25.0, 45.0, 27.0, 48.0, 33.0, 48.0, 52.0, 49.0, 43.0, 44.0, 43.0, 49.0, 47.0, 45.0, 29.0, 41.0, 32.0, 24.0, 23.0, 29.0, 10.0, 19.0, 11.0, 11.0, 8.0, 6.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.279296875, -0.2709312438964844, -0.26256561279296875, -0.2541999816894531, -0.2458343505859375, -0.23746871948242188, -0.22910308837890625, -0.22073745727539062, -0.212371826171875, -0.20400619506835938, -0.19564056396484375, -0.18727493286132812, -0.1789093017578125, -0.17054367065429688, -0.16217803955078125, -0.15381240844726562, -0.14544677734375, -0.13708114624023438, -0.12871551513671875, -0.12034988403320312, -0.1119842529296875, -0.10361862182617188, -0.09525299072265625, -0.08688735961914062, -0.078521728515625, -0.07015609741210938, -0.06179046630859375, -0.053424835205078125, -0.0450592041015625, -0.036693572998046875, -0.02832794189453125, -0.019962310791015625, -0.0115966796875, -0.003231048583984375, 0.00513458251953125, 0.013500213623046875, 0.0218658447265625, 0.030231475830078125, 0.03859710693359375, 0.046962738037109375, 0.055328369140625, 0.06369400024414062, 0.07205963134765625, 0.08042526245117188, 0.0887908935546875, 0.09715652465820312, 0.10552215576171875, 0.11388778686523438, 0.12225341796875, 0.13061904907226562, 0.13898468017578125, 0.14735031127929688, 0.1557159423828125, 0.16408157348632812, 0.17244720458984375, 0.18081283569335938, 0.189178466796875, 0.19754409790039062, 0.20590972900390625, 0.21427536010742188, 0.2226409912109375, 0.23100662231445312, 0.23937225341796875, 0.24773788452148438, 0.256103515625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 6.0, 11.0, 11.0, 21.0, 27.0, 23.0, 29.0, 38.0, 31.0, 39.0, 52.0, 58.0, 48.0, 71.0, 53.0, 50.0, 61.0, 42.0, 54.0, 45.0, 37.0, 34.0, 35.0, 21.0, 20.0, 20.0, 12.0, 12.0, 5.0, 9.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.990995407104492, -19.376527786254883, -18.76205825805664, -18.14759063720703, -17.533123016357422, -16.91865348815918, -16.30418586730957, -15.689717292785645, -15.075248718261719, -14.460780143737793, -13.846311569213867, -13.231843948364258, -12.617375373840332, -12.002906799316406, -11.388439178466797, -10.773970603942871, -10.159502029418945, -9.54503345489502, -8.930564880371094, -8.316097259521484, -7.701628684997559, -7.087160110473633, -6.472692012786865, -5.858223915100098, -5.243755340576172, -4.629286766052246, -4.0148186683654785, -3.400350332260132, -2.785881996154785, -2.1714136600494385, -1.5569453239440918, -0.9424772262573242, -0.3280067443847656, 0.28646159172058105, 0.9009299278259277, 1.5153982639312744, 2.129866600036621, 2.7443349361419678, 3.3588032722473145, 3.973271369934082, 4.587739944458008, 5.202208518981934, 5.816676616668701, 6.431144714355469, 7.0456132888793945, 7.66008186340332, 8.27454948425293, 8.889018058776855, 9.503486633300781, 10.117955207824707, 10.732423782348633, 11.346891403198242, 11.961359977722168, 12.575828552246094, 13.190296173095703, 13.804764747619629, 14.419233322143555, 15.03370189666748, 15.648170471191406, 16.262638092041016, 16.877105712890625, 17.491575241088867, 18.106042861938477, 18.72051239013672, 19.334980010986328]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 9.0, 5.0, 6.0, 6.0, 7.0, 17.0, 13.0, 12.0, 24.0, 38.0, 25.0, 21.0, 33.0, 36.0, 43.0, 36.0, 37.0, 42.0, 50.0, 47.0, 53.0, 40.0, 26.0, 48.0, 34.0, 37.0, 34.0, 30.0, 28.0, 33.0, 18.0, 17.0, 20.0, 15.0, 17.0, 11.0, 7.0, 7.0, 2.0, 4.0, 6.0, 8.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.317588806152344, -16.79276466369629, -16.267940521240234, -15.74311637878418, -15.218292236328125, -14.69346809387207, -14.168643951416016, -13.643819808959961, -13.118995666503906, -12.594171524047852, -12.069347381591797, -11.544523239135742, -11.019699096679688, -10.494874954223633, -9.970050811767578, -9.445226669311523, -8.920403480529785, -8.39557933807373, -7.870755195617676, -7.345931053161621, -6.821106910705566, -6.296282768249512, -5.771459102630615, -5.2466349601745605, -4.721810817718506, -4.196986675262451, -3.6721625328063965, -3.147338628768921, -2.622514486312866, -2.0976903438568115, -1.572866439819336, -1.0480422973632812, -0.5232181549072266, 0.0016059279441833496, 0.5264300107955933, 1.0512540340423584, 1.576078176498413, 2.1009023189544678, 2.6257262229919434, 3.150550365447998, 3.6753745079040527, 4.200198650360107, 4.725022792816162, 5.249846458435059, 5.774670600891113, 6.299494743347168, 6.824318885803223, 7.349143028259277, 7.873967170715332, 8.398791313171387, 8.923615455627441, 9.448439598083496, 9.97326374053955, 10.498087882995605, 11.022911071777344, 11.547735214233398, 12.072559356689453, 12.597383499145508, 13.122207641601562, 13.647031784057617, 14.171855926513672, 14.696680068969727, 15.221504211425781, 15.746328353881836, 16.27115249633789]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 10.0, 4.0, 8.0, 16.0, 32.0, 47.0, 65.0, 108.0, 177.0, 273.0, 403.0, 673.0, 1109.0, 1681.0, 2724.0, 4263.0, 6493.0, 10347.0, 15541.0, 23081.0, 32985.0, 45565.0, 60859.0, 76986.0, 91210.0, 101524.0, 104597.0, 101134.0, 90297.0, 75833.0, 59301.0, 44277.0, 32369.0, 22118.0, 14791.0, 9981.0, 6481.0, 4103.0, 2647.0, 1665.0, 1031.0, 629.0, 440.0, 274.0, 147.0, 110.0, 61.0, 35.0, 25.0, 20.0, 6.0, 7.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-12.7265625, -12.33447265625, -11.9423828125, -11.55029296875, -11.158203125, -10.76611328125, -10.3740234375, -9.98193359375, -9.58984375, -9.19775390625, -8.8056640625, -8.41357421875, -8.021484375, -7.62939453125, -7.2373046875, -6.84521484375, -6.453125, -6.06103515625, -5.6689453125, -5.27685546875, -4.884765625, -4.49267578125, -4.1005859375, -3.70849609375, -3.31640625, -2.92431640625, -2.5322265625, -2.14013671875, -1.748046875, -1.35595703125, -0.9638671875, -0.57177734375, -0.1796875, 0.21240234375, 0.6044921875, 0.99658203125, 1.388671875, 1.78076171875, 2.1728515625, 2.56494140625, 2.95703125, 3.34912109375, 3.7412109375, 4.13330078125, 4.525390625, 4.91748046875, 5.3095703125, 5.70166015625, 6.09375, 6.48583984375, 6.8779296875, 7.27001953125, 7.662109375, 8.05419921875, 8.4462890625, 8.83837890625, 9.23046875, 9.62255859375, 10.0146484375, 10.40673828125, 10.798828125, 11.19091796875, 11.5830078125, 11.97509765625, 12.3671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 10.0, 5.0, 5.0, 6.0, 9.0, 16.0, 13.0, 13.0, 20.0, 35.0, 27.0, 22.0, 30.0, 40.0, 36.0, 42.0, 39.0, 39.0, 50.0, 39.0, 61.0, 37.0, 31.0, 46.0, 32.0, 33.0, 43.0, 32.0, 21.0, 36.0, 17.0, 18.0, 23.0, 16.0, 16.0, 10.0, 5.0, 9.0, 3.0, 5.0, 5.0, 8.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.765625, -16.2591552734375, -15.752685546875, -15.2462158203125, -14.73974609375, -14.2332763671875, -13.726806640625, -13.2203369140625, -12.7138671875, -12.2073974609375, -11.700927734375, -11.1944580078125, -10.68798828125, -10.1815185546875, -9.675048828125, -9.1685791015625, -8.662109375, -8.1556396484375, -7.649169921875, -7.1427001953125, -6.63623046875, -6.1297607421875, -5.623291015625, -5.1168212890625, -4.6103515625, -4.1038818359375, -3.597412109375, -3.0909423828125, -2.58447265625, -2.0780029296875, -1.571533203125, -1.0650634765625, -0.55859375, -0.0521240234375, 0.454345703125, 0.9608154296875, 1.46728515625, 1.9737548828125, 2.480224609375, 2.9866943359375, 3.4931640625, 3.9996337890625, 4.506103515625, 5.0125732421875, 5.51904296875, 6.0255126953125, 6.531982421875, 7.0384521484375, 7.544921875, 8.0513916015625, 8.557861328125, 9.0643310546875, 9.57080078125, 10.0772705078125, 10.583740234375, 11.0902099609375, 11.5966796875, 12.1031494140625, 12.609619140625, 13.1160888671875, 13.62255859375, 14.1290283203125, 14.635498046875, 15.1419677734375, 15.6484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 9.0, 16.0, 31.0, 55.0, 92.0, 147.0, 258.0, 519.0, 1025.0, 1864.0, 3577.0, 6802.0, 12711.0, 22577.0, 39512.0, 63975.0, 96170.0, 128977.0, 150056.0, 149019.0, 126711.0, 94659.0, 62958.0, 38317.0, 22321.0, 12242.0, 6514.0, 3494.0, 1870.0, 1004.0, 508.0, 253.0, 142.0, 80.0, 37.0, 28.0, 14.0, 9.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.796875, -15.251708984375, -14.70654296875, -14.161376953125, -13.6162109375, -13.071044921875, -12.52587890625, -11.980712890625, -11.435546875, -10.890380859375, -10.34521484375, -9.800048828125, -9.2548828125, -8.709716796875, -8.16455078125, -7.619384765625, -7.07421875, -6.529052734375, -5.98388671875, -5.438720703125, -4.8935546875, -4.348388671875, -3.80322265625, -3.258056640625, -2.712890625, -2.167724609375, -1.62255859375, -1.077392578125, -0.5322265625, 0.012939453125, 0.55810546875, 1.103271484375, 1.6484375, 2.193603515625, 2.73876953125, 3.283935546875, 3.8291015625, 4.374267578125, 4.91943359375, 5.464599609375, 6.009765625, 6.554931640625, 7.10009765625, 7.645263671875, 8.1904296875, 8.735595703125, 9.28076171875, 9.825927734375, 10.37109375, 10.916259765625, 11.46142578125, 12.006591796875, 12.5517578125, 13.096923828125, 13.64208984375, 14.187255859375, 14.732421875, 15.277587890625, 15.82275390625, 16.367919921875, 16.9130859375, 17.458251953125, 18.00341796875, 18.548583984375, 19.09375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 5.0, 6.0, 5.0, 12.0, 10.0, 13.0, 24.0, 11.0, 17.0, 25.0, 26.0, 34.0, 31.0, 20.0, 39.0, 42.0, 41.0, 50.0, 40.0, 47.0, 34.0, 36.0, 42.0, 35.0, 54.0, 40.0, 44.0, 30.0, 34.0, 27.0, 21.0, 20.0, 16.0, 12.0, 18.0, 9.0, 6.0, 5.0, 5.0, 8.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.625, -10.2828369140625, -9.940673828125, -9.5985107421875, -9.25634765625, -8.9141845703125, -8.572021484375, -8.2298583984375, -7.8876953125, -7.5455322265625, -7.203369140625, -6.8612060546875, -6.51904296875, -6.1768798828125, -5.834716796875, -5.4925537109375, -5.150390625, -4.8082275390625, -4.466064453125, -4.1239013671875, -3.78173828125, -3.4395751953125, -3.097412109375, -2.7552490234375, -2.4130859375, -2.0709228515625, -1.728759765625, -1.3865966796875, -1.04443359375, -0.7022705078125, -0.360107421875, -0.0179443359375, 0.32421875, 0.6663818359375, 1.008544921875, 1.3507080078125, 1.69287109375, 2.0350341796875, 2.377197265625, 2.7193603515625, 3.0615234375, 3.4036865234375, 3.745849609375, 4.0880126953125, 4.43017578125, 4.7723388671875, 5.114501953125, 5.4566650390625, 5.798828125, 6.1409912109375, 6.483154296875, 6.8253173828125, 7.16748046875, 7.5096435546875, 7.851806640625, 8.1939697265625, 8.5361328125, 8.8782958984375, 9.220458984375, 9.5626220703125, 9.90478515625, 10.2469482421875, 10.589111328125, 10.9312744140625, 11.2734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 7.0, 6.0, 13.0, 12.0, 28.0, 36.0, 57.0, 76.0, 100.0, 141.0, 285.0, 436.0, 745.0, 1218.0, 2156.0, 3843.0, 6685.0, 11823.0, 20256.0, 35324.0, 57684.0, 88717.0, 122100.0, 147469.0, 151530.0, 132030.0, 100050.0, 67168.0, 41480.0, 24354.0, 14052.0, 7805.0, 4478.0, 2579.0, 1489.0, 880.0, 498.0, 357.0, 205.0, 136.0, 71.0, 60.0, 39.0, 19.0, 20.0, 8.0, 9.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.01953125, -5.82635498046875, -5.6331787109375, -5.44000244140625, -5.246826171875, -5.05364990234375, -4.8604736328125, -4.66729736328125, -4.47412109375, -4.28094482421875, -4.0877685546875, -3.89459228515625, -3.701416015625, -3.50823974609375, -3.3150634765625, -3.12188720703125, -2.9287109375, -2.73553466796875, -2.5423583984375, -2.34918212890625, -2.156005859375, -1.96282958984375, -1.7696533203125, -1.57647705078125, -1.38330078125, -1.19012451171875, -0.9969482421875, -0.80377197265625, -0.610595703125, -0.41741943359375, -0.2242431640625, -0.03106689453125, 0.162109375, 0.35528564453125, 0.5484619140625, 0.74163818359375, 0.934814453125, 1.12799072265625, 1.3211669921875, 1.51434326171875, 1.70751953125, 1.90069580078125, 2.0938720703125, 2.28704833984375, 2.480224609375, 2.67340087890625, 2.8665771484375, 3.05975341796875, 3.2529296875, 3.44610595703125, 3.6392822265625, 3.83245849609375, 4.025634765625, 4.21881103515625, 4.4119873046875, 4.60516357421875, 4.79833984375, 4.99151611328125, 5.1846923828125, 5.37786865234375, 5.571044921875, 5.76422119140625, 5.9573974609375, 6.15057373046875, 6.34375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 7.0, 8.0, 6.0, 11.0, 9.0, 6.0, 21.0, 11.0, 31.0, 20.0, 34.0, 47.0, 45.0, 69.0, 47.0, 72.0, 54.0, 54.0, 55.0, 61.0, 58.0, 56.0, 42.0, 42.0, 24.0, 24.0, 20.0, 18.0, 12.0, 9.0, 8.0, 3.0, 5.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007781982421875, -0.0007561147212982178, -0.0007340312004089355, -0.0007119476795196533, -0.0006898641586303711, -0.0006677806377410889, -0.0006456971168518066, -0.0006236135959625244, -0.0006015300750732422, -0.00057944655418396, -0.0005573630332946777, -0.0005352795124053955, -0.0005131959915161133, -0.0004911124706268311, -0.00046902894973754883, -0.0004469454288482666, -0.0004248619079589844, -0.00040277838706970215, -0.0003806948661804199, -0.0003586113452911377, -0.00033652782440185547, -0.00031444430351257324, -0.000292360782623291, -0.0002702772617340088, -0.00024819374084472656, -0.00022611021995544434, -0.0002040266990661621, -0.00018194317817687988, -0.00015985965728759766, -0.00013777613639831543, -0.0001156926155090332, -9.360909461975098e-05, -7.152557373046875e-05, -4.9442052841186523e-05, -2.7358531951904297e-05, -5.27501106262207e-06, 1.6808509826660156e-05, 3.889203071594238e-05, 6.097555160522461e-05, 8.305907249450684e-05, 0.00010514259338378906, 0.0001272261142730713, 0.00014930963516235352, 0.00017139315605163574, 0.00019347667694091797, 0.0002155601978302002, 0.00023764371871948242, 0.00025972723960876465, 0.0002818107604980469, 0.0003038942813873291, 0.00032597780227661133, 0.00034806132316589355, 0.0003701448440551758, 0.000392228364944458, 0.00041431188583374023, 0.00043639540672302246, 0.0004584789276123047, 0.0004805624485015869, 0.0005026459693908691, 0.0005247294902801514, 0.0005468130111694336, 0.0005688965320587158, 0.000590980052947998, 0.0006130635738372803, 0.0006351470947265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 4.0, 3.0, 15.0, 15.0, 13.0, 31.0, 36.0, 42.0, 74.0, 104.0, 156.0, 205.0, 329.0, 450.0, 678.0, 1019.0, 1514.0, 2379.0, 3671.0, 5821.0, 9094.0, 14178.0, 23112.0, 35815.0, 55178.0, 79558.0, 106460.0, 127471.0, 135449.0, 124833.0, 102054.0, 75619.0, 51336.0, 33402.0, 21075.0, 13504.0, 8517.0, 5223.0, 3529.0, 2118.0, 1445.0, 998.0, 650.0, 432.0, 305.0, 212.0, 121.0, 102.0, 72.0, 47.0, 31.0, 20.0, 20.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.125, -5.9300537109375, -5.735107421875, -5.5401611328125, -5.34521484375, -5.1502685546875, -4.955322265625, -4.7603759765625, -4.5654296875, -4.3704833984375, -4.175537109375, -3.9805908203125, -3.78564453125, -3.5906982421875, -3.395751953125, -3.2008056640625, -3.005859375, -2.8109130859375, -2.615966796875, -2.4210205078125, -2.22607421875, -2.0311279296875, -1.836181640625, -1.6412353515625, -1.4462890625, -1.2513427734375, -1.056396484375, -0.8614501953125, -0.66650390625, -0.4715576171875, -0.276611328125, -0.0816650390625, 0.11328125, 0.3082275390625, 0.503173828125, 0.6981201171875, 0.89306640625, 1.0880126953125, 1.282958984375, 1.4779052734375, 1.6728515625, 1.8677978515625, 2.062744140625, 2.2576904296875, 2.45263671875, 2.6475830078125, 2.842529296875, 3.0374755859375, 3.232421875, 3.4273681640625, 3.622314453125, 3.8172607421875, 4.01220703125, 4.2071533203125, 4.402099609375, 4.5970458984375, 4.7919921875, 4.9869384765625, 5.181884765625, 5.3768310546875, 5.57177734375, 5.7667236328125, 5.961669921875, 6.1566162109375, 6.3515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 0.0, 4.0, 5.0, 5.0, 2.0, 8.0, 6.0, 13.0, 4.0, 19.0, 31.0, 25.0, 38.0, 30.0, 35.0, 41.0, 59.0, 46.0, 52.0, 60.0, 68.0, 51.0, 58.0, 46.0, 47.0, 45.0, 31.0, 28.0, 29.0, 25.0, 18.0, 18.0, 12.0, 13.0, 8.0, 7.0, 6.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.93359375, -2.839447021484375, -2.74530029296875, -2.651153564453125, -2.5570068359375, -2.462860107421875, -2.36871337890625, -2.274566650390625, -2.180419921875, -2.086273193359375, -1.99212646484375, -1.897979736328125, -1.8038330078125, -1.709686279296875, -1.61553955078125, -1.521392822265625, -1.42724609375, -1.333099365234375, -1.23895263671875, -1.144805908203125, -1.0506591796875, -0.956512451171875, -0.86236572265625, -0.768218994140625, -0.674072265625, -0.579925537109375, -0.48577880859375, -0.391632080078125, -0.2974853515625, -0.203338623046875, -0.10919189453125, -0.015045166015625, 0.0791015625, 0.173248291015625, 0.26739501953125, 0.361541748046875, 0.4556884765625, 0.549835205078125, 0.64398193359375, 0.738128662109375, 0.832275390625, 0.926422119140625, 1.02056884765625, 1.114715576171875, 1.2088623046875, 1.303009033203125, 1.39715576171875, 1.491302490234375, 1.58544921875, 1.679595947265625, 1.77374267578125, 1.867889404296875, 1.9620361328125, 2.056182861328125, 2.15032958984375, 2.244476318359375, 2.338623046875, 2.432769775390625, 2.52691650390625, 2.621063232421875, 2.7152099609375, 2.809356689453125, 2.90350341796875, 2.997650146484375, 3.091796875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 10.0, 12.0, 13.0, 17.0, 24.0, 24.0, 34.0, 40.0, 49.0, 49.0, 48.0, 64.0, 62.0, 50.0, 51.0, 62.0, 41.0, 55.0, 46.0, 35.0, 57.0, 25.0, 23.0, 15.0, 17.0, 15.0, 17.0, 9.0, 6.0, 10.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.09556770324707, -18.480003356933594, -17.864437103271484, -17.248872756958008, -16.6333065032959, -16.017742156982422, -15.402176856994629, -14.786611557006836, -14.171046257019043, -13.55548095703125, -12.939915657043457, -12.324350357055664, -11.708786010742188, -11.093219757080078, -10.477655410766602, -9.862090110778809, -9.246524810791016, -8.630959510803223, -8.01539421081543, -7.399829387664795, -6.784264087677002, -6.168698787689209, -5.553133964538574, -4.937568664550781, -4.322003364562988, -3.7064380645751953, -3.0908730030059814, -2.4753079414367676, -1.8597426414489746, -1.2441773414611816, -0.6286122798919678, -0.013047218322753906, 0.6025161743164062, 1.2180813550949097, 1.833646535873413, 2.449211597442627, 3.06477689743042, 3.680342197418213, 4.295907020568848, 4.911472320556641, 5.527037620544434, 6.142602920532227, 6.7581682205200195, 7.373733043670654, 7.989298343658447, 8.604864120483398, 9.220428466796875, 9.835993766784668, 10.451559066772461, 11.067124366760254, 11.682689666748047, 12.29825496673584, 12.913820266723633, 13.52938461303711, 14.144949913024902, 14.760515213012695, 15.376080513000488, 15.991645812988281, 16.607210159301758, 17.222776412963867, 17.838340759277344, 18.453907012939453, 19.06947135925293, 19.685035705566406, 20.300601959228516]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 4.0, 8.0, 6.0, 10.0, 15.0, 11.0, 10.0, 18.0, 25.0, 21.0, 20.0, 28.0, 22.0, 36.0, 32.0, 29.0, 43.0, 32.0, 39.0, 41.0, 27.0, 35.0, 43.0, 36.0, 36.0, 42.0, 29.0, 29.0, 29.0, 30.0, 19.0, 23.0, 23.0, 19.0, 21.0, 18.0, 14.0, 13.0, 10.0, 10.0, 6.0, 6.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.203418731689453, -13.735404014587402, -13.267388343811035, -12.799373626708984, -12.331357955932617, -11.863343238830566, -11.395328521728516, -10.927312850952148, -10.459298133850098, -9.991283416748047, -9.52326774597168, -9.055253028869629, -8.587238311767578, -8.119222640991211, -7.65120792388916, -7.183192729949951, -6.715177536010742, -6.247162342071533, -5.779147148132324, -5.311132431030273, -4.8431172370910645, -4.3751020431518555, -3.9070870876312256, -3.4390721321105957, -2.9710569381713867, -2.5030417442321777, -2.035026788711548, -1.5670117139816284, -1.098996639251709, -0.6309814453125, -0.16296648979187012, 0.30504846572875977, 0.7730636596679688, 1.2410787343978882, 1.7090938091278076, 2.1771087646484375, 2.6451239585876465, 3.1131391525268555, 3.5811541080474854, 4.049169063568115, 4.517184257507324, 4.985199451446533, 5.453214645385742, 5.921229362487793, 6.389244556427002, 6.857259750366211, 7.325274467468262, 7.793289661407471, 8.26130485534668, 8.72931957244873, 9.197335243225098, 9.665349960327148, 10.133365631103516, 10.601380348205566, 11.069395065307617, 11.537410736083984, 12.005425453186035, 12.473440170288086, 12.941455841064453, 13.409470558166504, 13.877485275268555, 14.345500946044922, 14.813515663146973, 15.281530380249023, 15.74954605102539]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 9.0, 8.0, 14.0, 28.0, 27.0, 53.0, 73.0, 106.0, 210.0, 282.0, 450.0, 736.0, 1243.0, 1952.0, 3126.0, 5145.0, 8704.0, 14289.0, 24278.0, 41046.0, 69269.0, 117538.0, 191491.0, 299084.0, 427131.0, 542616.0, 596287.0, 557862.0, 448609.0, 317390.0, 207205.0, 127400.0, 77197.0, 45880.0, 26935.0, 16017.0, 9556.0, 5849.0, 3513.0, 2126.0, 1363.0, 809.0, 548.0, 313.0, 181.0, 114.0, 80.0, 58.0, 33.0, 22.0, 13.0, 9.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-16.015625, -15.524169921875, -15.03271484375, -14.541259765625, -14.0498046875, -13.558349609375, -13.06689453125, -12.575439453125, -12.083984375, -11.592529296875, -11.10107421875, -10.609619140625, -10.1181640625, -9.626708984375, -9.13525390625, -8.643798828125, -8.15234375, -7.660888671875, -7.16943359375, -6.677978515625, -6.1865234375, -5.695068359375, -5.20361328125, -4.712158203125, -4.220703125, -3.729248046875, -3.23779296875, -2.746337890625, -2.2548828125, -1.763427734375, -1.27197265625, -0.780517578125, -0.2890625, 0.202392578125, 0.69384765625, 1.185302734375, 1.6767578125, 2.168212890625, 2.65966796875, 3.151123046875, 3.642578125, 4.134033203125, 4.62548828125, 5.116943359375, 5.6083984375, 6.099853515625, 6.59130859375, 7.082763671875, 7.57421875, 8.065673828125, 8.55712890625, 9.048583984375, 9.5400390625, 10.031494140625, 10.52294921875, 11.014404296875, 11.505859375, 11.997314453125, 12.48876953125, 12.980224609375, 13.4716796875, 13.963134765625, 14.45458984375, 14.946044921875, 15.4375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 3.0, 13.0, 9.0, 10.0, 13.0, 14.0, 24.0, 23.0, 20.0, 24.0, 31.0, 23.0, 33.0, 38.0, 38.0, 33.0, 35.0, 39.0, 38.0, 34.0, 36.0, 31.0, 40.0, 44.0, 33.0, 27.0, 27.0, 28.0, 26.0, 19.0, 23.0, 20.0, 21.0, 22.0, 13.0, 10.0, 15.0, 10.0, 6.0, 8.0, 5.0, 6.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.75, -12.334716796875, -11.91943359375, -11.504150390625, -11.0888671875, -10.673583984375, -10.25830078125, -9.843017578125, -9.427734375, -9.012451171875, -8.59716796875, -8.181884765625, -7.7666015625, -7.351318359375, -6.93603515625, -6.520751953125, -6.10546875, -5.690185546875, -5.27490234375, -4.859619140625, -4.4443359375, -4.029052734375, -3.61376953125, -3.198486328125, -2.783203125, -2.367919921875, -1.95263671875, -1.537353515625, -1.1220703125, -0.706787109375, -0.29150390625, 0.123779296875, 0.5390625, 0.954345703125, 1.36962890625, 1.784912109375, 2.2001953125, 2.615478515625, 3.03076171875, 3.446044921875, 3.861328125, 4.276611328125, 4.69189453125, 5.107177734375, 5.5224609375, 5.937744140625, 6.35302734375, 6.768310546875, 7.18359375, 7.598876953125, 8.01416015625, 8.429443359375, 8.8447265625, 9.260009765625, 9.67529296875, 10.090576171875, 10.505859375, 10.921142578125, 11.33642578125, 11.751708984375, 12.1669921875, 12.582275390625, 12.99755859375, 13.412841796875, 13.828125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 13.0, 15.0, 22.0, 44.0, 91.0, 129.0, 246.0, 376.0, 653.0, 1059.0, 1881.0, 3268.0, 5362.0, 9268.0, 16175.0, 27553.0, 48146.0, 81080.0, 134173.0, 213468.0, 319194.0, 437550.0, 532559.0, 570728.0, 527823.0, 428788.0, 310163.0, 207141.0, 130008.0, 77826.0, 46000.0, 26556.0, 15427.0, 8936.0, 5089.0, 3077.0, 1787.0, 1087.0, 622.0, 374.0, 213.0, 132.0, 84.0, 41.0, 30.0, 13.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-16.984375, -16.461181640625, -15.93798828125, -15.414794921875, -14.8916015625, -14.368408203125, -13.84521484375, -13.322021484375, -12.798828125, -12.275634765625, -11.75244140625, -11.229248046875, -10.7060546875, -10.182861328125, -9.65966796875, -9.136474609375, -8.61328125, -8.090087890625, -7.56689453125, -7.043701171875, -6.5205078125, -5.997314453125, -5.47412109375, -4.950927734375, -4.427734375, -3.904541015625, -3.38134765625, -2.858154296875, -2.3349609375, -1.811767578125, -1.28857421875, -0.765380859375, -0.2421875, 0.281005859375, 0.80419921875, 1.327392578125, 1.8505859375, 2.373779296875, 2.89697265625, 3.420166015625, 3.943359375, 4.466552734375, 4.98974609375, 5.512939453125, 6.0361328125, 6.559326171875, 7.08251953125, 7.605712890625, 8.12890625, 8.652099609375, 9.17529296875, 9.698486328125, 10.2216796875, 10.744873046875, 11.26806640625, 11.791259765625, 12.314453125, 12.837646484375, 13.36083984375, 13.884033203125, 14.4072265625, 14.930419921875, 15.45361328125, 15.976806640625, 16.5]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 6.0, 14.0, 16.0, 15.0, 27.0, 24.0, 39.0, 47.0, 51.0, 64.0, 85.0, 118.0, 123.0, 131.0, 140.0, 171.0, 201.0, 198.0, 218.0, 205.0, 202.0, 205.0, 189.0, 178.0, 178.0, 175.0, 162.0, 134.0, 129.0, 110.0, 97.0, 95.0, 50.0, 50.0, 42.0, 30.0, 37.0, 25.0, 22.0, 17.0, 18.0, 7.0, 5.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-6.72265625, -6.51177978515625, -6.3009033203125, -6.09002685546875, -5.879150390625, -5.66827392578125, -5.4573974609375, -5.24652099609375, -5.03564453125, -4.82476806640625, -4.6138916015625, -4.40301513671875, -4.192138671875, -3.98126220703125, -3.7703857421875, -3.55950927734375, -3.3486328125, -3.13775634765625, -2.9268798828125, -2.71600341796875, -2.505126953125, -2.29425048828125, -2.0833740234375, -1.87249755859375, -1.66162109375, -1.45074462890625, -1.2398681640625, -1.02899169921875, -0.818115234375, -0.60723876953125, -0.3963623046875, -0.18548583984375, 0.025390625, 0.23626708984375, 0.4471435546875, 0.65802001953125, 0.868896484375, 1.07977294921875, 1.2906494140625, 1.50152587890625, 1.71240234375, 1.92327880859375, 2.1341552734375, 2.34503173828125, 2.555908203125, 2.76678466796875, 2.9776611328125, 3.18853759765625, 3.3994140625, 3.61029052734375, 3.8211669921875, 4.03204345703125, 4.242919921875, 4.45379638671875, 4.6646728515625, 4.87554931640625, 5.08642578125, 5.29730224609375, 5.5081787109375, 5.71905517578125, 5.929931640625, 6.14080810546875, 6.3516845703125, 6.56256103515625, 6.7734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 5.0, 6.0, 9.0, 5.0, 12.0, 13.0, 14.0, 10.0, 18.0, 42.0, 28.0, 39.0, 33.0, 49.0, 54.0, 32.0, 33.0, 40.0, 46.0, 45.0, 61.0, 50.0, 49.0, 45.0, 29.0, 36.0, 30.0, 29.0, 31.0, 33.0, 11.0, 13.0, 13.0, 7.0, 5.0, 8.0, 5.0, 9.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.272865295410156, -16.7117977142334, -16.150728225708008, -15.589659690856934, -15.02859115600586, -14.467523574829102, -13.906455039978027, -13.345386505126953, -12.784317970275879, -12.223249435424805, -11.66218090057373, -11.101112365722656, -10.540044784545898, -9.978975296020508, -9.41790771484375, -8.856839179992676, -8.295770645141602, -7.734702110290527, -7.173633575439453, -6.612565517425537, -6.051496982574463, -5.490428447723389, -4.929360389709473, -4.368291854858398, -3.807223320007324, -3.24615478515625, -2.685086488723755, -2.1240181922912598, -1.5629496574401855, -1.0018811225891113, -0.4408128261566162, 0.1202554702758789, 0.6813240051269531, 1.2423924207687378, 1.8034608364105225, 2.3645291328430176, 2.925597667694092, 3.486666202545166, 4.047734260559082, 4.608802795410156, 5.1698713302612305, 5.730939865112305, 6.292008399963379, 6.853076457977295, 7.414144992828369, 7.975213527679443, 8.53628158569336, 9.097350120544434, 9.658418655395508, 10.219487190246582, 10.780555725097656, 11.34162425994873, 11.902692794799805, 12.463760375976562, 13.024828910827637, 13.585897445678711, 14.146965980529785, 14.70803451538086, 15.269103050231934, 15.830171585083008, 16.391239166259766, 16.952308654785156, 17.513376235961914, 18.074443817138672, 18.635513305664062]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 5.0, 4.0, 7.0, 11.0, 7.0, 11.0, 18.0, 18.0, 10.0, 26.0, 19.0, 28.0, 20.0, 27.0, 26.0, 35.0, 34.0, 20.0, 36.0, 33.0, 36.0, 42.0, 35.0, 40.0, 30.0, 50.0, 32.0, 35.0, 29.0, 33.0, 26.0, 25.0, 18.0, 18.0, 16.0, 18.0, 22.0, 19.0, 11.0, 8.0, 6.0, 7.0, 11.0, 7.0, 4.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.895451545715332, -12.44568920135498, -11.995927810668945, -11.546165466308594, -11.096403121948242, -10.64664077758789, -10.196878433227539, -9.747117042541504, -9.297354698181152, -8.8475923538208, -8.397830963134766, -7.948068618774414, -7.4983062744140625, -7.048543930053711, -6.598782062530518, -6.149020195007324, -5.699257850646973, -5.249495506286621, -4.799733638763428, -4.349971771240234, -3.900209426879883, -3.4504473209381104, -3.000685214996338, -2.5509231090545654, -2.101161003112793, -1.6513988971710205, -1.201636791229248, -0.7518746852874756, -0.3021125793457031, 0.14764952659606934, 0.5974116325378418, 1.0471737384796143, 1.4969358444213867, 1.9466979503631592, 2.3964600563049316, 2.846222162246704, 3.2959842681884766, 3.745746374130249, 4.1955084800720215, 4.645270347595215, 5.095032691955566, 5.544795036315918, 5.994556903839111, 6.444318771362305, 6.894081115722656, 7.343843460083008, 7.793605327606201, 8.243367195129395, 8.693129539489746, 9.142891883850098, 9.592653274536133, 10.042415618896484, 10.492177963256836, 10.941940307617188, 11.391702651977539, 11.841464042663574, 12.291226387023926, 12.740988731384277, 13.190750122070312, 13.640512466430664, 14.090274810791016, 14.540037155151367, 14.989799499511719, 15.439560890197754, 15.889323234558105]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 20.0, 20.0, 39.0, 42.0, 47.0, 104.0, 141.0, 202.0, 272.0, 473.0, 793.0, 1179.0, 1807.0, 2805.0, 4568.0, 6996.0, 11248.0, 17756.0, 27522.0, 41374.0, 60863.0, 84767.0, 108599.0, 126322.0, 129429.0, 116986.0, 94449.0, 70153.0, 48982.0, 32575.0, 21302.0, 13339.0, 8534.0, 5392.0, 3432.0, 2138.0, 1334.0, 835.0, 592.0, 356.0, 280.0, 167.0, 101.0, 66.0, 64.0, 33.0, 19.0, 10.0, 7.0, 5.0, 8.0, 3.0, 5.0, 1.0, 2.0, 3.0], "bins": [-3.126953125, -3.02984619140625, -2.9327392578125, -2.83563232421875, -2.738525390625, -2.64141845703125, -2.5443115234375, -2.44720458984375, -2.35009765625, -2.25299072265625, -2.1558837890625, -2.05877685546875, -1.961669921875, -1.86456298828125, -1.7674560546875, -1.67034912109375, -1.5732421875, -1.47613525390625, -1.3790283203125, -1.28192138671875, -1.184814453125, -1.08770751953125, -0.9906005859375, -0.89349365234375, -0.79638671875, -0.69927978515625, -0.6021728515625, -0.50506591796875, -0.407958984375, -0.31085205078125, -0.2137451171875, -0.11663818359375, -0.01953125, 0.07757568359375, 0.1746826171875, 0.27178955078125, 0.368896484375, 0.46600341796875, 0.5631103515625, 0.66021728515625, 0.75732421875, 0.85443115234375, 0.9515380859375, 1.04864501953125, 1.145751953125, 1.24285888671875, 1.3399658203125, 1.43707275390625, 1.5341796875, 1.63128662109375, 1.7283935546875, 1.82550048828125, 1.922607421875, 2.01971435546875, 2.1168212890625, 2.21392822265625, 2.31103515625, 2.40814208984375, 2.5052490234375, 2.60235595703125, 2.699462890625, 2.79656982421875, 2.8936767578125, 2.99078369140625, 3.087890625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 7.0, 3.0, 5.0, 4.0, 7.0, 11.0, 7.0, 12.0, 15.0, 18.0, 13.0, 24.0, 20.0, 26.0, 21.0, 26.0, 28.0, 35.0, 33.0, 20.0, 36.0, 35.0, 34.0, 40.0, 39.0, 37.0, 30.0, 49.0, 32.0, 37.0, 28.0, 35.0, 24.0, 24.0, 19.0, 17.0, 19.0, 17.0, 21.0, 20.0, 11.0, 8.0, 6.0, 8.0, 11.0, 7.0, 4.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.921875, -12.472412109375, -12.02294921875, -11.573486328125, -11.1240234375, -10.674560546875, -10.22509765625, -9.775634765625, -9.326171875, -8.876708984375, -8.42724609375, -7.977783203125, -7.5283203125, -7.078857421875, -6.62939453125, -6.179931640625, -5.73046875, -5.281005859375, -4.83154296875, -4.382080078125, -3.9326171875, -3.483154296875, -3.03369140625, -2.584228515625, -2.134765625, -1.685302734375, -1.23583984375, -0.786376953125, -0.3369140625, 0.112548828125, 0.56201171875, 1.011474609375, 1.4609375, 1.910400390625, 2.35986328125, 2.809326171875, 3.2587890625, 3.708251953125, 4.15771484375, 4.607177734375, 5.056640625, 5.506103515625, 5.95556640625, 6.405029296875, 6.8544921875, 7.303955078125, 7.75341796875, 8.202880859375, 8.65234375, 9.101806640625, 9.55126953125, 10.000732421875, 10.4501953125, 10.899658203125, 11.34912109375, 11.798583984375, 12.248046875, 12.697509765625, 13.14697265625, 13.596435546875, 14.0458984375, 14.495361328125, 14.94482421875, 15.394287109375, 15.84375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 4.0, 5.0, 9.0, 8.0, 13.0, 18.0, 27.0, 37.0, 38.0, 69.0, 77.0, 101.0, 141.0, 208.0, 261.0, 377.0, 528.0, 799.0, 1078.0, 1580.0, 2416.0, 3655.0, 5650.0, 8871.0, 14135.0, 24272.0, 75351.0, 796897.0, 52675.0, 22014.0, 13097.0, 8026.0, 5399.0, 3418.0, 2207.0, 1511.0, 1009.0, 748.0, 543.0, 369.0, 251.0, 186.0, 106.0, 107.0, 67.0, 52.0, 47.0, 26.0, 18.0, 11.0, 9.0, 10.0, 11.0, 3.0, 3.0, 4.0, 0.0, 7.0], "bins": [-7.92578125, -7.68865966796875, -7.4515380859375, -7.21441650390625, -6.977294921875, -6.74017333984375, -6.5030517578125, -6.26593017578125, -6.02880859375, -5.79168701171875, -5.5545654296875, -5.31744384765625, -5.080322265625, -4.84320068359375, -4.6060791015625, -4.36895751953125, -4.1318359375, -3.89471435546875, -3.6575927734375, -3.42047119140625, -3.183349609375, -2.94622802734375, -2.7091064453125, -2.47198486328125, -2.23486328125, -1.99774169921875, -1.7606201171875, -1.52349853515625, -1.286376953125, -1.04925537109375, -0.8121337890625, -0.57501220703125, -0.337890625, -0.10076904296875, 0.1363525390625, 0.37347412109375, 0.610595703125, 0.84771728515625, 1.0848388671875, 1.32196044921875, 1.55908203125, 1.79620361328125, 2.0333251953125, 2.27044677734375, 2.507568359375, 2.74468994140625, 2.9818115234375, 3.21893310546875, 3.4560546875, 3.69317626953125, 3.9302978515625, 4.16741943359375, 4.404541015625, 4.64166259765625, 4.8787841796875, 5.11590576171875, 5.35302734375, 5.59014892578125, 5.8272705078125, 6.06439208984375, 6.301513671875, 6.53863525390625, 6.7757568359375, 7.01287841796875, 7.25]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 11.0, 10.0, 6.0, 7.0, 13.0, 16.0, 16.0, 16.0, 20.0, 11.0, 24.0, 30.0, 30.0, 22.0, 32.0, 38.0, 39.0, 33.0, 38.0, 40.0, 36.0, 37.0, 31.0, 44.0, 36.0, 30.0, 29.0, 39.0, 30.0, 23.0, 31.0, 29.0, 29.0, 23.0, 18.0, 5.0, 18.0, 8.0, 10.0, 14.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.7265625, -9.4117431640625, -9.096923828125, -8.7821044921875, -8.46728515625, -8.1524658203125, -7.837646484375, -7.5228271484375, -7.2080078125, -6.8931884765625, -6.578369140625, -6.2635498046875, -5.94873046875, -5.6339111328125, -5.319091796875, -5.0042724609375, -4.689453125, -4.3746337890625, -4.059814453125, -3.7449951171875, -3.43017578125, -3.1153564453125, -2.800537109375, -2.4857177734375, -2.1708984375, -1.8560791015625, -1.541259765625, -1.2264404296875, -0.91162109375, -0.5968017578125, -0.281982421875, 0.0328369140625, 0.34765625, 0.6624755859375, 0.977294921875, 1.2921142578125, 1.60693359375, 1.9217529296875, 2.236572265625, 2.5513916015625, 2.8662109375, 3.1810302734375, 3.495849609375, 3.8106689453125, 4.12548828125, 4.4403076171875, 4.755126953125, 5.0699462890625, 5.384765625, 5.6995849609375, 6.014404296875, 6.3292236328125, 6.64404296875, 6.9588623046875, 7.273681640625, 7.5885009765625, 7.9033203125, 8.2181396484375, 8.532958984375, 8.8477783203125, 9.16259765625, 9.4774169921875, 9.792236328125, 10.1070556640625, 10.421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 0.0, 4.0, 5.0, 6.0, 6.0, 11.0, 11.0, 11.0, 17.0, 35.0, 30.0, 59.0, 78.0, 124.0, 170.0, 319.0, 465.0, 937.0, 1696.0, 3268.0, 6606.0, 14242.0, 31773.0, 649725.0, 285342.0, 28345.0, 12666.0, 6079.0, 2882.0, 1545.0, 833.0, 458.0, 258.0, 188.0, 99.0, 82.0, 58.0, 36.0, 26.0, 14.0, 12.0, 6.0, 8.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.92578125, -0.89678955078125, -0.8677978515625, -0.83880615234375, -0.809814453125, -0.78082275390625, -0.7518310546875, -0.72283935546875, -0.69384765625, -0.66485595703125, -0.6358642578125, -0.60687255859375, -0.577880859375, -0.54888916015625, -0.5198974609375, -0.49090576171875, -0.4619140625, -0.43292236328125, -0.4039306640625, -0.37493896484375, -0.345947265625, -0.31695556640625, -0.2879638671875, -0.25897216796875, -0.22998046875, -0.20098876953125, -0.1719970703125, -0.14300537109375, -0.114013671875, -0.08502197265625, -0.0560302734375, -0.02703857421875, 0.001953125, 0.03094482421875, 0.0599365234375, 0.08892822265625, 0.117919921875, 0.14691162109375, 0.1759033203125, 0.20489501953125, 0.23388671875, 0.26287841796875, 0.2918701171875, 0.32086181640625, 0.349853515625, 0.37884521484375, 0.4078369140625, 0.43682861328125, 0.4658203125, 0.49481201171875, 0.5238037109375, 0.55279541015625, 0.581787109375, 0.61077880859375, 0.6397705078125, 0.66876220703125, 0.69775390625, 0.72674560546875, 0.7557373046875, 0.78472900390625, 0.813720703125, 0.84271240234375, 0.8717041015625, 0.90069580078125, 0.9296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 1.0, 3.0, 10.0, 4.0, 10.0, 13.0, 7.0, 9.0, 19.0, 25.0, 26.0, 28.0, 28.0, 28.0, 34.0, 33.0, 50.0, 58.0, 61.0, 51.0, 45.0, 50.0, 48.0, 53.0, 51.0, 50.0, 44.0, 33.0, 22.0, 9.0, 17.0, 24.0, 13.0, 12.0, 9.0, 3.0, 7.0, 5.0, 7.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8848648071289062e-05, -2.7942471206188202e-05, -2.703629434108734e-05, -2.613011747598648e-05, -2.522394061088562e-05, -2.431776374578476e-05, -2.34115868806839e-05, -2.250541001558304e-05, -2.1599233150482178e-05, -2.0693056285381317e-05, -1.9786879420280457e-05, -1.8880702555179596e-05, -1.7974525690078735e-05, -1.7068348824977875e-05, -1.6162171959877014e-05, -1.5255995094776154e-05, -1.4349818229675293e-05, -1.3443641364574432e-05, -1.2537464499473572e-05, -1.1631287634372711e-05, -1.072511076927185e-05, -9.81893390417099e-06, -8.91275703907013e-06, -8.006580173969269e-06, -7.100403308868408e-06, -6.194226443767548e-06, -5.288049578666687e-06, -4.381872713565826e-06, -3.475695848464966e-06, -2.5695189833641052e-06, -1.6633421182632446e-06, -7.57165253162384e-07, 1.4901161193847656e-07, 1.0551884770393372e-06, 1.9613653421401978e-06, 2.8675422072410583e-06, 3.773719072341919e-06, 4.6798959374427795e-06, 5.58607280254364e-06, 6.492249667644501e-06, 7.398426532745361e-06, 8.304603397846222e-06, 9.210780262947083e-06, 1.0116957128047943e-05, 1.1023133993148804e-05, 1.1929310858249664e-05, 1.2835487723350525e-05, 1.3741664588451385e-05, 1.4647841453552246e-05, 1.5554018318653107e-05, 1.6460195183753967e-05, 1.7366372048854828e-05, 1.827254891395569e-05, 1.917872577905655e-05, 2.008490264415741e-05, 2.099107950925827e-05, 2.189725637435913e-05, 2.280343323945999e-05, 2.3709610104560852e-05, 2.4615786969661713e-05, 2.5521963834762573e-05, 2.6428140699863434e-05, 2.7334317564964294e-05, 2.8240494430065155e-05, 2.9146671295166016e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 6.0, 13.0, 13.0, 22.0, 25.0, 53.0, 80.0, 137.0, 198.0, 290.0, 468.0, 790.0, 1369.0, 2345.0, 4294.0, 7787.0, 14303.0, 25426.0, 44379.0, 74290.0, 114112.0, 158934.0, 178150.0, 151468.0, 107899.0, 68614.0, 40947.0, 23310.0, 12769.0, 6855.0, 3878.0, 2176.0, 1242.0, 687.0, 407.0, 286.0, 173.0, 127.0, 79.0, 52.0, 31.0, 19.0, 19.0, 9.0, 7.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8173828125, -0.7913665771484375, -0.765350341796875, -0.7393341064453125, -0.71331787109375, -0.6873016357421875, -0.661285400390625, -0.6352691650390625, -0.6092529296875, -0.5832366943359375, -0.557220458984375, -0.5312042236328125, -0.50518798828125, -0.4791717529296875, -0.453155517578125, -0.4271392822265625, -0.401123046875, -0.3751068115234375, -0.349090576171875, -0.3230743408203125, -0.29705810546875, -0.2710418701171875, -0.245025634765625, -0.2190093994140625, -0.1929931640625, -0.1669769287109375, -0.140960693359375, -0.1149444580078125, -0.08892822265625, -0.0629119873046875, -0.036895751953125, -0.0108795166015625, 0.01513671875, 0.0411529541015625, 0.067169189453125, 0.0931854248046875, 0.11920166015625, 0.1452178955078125, 0.171234130859375, 0.1972503662109375, 0.2232666015625, 0.2492828369140625, 0.275299072265625, 0.3013153076171875, 0.32733154296875, 0.3533477783203125, 0.379364013671875, 0.4053802490234375, 0.431396484375, 0.4574127197265625, 0.483428955078125, 0.5094451904296875, 0.53546142578125, 0.5614776611328125, 0.587493896484375, 0.6135101318359375, 0.6395263671875, 0.6655426025390625, 0.691558837890625, 0.7175750732421875, 0.74359130859375, 0.7696075439453125, 0.795623779296875, 0.8216400146484375, 0.84765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 7.0, 13.0, 19.0, 21.0, 30.0, 40.0, 37.0, 48.0, 69.0, 81.0, 67.0, 67.0, 81.0, 87.0, 65.0, 60.0, 44.0, 25.0, 26.0, 22.0, 13.0, 16.0, 16.0, 3.0, 7.0, 5.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.3221244812011719, -0.31075286865234375, -0.2993812561035156, -0.2880096435546875, -0.2766380310058594, -0.26526641845703125, -0.2538948059082031, -0.242523193359375, -0.23115158081054688, -0.21977996826171875, -0.20840835571289062, -0.1970367431640625, -0.18566513061523438, -0.17429351806640625, -0.16292190551757812, -0.15155029296875, -0.14017868041992188, -0.12880706787109375, -0.11743545532226562, -0.1060638427734375, -0.09469223022460938, -0.08332061767578125, -0.07194900512695312, -0.060577392578125, -0.049205780029296875, -0.03783416748046875, -0.026462554931640625, -0.0150909423828125, -0.003719329833984375, 0.00765228271484375, 0.019023895263671875, 0.0303955078125, 0.041767120361328125, 0.05313873291015625, 0.06451034545898438, 0.0758819580078125, 0.08725357055664062, 0.09862518310546875, 0.10999679565429688, 0.121368408203125, 0.13274002075195312, 0.14411163330078125, 0.15548324584960938, 0.1668548583984375, 0.17822647094726562, 0.18959808349609375, 0.20096969604492188, 0.21234130859375, 0.22371292114257812, 0.23508453369140625, 0.24645614624023438, 0.2578277587890625, 0.2691993713378906, 0.28057098388671875, 0.2919425964355469, 0.303314208984375, 0.3146858215332031, 0.32605743408203125, 0.3374290466308594, 0.3488006591796875, 0.3601722717285156, 0.37154388427734375, 0.3829154968261719, 0.394287109375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 6.0, 9.0, 11.0, 11.0, 13.0, 14.0, 19.0, 37.0, 28.0, 31.0, 54.0, 41.0, 48.0, 31.0, 48.0, 23.0, 57.0, 40.0, 58.0, 58.0, 40.0, 47.0, 31.0, 37.0, 34.0, 29.0, 29.0, 35.0, 6.0, 14.0, 12.0, 8.0, 7.0, 4.0, 7.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.43577003479004, -16.86945343017578, -16.303136825561523, -15.736820220947266, -15.170504570007324, -14.604187965393066, -14.037871360778809, -13.47155475616455, -12.90523910522461, -12.338922500610352, -11.772605895996094, -11.206289291381836, -10.639973640441895, -10.073657035827637, -9.507340431213379, -8.941023826599121, -8.374707221984863, -7.8083906173706055, -7.242074489593506, -6.675757884979248, -6.109441757202148, -5.543125152587891, -4.976808547973633, -4.410491943359375, -3.8441758155822754, -3.2778594493865967, -2.711543083190918, -2.14522647857666, -1.5789101123809814, -1.0125937461853027, -0.4462771415710449, 0.12003922462463379, 0.6863555908203125, 1.2526719570159912, 1.8189884424209595, 2.3853049278259277, 2.9516212940216064, 3.517937660217285, 4.084254264831543, 4.650570869445801, 5.2168869972229, 5.783203601837158, 6.349519729614258, 6.915836334228516, 7.482152938842773, 8.048469543457031, 8.614786148071289, 9.18110179901123, 9.747418403625488, 10.313735008239746, 10.880051612854004, 11.446367263793945, 12.012683868408203, 12.579000473022461, 13.145317077636719, 13.711633682250977, 14.277950286865234, 14.844266891479492, 15.41058349609375, 15.976900100708008, 16.543216705322266, 17.10953140258789, 17.67584991455078, 18.242164611816406, 18.808481216430664]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 7.0, 1.0, 7.0, 4.0, 6.0, 12.0, 6.0, 12.0, 14.0, 18.0, 15.0, 23.0, 20.0, 25.0, 20.0, 30.0, 18.0, 42.0, 30.0, 23.0, 37.0, 30.0, 37.0, 38.0, 40.0, 36.0, 30.0, 52.0, 33.0, 32.0, 32.0, 35.0, 24.0, 24.0, 21.0, 16.0, 15.0, 19.0, 24.0, 18.0, 9.0, 11.0, 4.0, 10.0, 12.0, 5.0, 5.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.966719627380371, -12.517382621765137, -12.068044662475586, -11.618707656860352, -11.169370651245117, -10.720033645629883, -10.270696640014648, -9.821358680725098, -9.372021675109863, -8.922684669494629, -8.473346710205078, -8.024009704589844, -7.574672698974609, -7.125335693359375, -6.675998210906982, -6.22666072845459, -5.7773237228393555, -5.327986717224121, -4.8786492347717285, -4.429311752319336, -3.9799747467041016, -3.530637502670288, -3.0813002586364746, -2.631963014602661, -2.1826257705688477, -1.7332885265350342, -1.2839512825012207, -0.8346140384674072, -0.38527679443359375, 0.06406044960021973, 0.5133976936340332, 0.9627349376678467, 1.4120721817016602, 1.8614094257354736, 2.310746669769287, 2.7600839138031006, 3.209421157836914, 3.6587584018707275, 4.108095645904541, 4.557433128356934, 5.006770133972168, 5.456107139587402, 5.905444622039795, 6.3547821044921875, 6.804119110107422, 7.253456115722656, 7.702793598175049, 8.152131080627441, 8.601468086242676, 9.05080509185791, 9.500143051147461, 9.949480056762695, 10.39881706237793, 10.848154067993164, 11.297491073608398, 11.74682903289795, 12.196166038513184, 12.645503044128418, 13.094841003417969, 13.544178009033203, 13.993515014648438, 14.442852020263672, 14.892189025878906, 15.341526985168457, 15.790863990783691]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 13.0, 14.0, 30.0, 39.0, 84.0, 140.0, 222.0, 441.0, 694.0, 1257.0, 2112.0, 3710.0, 5866.0, 9932.0, 15417.0, 23597.0, 35346.0, 50398.0, 68237.0, 86342.0, 102140.0, 111947.0, 112435.0, 103581.0, 87848.0, 70310.0, 52516.0, 36759.0, 25149.0, 16151.0, 10188.0, 6207.0, 3880.0, 2285.0, 1383.0, 828.0, 464.0, 268.0, 146.0, 79.0, 42.0, 25.0, 16.0, 10.0, 8.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4609375, -11.037353515625, -10.61376953125, -10.190185546875, -9.7666015625, -9.343017578125, -8.91943359375, -8.495849609375, -8.072265625, -7.648681640625, -7.22509765625, -6.801513671875, -6.3779296875, -5.954345703125, -5.53076171875, -5.107177734375, -4.68359375, -4.260009765625, -3.83642578125, -3.412841796875, -2.9892578125, -2.565673828125, -2.14208984375, -1.718505859375, -1.294921875, -0.871337890625, -0.44775390625, -0.024169921875, 0.3994140625, 0.822998046875, 1.24658203125, 1.670166015625, 2.09375, 2.517333984375, 2.94091796875, 3.364501953125, 3.7880859375, 4.211669921875, 4.63525390625, 5.058837890625, 5.482421875, 5.906005859375, 6.32958984375, 6.753173828125, 7.1767578125, 7.600341796875, 8.02392578125, 8.447509765625, 8.87109375, 9.294677734375, 9.71826171875, 10.141845703125, 10.5654296875, 10.989013671875, 11.41259765625, 11.836181640625, 12.259765625, 12.683349609375, 13.10693359375, 13.530517578125, 13.9541015625, 14.377685546875, 14.80126953125, 15.224853515625, 15.6484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 7.0, 2.0, 7.0, 5.0, 6.0, 10.0, 7.0, 8.0, 17.0, 18.0, 13.0, 28.0, 21.0, 20.0, 26.0, 24.0, 25.0, 35.0, 33.0, 24.0, 32.0, 35.0, 41.0, 30.0, 46.0, 35.0, 26.0, 50.0, 36.0, 38.0, 27.0, 35.0, 25.0, 23.0, 21.0, 19.0, 15.0, 22.0, 18.0, 16.0, 14.0, 7.0, 5.0, 9.0, 13.0, 5.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.5625, -12.12646484375, -11.6904296875, -11.25439453125, -10.818359375, -10.38232421875, -9.9462890625, -9.51025390625, -9.07421875, -8.63818359375, -8.2021484375, -7.76611328125, -7.330078125, -6.89404296875, -6.4580078125, -6.02197265625, -5.5859375, -5.14990234375, -4.7138671875, -4.27783203125, -3.841796875, -3.40576171875, -2.9697265625, -2.53369140625, -2.09765625, -1.66162109375, -1.2255859375, -0.78955078125, -0.353515625, 0.08251953125, 0.5185546875, 0.95458984375, 1.390625, 1.82666015625, 2.2626953125, 2.69873046875, 3.134765625, 3.57080078125, 4.0068359375, 4.44287109375, 4.87890625, 5.31494140625, 5.7509765625, 6.18701171875, 6.623046875, 7.05908203125, 7.4951171875, 7.93115234375, 8.3671875, 8.80322265625, 9.2392578125, 9.67529296875, 10.111328125, 10.54736328125, 10.9833984375, 11.41943359375, 11.85546875, 12.29150390625, 12.7275390625, 13.16357421875, 13.599609375, 14.03564453125, 14.4716796875, 14.90771484375, 15.34375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 9.0, 6.0, 23.0, 25.0, 59.0, 79.0, 122.0, 216.0, 383.0, 581.0, 958.0, 1620.0, 2634.0, 4199.0, 6698.0, 10386.0, 16240.0, 24094.0, 34953.0, 48621.0, 64618.0, 81174.0, 96415.0, 106064.0, 108045.0, 101008.0, 88555.0, 72074.0, 56058.0, 40036.0, 28694.0, 19495.0, 12751.0, 8188.0, 5134.0, 3226.0, 1961.0, 1225.0, 745.0, 449.0, 293.0, 165.0, 101.0, 75.0, 44.0, 29.0, 12.0, 12.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-13.3515625, -12.96142578125, -12.5712890625, -12.18115234375, -11.791015625, -11.40087890625, -11.0107421875, -10.62060546875, -10.23046875, -9.84033203125, -9.4501953125, -9.06005859375, -8.669921875, -8.27978515625, -7.8896484375, -7.49951171875, -7.109375, -6.71923828125, -6.3291015625, -5.93896484375, -5.548828125, -5.15869140625, -4.7685546875, -4.37841796875, -3.98828125, -3.59814453125, -3.2080078125, -2.81787109375, -2.427734375, -2.03759765625, -1.6474609375, -1.25732421875, -0.8671875, -0.47705078125, -0.0869140625, 0.30322265625, 0.693359375, 1.08349609375, 1.4736328125, 1.86376953125, 2.25390625, 2.64404296875, 3.0341796875, 3.42431640625, 3.814453125, 4.20458984375, 4.5947265625, 4.98486328125, 5.375, 5.76513671875, 6.1552734375, 6.54541015625, 6.935546875, 7.32568359375, 7.7158203125, 8.10595703125, 8.49609375, 8.88623046875, 9.2763671875, 9.66650390625, 10.056640625, 10.44677734375, 10.8369140625, 11.22705078125, 11.6171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 10.0, 10.0, 4.0, 9.0, 13.0, 15.0, 23.0, 27.0, 27.0, 15.0, 17.0, 22.0, 27.0, 26.0, 33.0, 35.0, 35.0, 42.0, 44.0, 31.0, 40.0, 26.0, 37.0, 31.0, 39.0, 41.0, 39.0, 18.0, 34.0, 32.0, 27.0, 27.0, 20.0, 15.0, 10.0, 15.0, 18.0, 15.0, 5.0, 11.0, 6.0, 7.0, 6.0, 3.0, 0.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.6953125, -9.3974609375, -9.099609375, -8.8017578125, -8.50390625, -8.2060546875, -7.908203125, -7.6103515625, -7.3125, -7.0146484375, -6.716796875, -6.4189453125, -6.12109375, -5.8232421875, -5.525390625, -5.2275390625, -4.9296875, -4.6318359375, -4.333984375, -4.0361328125, -3.73828125, -3.4404296875, -3.142578125, -2.8447265625, -2.546875, -2.2490234375, -1.951171875, -1.6533203125, -1.35546875, -1.0576171875, -0.759765625, -0.4619140625, -0.1640625, 0.1337890625, 0.431640625, 0.7294921875, 1.02734375, 1.3251953125, 1.623046875, 1.9208984375, 2.21875, 2.5166015625, 2.814453125, 3.1123046875, 3.41015625, 3.7080078125, 4.005859375, 4.3037109375, 4.6015625, 4.8994140625, 5.197265625, 5.4951171875, 5.79296875, 6.0908203125, 6.388671875, 6.6865234375, 6.984375, 7.2822265625, 7.580078125, 7.8779296875, 8.17578125, 8.4736328125, 8.771484375, 9.0693359375, 9.3671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 10.0, 15.0, 19.0, 35.0, 36.0, 84.0, 117.0, 222.0, 303.0, 510.0, 752.0, 1215.0, 1950.0, 2971.0, 4783.0, 7760.0, 12449.0, 20273.0, 32526.0, 50170.0, 72743.0, 99217.0, 122318.0, 133157.0, 128601.0, 109842.0, 83732.0, 58756.0, 38612.0, 24521.0, 15477.0, 9633.0, 5785.0, 3596.0, 2384.0, 1443.0, 902.0, 565.0, 371.0, 220.0, 185.0, 120.0, 60.0, 40.0, 32.0, 14.0, 12.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.79296875, -5.60430908203125, -5.4156494140625, -5.22698974609375, -5.038330078125, -4.84967041015625, -4.6610107421875, -4.47235107421875, -4.28369140625, -4.09503173828125, -3.9063720703125, -3.71771240234375, -3.529052734375, -3.34039306640625, -3.1517333984375, -2.96307373046875, -2.7744140625, -2.58575439453125, -2.3970947265625, -2.20843505859375, -2.019775390625, -1.83111572265625, -1.6424560546875, -1.45379638671875, -1.26513671875, -1.07647705078125, -0.8878173828125, -0.69915771484375, -0.510498046875, -0.32183837890625, -0.1331787109375, 0.05548095703125, 0.244140625, 0.43280029296875, 0.6214599609375, 0.81011962890625, 0.998779296875, 1.18743896484375, 1.3760986328125, 1.56475830078125, 1.75341796875, 1.94207763671875, 2.1307373046875, 2.31939697265625, 2.508056640625, 2.69671630859375, 2.8853759765625, 3.07403564453125, 3.2626953125, 3.45135498046875, 3.6400146484375, 3.82867431640625, 4.017333984375, 4.20599365234375, 4.3946533203125, 4.58331298828125, 4.77197265625, 4.96063232421875, 5.1492919921875, 5.33795166015625, 5.526611328125, 5.71527099609375, 5.9039306640625, 6.09259033203125, 6.28125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 7.0, 6.0, 7.0, 5.0, 8.0, 15.0, 16.0, 25.0, 16.0, 15.0, 28.0, 28.0, 29.0, 42.0, 43.0, 49.0, 44.0, 64.0, 42.0, 44.0, 50.0, 44.0, 39.0, 38.0, 43.0, 35.0, 31.0, 33.0, 28.0, 21.0, 10.0, 14.0, 11.0, 14.0, 9.0, 12.0, 7.0, 4.0, 5.0, 3.0, 2.0, 5.0, 6.0, 2.0, 2.0], "bins": [-0.0007410049438476562, -0.0007216185331344604, -0.0007022321224212646, -0.0006828457117080688, -0.000663459300994873, -0.0006440728902816772, -0.0006246864795684814, -0.0006053000688552856, -0.0005859136581420898, -0.000566527247428894, -0.0005471408367156982, -0.0005277544260025024, -0.0005083680152893066, -0.0004889816045761108, -0.00046959519386291504, -0.00045020878314971924, -0.00043082237243652344, -0.00041143596172332764, -0.00039204955101013184, -0.00037266314029693604, -0.00035327672958374023, -0.00033389031887054443, -0.00031450390815734863, -0.00029511749744415283, -0.00027573108673095703, -0.00025634467601776123, -0.00023695826530456543, -0.00021757185459136963, -0.00019818544387817383, -0.00017879903316497803, -0.00015941262245178223, -0.00014002621173858643, -0.00012063980102539062, -0.00010125339031219482, -8.186697959899902e-05, -6.248056888580322e-05, -4.309415817260742e-05, -2.370774745941162e-05, -4.32133674621582e-06, 1.506507396697998e-05, 3.445148468017578e-05, 5.383789539337158e-05, 7.322430610656738e-05, 9.261071681976318e-05, 0.00011199712753295898, 0.00013138353824615479, 0.00015076994895935059, 0.0001701563596725464, 0.0001895427703857422, 0.000208929181098938, 0.0002283155918121338, 0.0002477020025253296, 0.0002670884132385254, 0.0002864748239517212, 0.000305861234664917, 0.0003252476453781128, 0.0003446340560913086, 0.0003640204668045044, 0.0003834068775177002, 0.000402793288230896, 0.0004221796989440918, 0.0004415661096572876, 0.0004609525203704834, 0.0004803389310836792, 0.000499725341796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 9.0, 16.0, 17.0, 37.0, 48.0, 84.0, 88.0, 170.0, 245.0, 421.0, 666.0, 1055.0, 1701.0, 2998.0, 5193.0, 8881.0, 15601.0, 27600.0, 47137.0, 77124.0, 115317.0, 149204.0, 161505.0, 146099.0, 110049.0, 72667.0, 44107.0, 25699.0, 14729.0, 8260.0, 4767.0, 2757.0, 1599.0, 1048.0, 581.0, 365.0, 250.0, 159.0, 118.0, 55.0, 36.0, 26.0, 28.0, 16.0, 12.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0], "bins": [-9.125, -8.86749267578125, -8.6099853515625, -8.35247802734375, -8.094970703125, -7.83746337890625, -7.5799560546875, -7.32244873046875, -7.06494140625, -6.80743408203125, -6.5499267578125, -6.29241943359375, -6.034912109375, -5.77740478515625, -5.5198974609375, -5.26239013671875, -5.0048828125, -4.74737548828125, -4.4898681640625, -4.23236083984375, -3.974853515625, -3.71734619140625, -3.4598388671875, -3.20233154296875, -2.94482421875, -2.68731689453125, -2.4298095703125, -2.17230224609375, -1.914794921875, -1.65728759765625, -1.3997802734375, -1.14227294921875, -0.884765625, -0.62725830078125, -0.3697509765625, -0.11224365234375, 0.145263671875, 0.40277099609375, 0.6602783203125, 0.91778564453125, 1.17529296875, 1.43280029296875, 1.6903076171875, 1.94781494140625, 2.205322265625, 2.46282958984375, 2.7203369140625, 2.97784423828125, 3.2353515625, 3.49285888671875, 3.7503662109375, 4.00787353515625, 4.265380859375, 4.52288818359375, 4.7803955078125, 5.03790283203125, 5.29541015625, 5.55291748046875, 5.8104248046875, 6.06793212890625, 6.325439453125, 6.58294677734375, 6.8404541015625, 7.09796142578125, 7.35546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 9.0, 5.0, 7.0, 7.0, 7.0, 6.0, 6.0, 13.0, 14.0, 23.0, 19.0, 26.0, 18.0, 36.0, 39.0, 42.0, 39.0, 53.0, 48.0, 48.0, 41.0, 50.0, 64.0, 46.0, 45.0, 47.0, 39.0, 35.0, 29.0, 29.0, 21.0, 16.0, 15.0, 9.0, 13.0, 7.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-2.8828125, -2.7989501953125, -2.715087890625, -2.6312255859375, -2.54736328125, -2.4635009765625, -2.379638671875, -2.2957763671875, -2.2119140625, -2.1280517578125, -2.044189453125, -1.9603271484375, -1.87646484375, -1.7926025390625, -1.708740234375, -1.6248779296875, -1.541015625, -1.4571533203125, -1.373291015625, -1.2894287109375, -1.20556640625, -1.1217041015625, -1.037841796875, -0.9539794921875, -0.8701171875, -0.7862548828125, -0.702392578125, -0.6185302734375, -0.53466796875, -0.4508056640625, -0.366943359375, -0.2830810546875, -0.19921875, -0.1153564453125, -0.031494140625, 0.0523681640625, 0.13623046875, 0.2200927734375, 0.303955078125, 0.3878173828125, 0.4716796875, 0.5555419921875, 0.639404296875, 0.7232666015625, 0.80712890625, 0.8909912109375, 0.974853515625, 1.0587158203125, 1.142578125, 1.2264404296875, 1.310302734375, 1.3941650390625, 1.47802734375, 1.5618896484375, 1.645751953125, 1.7296142578125, 1.8134765625, 1.8973388671875, 1.981201171875, 2.0650634765625, 2.14892578125, 2.2327880859375, 2.316650390625, 2.4005126953125, 2.484375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 7.0, 4.0, 8.0, 13.0, 13.0, 11.0, 24.0, 13.0, 35.0, 28.0, 29.0, 42.0, 39.0, 41.0, 37.0, 56.0, 40.0, 42.0, 35.0, 47.0, 54.0, 44.0, 44.0, 43.0, 35.0, 35.0, 28.0, 32.0, 22.0, 18.0, 14.0, 16.0, 9.0, 3.0, 8.0, 5.0, 6.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.99200439453125, -17.451509475708008, -16.911012649536133, -16.37051773071289, -15.830022811889648, -15.28952693939209, -14.749031066894531, -14.208536148071289, -13.668041229248047, -13.127545356750488, -12.587050437927246, -12.046554565429688, -11.506059646606445, -10.965563774108887, -10.425067901611328, -9.884572982788086, -9.344077110290527, -8.803581237792969, -8.263086318969727, -7.722590446472168, -7.182095527648926, -6.641599655151367, -6.101104259490967, -5.560608863830566, -5.020113468170166, -4.479618072509766, -3.9391226768493652, -3.3986270427703857, -2.8581316471099854, -2.317636251449585, -1.7771406173706055, -1.236645221710205, -0.6961498260498047, -0.15565437078475952, 0.38484108448028564, 0.9253365993499756, 1.465831995010376, 2.0063273906707764, 2.546823024749756, 3.0873184204101562, 3.6278138160705566, 4.168309211730957, 4.708804607391357, 5.249300003051758, 5.789795875549316, 6.330290794372559, 6.870786666870117, 7.411282062530518, 7.951777458190918, 8.492273330688477, 9.032768249511719, 9.573264122009277, 10.11375904083252, 10.654254913330078, 11.19474983215332, 11.735245704650879, 12.275741577148438, 12.816237449645996, 13.356732368469238, 13.897228240966797, 14.437723159790039, 14.978219032287598, 15.518714904785156, 16.0592098236084, 16.59970474243164]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 1.0, 4.0, 8.0, 9.0, 10.0, 27.0, 19.0, 18.0, 27.0, 25.0, 24.0, 26.0, 34.0, 31.0, 34.0, 38.0, 49.0, 40.0, 32.0, 38.0, 44.0, 32.0, 43.0, 35.0, 39.0, 35.0, 26.0, 34.0, 31.0, 26.0, 18.0, 16.0, 23.0, 12.0, 11.0, 10.0, 9.0, 9.0, 10.0, 6.0, 11.0, 4.0, 1.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-15.185629844665527, -14.681742668151855, -14.177855491638184, -13.673968315124512, -13.17008113861084, -12.666193962097168, -12.162307739257812, -11.65842056274414, -11.154533386230469, -10.650646209716797, -10.146759033203125, -9.642871856689453, -9.138984680175781, -8.63509750366211, -8.131210327148438, -7.627323627471924, -7.123435974121094, -6.619548797607422, -6.11566162109375, -5.611774444580078, -5.107887268066406, -4.604000091552734, -4.100113391876221, -3.596226215362549, -3.092339038848877, -2.588451862335205, -2.084564685821533, -1.5806777477264404, -1.0767905712127686, -0.5729033946990967, -0.0690164566040039, 0.43487071990966797, 0.9387569427490234, 1.4426441192626953, 1.9465311765670776, 2.45041823387146, 2.954305410385132, 3.4581925868988037, 3.9620795249938965, 4.465966701507568, 4.96985387802124, 5.473741054534912, 5.977628231048584, 6.481514930725098, 6.9854021072387695, 7.489289283752441, 7.993176460266113, 8.497063636779785, 9.000950813293457, 9.504837989807129, 10.0087251663208, 10.512612342834473, 11.016499519348145, 11.520386695861816, 12.024272918701172, 12.528160095214844, 13.032047271728516, 13.535934448242188, 14.03982162475586, 14.543708801269531, 15.047595977783203, 15.551483154296875, 16.055370330810547, 16.55925750732422, 17.06314468383789]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 8.0, 8.0, 13.0, 10.0, 27.0, 37.0, 51.0, 95.0, 156.0, 234.0, 367.0, 588.0, 931.0, 1442.0, 2391.0, 4084.0, 6710.0, 11268.0, 19001.0, 32608.0, 55283.0, 92105.0, 152198.0, 238977.0, 353704.0, 473272.0, 559128.0, 570703.0, 503368.0, 390835.0, 272728.0, 177345.0, 109290.0, 66122.0, 39295.0, 23622.0, 14007.0, 8513.0, 5232.0, 3135.0, 1921.0, 1251.0, 795.0, 500.0, 335.0, 200.0, 132.0, 86.0, 61.0, 40.0, 28.0, 19.0, 10.0, 7.0, 6.0, 6.0, 2.0, 0.0, 3.0, 0.0, 4.0], "bins": [-14.7578125, -14.2686767578125, -13.779541015625, -13.2904052734375, -12.80126953125, -12.3121337890625, -11.822998046875, -11.3338623046875, -10.8447265625, -10.3555908203125, -9.866455078125, -9.3773193359375, -8.88818359375, -8.3990478515625, -7.909912109375, -7.4207763671875, -6.931640625, -6.4425048828125, -5.953369140625, -5.4642333984375, -4.97509765625, -4.4859619140625, -3.996826171875, -3.5076904296875, -3.0185546875, -2.5294189453125, -2.040283203125, -1.5511474609375, -1.06201171875, -0.5728759765625, -0.083740234375, 0.4053955078125, 0.89453125, 1.3836669921875, 1.872802734375, 2.3619384765625, 2.85107421875, 3.3402099609375, 3.829345703125, 4.3184814453125, 4.8076171875, 5.2967529296875, 5.785888671875, 6.2750244140625, 6.76416015625, 7.2532958984375, 7.742431640625, 8.2315673828125, 8.720703125, 9.2098388671875, 9.698974609375, 10.1881103515625, 10.67724609375, 11.1663818359375, 11.655517578125, 12.1446533203125, 12.6337890625, 13.1229248046875, 13.612060546875, 14.1011962890625, 14.59033203125, 15.0794677734375, 15.568603515625, 16.0577392578125, 16.546875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 7.0, 5.0, 2.0, 3.0, 5.0, 11.0, 7.0, 19.0, 20.0, 24.0, 17.0, 26.0, 24.0, 22.0, 36.0, 30.0, 28.0, 40.0, 42.0, 43.0, 36.0, 38.0, 42.0, 34.0, 40.0, 39.0, 34.0, 37.0, 32.0, 36.0, 27.0, 25.0, 28.0, 14.0, 22.0, 14.0, 17.0, 11.0, 7.0, 12.0, 4.0, 11.0, 9.0, 7.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-13.3984375, -12.9482421875, -12.498046875, -12.0478515625, -11.59765625, -11.1474609375, -10.697265625, -10.2470703125, -9.796875, -9.3466796875, -8.896484375, -8.4462890625, -7.99609375, -7.5458984375, -7.095703125, -6.6455078125, -6.1953125, -5.7451171875, -5.294921875, -4.8447265625, -4.39453125, -3.9443359375, -3.494140625, -3.0439453125, -2.59375, -2.1435546875, -1.693359375, -1.2431640625, -0.79296875, -0.3427734375, 0.107421875, 0.5576171875, 1.0078125, 1.4580078125, 1.908203125, 2.3583984375, 2.80859375, 3.2587890625, 3.708984375, 4.1591796875, 4.609375, 5.0595703125, 5.509765625, 5.9599609375, 6.41015625, 6.8603515625, 7.310546875, 7.7607421875, 8.2109375, 8.6611328125, 9.111328125, 9.5615234375, 10.01171875, 10.4619140625, 10.912109375, 11.3623046875, 11.8125, 12.2626953125, 12.712890625, 13.1630859375, 13.61328125, 14.0634765625, 14.513671875, 14.9638671875, 15.4140625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 5.0, 11.0, 13.0, 24.0, 35.0, 76.0, 99.0, 183.0, 300.0, 529.0, 857.0, 1425.0, 2461.0, 4268.0, 7505.0, 13564.0, 24043.0, 43067.0, 74973.0, 128164.0, 207203.0, 315396.0, 438688.0, 541242.0, 580281.0, 541707.0, 438082.0, 317704.0, 208394.0, 128679.0, 75904.0, 43234.0, 24364.0, 13497.0, 7618.0, 4479.0, 2587.0, 1453.0, 872.0, 494.0, 315.0, 177.0, 111.0, 75.0, 45.0, 29.0, 21.0, 14.0, 5.0, 7.0, 2.0, 5.0, 1.0], "bins": [-19.421875, -18.8748779296875, -18.327880859375, -17.7808837890625, -17.23388671875, -16.6868896484375, -16.139892578125, -15.5928955078125, -15.0458984375, -14.4989013671875, -13.951904296875, -13.4049072265625, -12.85791015625, -12.3109130859375, -11.763916015625, -11.2169189453125, -10.669921875, -10.1229248046875, -9.575927734375, -9.0289306640625, -8.48193359375, -7.9349365234375, -7.387939453125, -6.8409423828125, -6.2939453125, -5.7469482421875, -5.199951171875, -4.6529541015625, -4.10595703125, -3.5589599609375, -3.011962890625, -2.4649658203125, -1.91796875, -1.3709716796875, -0.823974609375, -0.2769775390625, 0.27001953125, 0.8170166015625, 1.364013671875, 1.9110107421875, 2.4580078125, 3.0050048828125, 3.552001953125, 4.0989990234375, 4.64599609375, 5.1929931640625, 5.739990234375, 6.2869873046875, 6.833984375, 7.3809814453125, 7.927978515625, 8.4749755859375, 9.02197265625, 9.5689697265625, 10.115966796875, 10.6629638671875, 11.2099609375, 11.7569580078125, 12.303955078125, 12.8509521484375, 13.39794921875, 13.9449462890625, 14.491943359375, 15.0389404296875, 15.5859375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 16.0, 12.0, 11.0, 18.0, 21.0, 24.0, 48.0, 33.0, 50.0, 65.0, 95.0, 109.0, 105.0, 107.0, 131.0, 162.0, 148.0, 174.0, 187.0, 190.0, 200.0, 178.0, 196.0, 188.0, 179.0, 199.0, 197.0, 147.0, 120.0, 130.0, 106.0, 81.0, 75.0, 81.0, 54.0, 45.0, 47.0, 37.0, 26.0, 22.0, 19.0, 8.0, 11.0, 5.0, 2.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.546875, -6.33489990234375, -6.1229248046875, -5.91094970703125, -5.698974609375, -5.48699951171875, -5.2750244140625, -5.06304931640625, -4.85107421875, -4.63909912109375, -4.4271240234375, -4.21514892578125, -4.003173828125, -3.79119873046875, -3.5792236328125, -3.36724853515625, -3.1552734375, -2.94329833984375, -2.7313232421875, -2.51934814453125, -2.307373046875, -2.09539794921875, -1.8834228515625, -1.67144775390625, -1.45947265625, -1.24749755859375, -1.0355224609375, -0.82354736328125, -0.611572265625, -0.39959716796875, -0.1876220703125, 0.02435302734375, 0.236328125, 0.44830322265625, 0.6602783203125, 0.87225341796875, 1.084228515625, 1.29620361328125, 1.5081787109375, 1.72015380859375, 1.93212890625, 2.14410400390625, 2.3560791015625, 2.56805419921875, 2.780029296875, 2.99200439453125, 3.2039794921875, 3.41595458984375, 3.6279296875, 3.83990478515625, 4.0518798828125, 4.26385498046875, 4.475830078125, 4.68780517578125, 4.8997802734375, 5.11175537109375, 5.32373046875, 5.53570556640625, 5.7476806640625, 5.95965576171875, 6.171630859375, 6.38360595703125, 6.5955810546875, 6.80755615234375, 7.01953125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 9.0, 7.0, 6.0, 3.0, 16.0, 12.0, 20.0, 26.0, 21.0, 24.0, 37.0, 49.0, 54.0, 53.0, 57.0, 49.0, 44.0, 50.0, 75.0, 49.0, 56.0, 51.0, 40.0, 31.0, 42.0, 28.0, 22.0, 18.0, 10.0, 11.0, 17.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.895763397216797, -16.224443435668945, -15.553123474121094, -14.881803512573242, -14.21048355102539, -13.539163589477539, -12.867844581604004, -12.196524620056152, -11.5252046585083, -10.85388469696045, -10.182564735412598, -9.511245727539062, -8.839925765991211, -8.16860580444336, -7.497285842895508, -6.825965881347656, -6.154645919799805, -5.483325958251953, -4.812005996704102, -4.140686511993408, -3.4693665504455566, -2.798046588897705, -2.1267271041870117, -1.4554071426391602, -0.7840871810913086, -0.11276733875274658, 0.5585525035858154, 1.229872226715088, 1.9011921882629395, 2.572512149810791, 3.2438316345214844, 3.915151596069336, 4.5864715576171875, 5.257791519165039, 5.929111480712891, 6.600430965423584, 7.2717509269714355, 7.943070888519287, 8.61439037322998, 9.285710334777832, 9.957030296325684, 10.628350257873535, 11.299670219421387, 11.970989227294922, 12.642309188842773, 13.313629150390625, 13.984949111938477, 14.656269073486328, 15.32758903503418, 15.998908996582031, 16.670228958129883, 17.341548919677734, 18.012868881225586, 18.684188842773438, 19.355506896972656, 20.02682876586914, 20.69814682006836, 21.36946678161621, 22.040786743164062, 22.712106704711914, 23.383426666259766, 24.054746627807617, 24.72606658935547, 25.397384643554688, 26.068706512451172]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 8.0, 11.0, 17.0, 9.0, 15.0, 25.0, 22.0, 33.0, 39.0, 38.0, 37.0, 50.0, 38.0, 33.0, 40.0, 43.0, 35.0, 42.0, 59.0, 50.0, 41.0, 37.0, 38.0, 36.0, 20.0, 23.0, 22.0, 18.0, 21.0, 18.0, 13.0, 15.0, 14.0, 9.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.033568382263184, -14.452958106994629, -13.872347831726074, -13.291738510131836, -12.711128234863281, -12.130517959594727, -11.549907684326172, -10.969297409057617, -10.388687133789062, -9.808076858520508, -9.227466583251953, -8.646856307983398, -8.06624698638916, -7.4856367111206055, -6.905026435852051, -6.324416637420654, -5.743806838989258, -5.163196563720703, -4.582586765289307, -4.001976490020752, -3.4213664531707764, -2.840756416320801, -2.260146141052246, -1.6795363426208496, -1.098926067352295, -0.5183159708976746, 0.0622941255569458, 0.6429042816162109, 1.2235143184661865, 1.804124355316162, 2.384734630584717, 2.9653444290161133, 3.5459537506103516, 4.126564025878906, 4.707173824310303, 5.287784099578857, 5.868393898010254, 6.449004173278809, 7.029614448547363, 7.61022424697876, 8.190834045410156, 8.771444320678711, 9.352054595947266, 9.93266487121582, 10.513274192810059, 11.093884468078613, 11.674494743347168, 12.255104064941406, 12.835715293884277, 13.416325569152832, 13.996935844421387, 14.577545166015625, 15.15815544128418, 15.738765716552734, 16.31937599182129, 16.899986267089844, 17.4805965423584, 18.061206817626953, 18.641817092895508, 19.222427368164062, 19.803037643432617, 20.383647918701172, 20.964256286621094, 21.54486656188965, 22.125476837158203]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 10.0, 11.0, 20.0, 47.0, 48.0, 62.0, 137.0, 232.0, 316.0, 513.0, 787.0, 1369.0, 2304.0, 4004.0, 6777.0, 11559.0, 19740.0, 33553.0, 55081.0, 85302.0, 121708.0, 152080.0, 157531.0, 133937.0, 97781.0, 64672.0, 39952.0, 24246.0, 14262.0, 8323.0, 4891.0, 2949.0, 1691.0, 1051.0, 600.0, 374.0, 233.0, 147.0, 94.0, 73.0, 36.0, 21.0, 10.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.46484375, -3.357177734375, -3.24951171875, -3.141845703125, -3.0341796875, -2.926513671875, -2.81884765625, -2.711181640625, -2.603515625, -2.495849609375, -2.38818359375, -2.280517578125, -2.1728515625, -2.065185546875, -1.95751953125, -1.849853515625, -1.7421875, -1.634521484375, -1.52685546875, -1.419189453125, -1.3115234375, -1.203857421875, -1.09619140625, -0.988525390625, -0.880859375, -0.773193359375, -0.66552734375, -0.557861328125, -0.4501953125, -0.342529296875, -0.23486328125, -0.127197265625, -0.01953125, 0.088134765625, 0.19580078125, 0.303466796875, 0.4111328125, 0.518798828125, 0.62646484375, 0.734130859375, 0.841796875, 0.949462890625, 1.05712890625, 1.164794921875, 1.2724609375, 1.380126953125, 1.48779296875, 1.595458984375, 1.703125, 1.810791015625, 1.91845703125, 2.026123046875, 2.1337890625, 2.241455078125, 2.34912109375, 2.456787109375, 2.564453125, 2.672119140625, 2.77978515625, 2.887451171875, 2.9951171875, 3.102783203125, 3.21044921875, 3.318115234375, 3.42578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 11.0, 16.0, 10.0, 14.0, 26.0, 21.0, 32.0, 40.0, 38.0, 36.0, 53.0, 38.0, 30.0, 38.0, 43.0, 37.0, 44.0, 63.0, 46.0, 42.0, 36.0, 41.0, 33.0, 20.0, 22.0, 23.0, 17.0, 20.0, 20.0, 13.0, 14.0, 15.0, 8.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0234375, -14.4422607421875, -13.861083984375, -13.2799072265625, -12.69873046875, -12.1175537109375, -11.536376953125, -10.9552001953125, -10.3740234375, -9.7928466796875, -9.211669921875, -8.6304931640625, -8.04931640625, -7.4681396484375, -6.886962890625, -6.3057861328125, -5.724609375, -5.1434326171875, -4.562255859375, -3.9810791015625, -3.39990234375, -2.8187255859375, -2.237548828125, -1.6563720703125, -1.0751953125, -0.4940185546875, 0.087158203125, 0.6683349609375, 1.24951171875, 1.8306884765625, 2.411865234375, 2.9930419921875, 3.57421875, 4.1553955078125, 4.736572265625, 5.3177490234375, 5.89892578125, 6.4801025390625, 7.061279296875, 7.6424560546875, 8.2236328125, 8.8048095703125, 9.385986328125, 9.9671630859375, 10.54833984375, 11.1295166015625, 11.710693359375, 12.2918701171875, 12.873046875, 13.4542236328125, 14.035400390625, 14.6165771484375, 15.19775390625, 15.7789306640625, 16.360107421875, 16.9412841796875, 17.5224609375, 18.1036376953125, 18.684814453125, 19.2659912109375, 19.84716796875, 20.4283447265625, 21.009521484375, 21.5906982421875, 22.171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 11.0, 6.0, 13.0, 12.0, 19.0, 17.0, 30.0, 33.0, 56.0, 91.0, 114.0, 181.0, 285.0, 371.0, 583.0, 814.0, 1270.0, 1901.0, 2906.0, 4546.0, 7116.0, 11355.0, 19305.0, 38713.0, 626233.0, 257485.0, 30311.0, 16578.0, 10005.0, 6463.0, 3972.0, 2572.0, 1690.0, 1151.0, 737.0, 525.0, 357.0, 207.0, 141.0, 122.0, 79.0, 53.0, 36.0, 27.0, 18.0, 13.0, 11.0, 9.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.015625, -5.814208984375, -5.61279296875, -5.411376953125, -5.2099609375, -5.008544921875, -4.80712890625, -4.605712890625, -4.404296875, -4.202880859375, -4.00146484375, -3.800048828125, -3.5986328125, -3.397216796875, -3.19580078125, -2.994384765625, -2.79296875, -2.591552734375, -2.39013671875, -2.188720703125, -1.9873046875, -1.785888671875, -1.58447265625, -1.383056640625, -1.181640625, -0.980224609375, -0.77880859375, -0.577392578125, -0.3759765625, -0.174560546875, 0.02685546875, 0.228271484375, 0.4296875, 0.631103515625, 0.83251953125, 1.033935546875, 1.2353515625, 1.436767578125, 1.63818359375, 1.839599609375, 2.041015625, 2.242431640625, 2.44384765625, 2.645263671875, 2.8466796875, 3.048095703125, 3.24951171875, 3.450927734375, 3.65234375, 3.853759765625, 4.05517578125, 4.256591796875, 4.4580078125, 4.659423828125, 4.86083984375, 5.062255859375, 5.263671875, 5.465087890625, 5.66650390625, 5.867919921875, 6.0693359375, 6.270751953125, 6.47216796875, 6.673583984375, 6.875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 5.0, 3.0, 6.0, 6.0, 8.0, 9.0, 15.0, 13.0, 29.0, 21.0, 19.0, 25.0, 23.0, 33.0, 38.0, 40.0, 42.0, 41.0, 36.0, 44.0, 24.0, 39.0, 47.0, 44.0, 36.0, 35.0, 28.0, 29.0, 32.0, 20.0, 27.0, 21.0, 26.0, 24.0, 14.0, 17.0, 14.0, 12.0, 8.0, 12.0, 10.0, 9.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.96875, -10.63720703125, -10.3056640625, -9.97412109375, -9.642578125, -9.31103515625, -8.9794921875, -8.64794921875, -8.31640625, -7.98486328125, -7.6533203125, -7.32177734375, -6.990234375, -6.65869140625, -6.3271484375, -5.99560546875, -5.6640625, -5.33251953125, -5.0009765625, -4.66943359375, -4.337890625, -4.00634765625, -3.6748046875, -3.34326171875, -3.01171875, -2.68017578125, -2.3486328125, -2.01708984375, -1.685546875, -1.35400390625, -1.0224609375, -0.69091796875, -0.359375, -0.02783203125, 0.3037109375, 0.63525390625, 0.966796875, 1.29833984375, 1.6298828125, 1.96142578125, 2.29296875, 2.62451171875, 2.9560546875, 3.28759765625, 3.619140625, 3.95068359375, 4.2822265625, 4.61376953125, 4.9453125, 5.27685546875, 5.6083984375, 5.93994140625, 6.271484375, 6.60302734375, 6.9345703125, 7.26611328125, 7.59765625, 7.92919921875, 8.2607421875, 8.59228515625, 8.923828125, 9.25537109375, 9.5869140625, 9.91845703125, 10.25]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 12.0, 15.0, 25.0, 24.0, 38.0, 62.0, 102.0, 155.0, 224.0, 482.0, 848.0, 1722.0, 3599.0, 8129.0, 18435.0, 47163.0, 882783.0, 49859.0, 19010.0, 8256.0, 3789.0, 1765.0, 900.0, 471.0, 290.0, 127.0, 90.0, 51.0, 38.0, 21.0, 16.0, 14.0, 8.0, 10.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98828125, -0.954803466796875, -0.92132568359375, -0.887847900390625, -0.8543701171875, -0.820892333984375, -0.78741455078125, -0.753936767578125, -0.720458984375, -0.686981201171875, -0.65350341796875, -0.620025634765625, -0.5865478515625, -0.553070068359375, -0.51959228515625, -0.486114501953125, -0.45263671875, -0.419158935546875, -0.38568115234375, -0.352203369140625, -0.3187255859375, -0.285247802734375, -0.25177001953125, -0.218292236328125, -0.184814453125, -0.151336669921875, -0.11785888671875, -0.084381103515625, -0.0509033203125, -0.017425537109375, 0.01605224609375, 0.049530029296875, 0.0830078125, 0.116485595703125, 0.14996337890625, 0.183441162109375, 0.2169189453125, 0.250396728515625, 0.28387451171875, 0.317352294921875, 0.350830078125, 0.384307861328125, 0.41778564453125, 0.451263427734375, 0.4847412109375, 0.518218994140625, 0.55169677734375, 0.585174560546875, 0.61865234375, 0.652130126953125, 0.68560791015625, 0.719085693359375, 0.7525634765625, 0.786041259765625, 0.81951904296875, 0.852996826171875, 0.886474609375, 0.919952392578125, 0.95343017578125, 0.986907958984375, 1.0203857421875, 1.053863525390625, 1.08734130859375, 1.120819091796875, 1.154296875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 7.0, 13.0, 13.0, 21.0, 12.0, 27.0, 31.0, 24.0, 33.0, 52.0, 45.0, 55.0, 55.0, 62.0, 52.0, 61.0, 72.0, 67.0, 39.0, 36.0, 56.0, 43.0, 24.0, 18.0, 16.0, 18.0, 10.0, 18.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.759695053100586e-05, -2.6722438633441925e-05, -2.584792673587799e-05, -2.4973414838314056e-05, -2.4098902940750122e-05, -2.3224391043186188e-05, -2.2349879145622253e-05, -2.147536724805832e-05, -2.0600855350494385e-05, -1.972634345293045e-05, -1.8851831555366516e-05, -1.7977319657802582e-05, -1.7102807760238647e-05, -1.6228295862674713e-05, -1.535378396511078e-05, -1.4479272067546844e-05, -1.360476016998291e-05, -1.2730248272418976e-05, -1.1855736374855042e-05, -1.0981224477291107e-05, -1.0106712579727173e-05, -9.232200682163239e-06, -8.357688784599304e-06, -7.48317688703537e-06, -6.6086649894714355e-06, -5.734153091907501e-06, -4.859641194343567e-06, -3.9851292967796326e-06, -3.1106173992156982e-06, -2.236105501651764e-06, -1.3615936040878296e-06, -4.870817065238953e-07, 3.8743019104003906e-07, 1.2619420886039734e-06, 2.1364539861679077e-06, 3.010965883731842e-06, 3.885477781295776e-06, 4.759989678859711e-06, 5.634501576423645e-06, 6.509013473987579e-06, 7.383525371551514e-06, 8.258037269115448e-06, 9.132549166679382e-06, 1.0007061064243317e-05, 1.0881572961807251e-05, 1.1756084859371185e-05, 1.263059675693512e-05, 1.3505108654499054e-05, 1.4379620552062988e-05, 1.5254132449626923e-05, 1.6128644347190857e-05, 1.700315624475479e-05, 1.7877668142318726e-05, 1.875218003988266e-05, 1.9626691937446594e-05, 2.050120383501053e-05, 2.1375715732574463e-05, 2.2250227630138397e-05, 2.312473952770233e-05, 2.3999251425266266e-05, 2.48737633228302e-05, 2.5748275220394135e-05, 2.662278711795807e-05, 2.7497299015522003e-05, 2.8371810913085938e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [5.0, 4.0, 4.0, 7.0, 13.0, 18.0, 21.0, 30.0, 41.0, 83.0, 96.0, 151.0, 216.0, 342.0, 487.0, 664.0, 986.0, 1411.0, 2041.0, 3015.0, 4224.0, 6214.0, 8953.0, 13219.0, 19179.0, 27422.0, 39191.0, 54609.0, 75522.0, 99585.0, 123500.0, 130278.0, 115364.0, 91388.0, 68003.0, 48839.0, 35088.0, 24335.0, 16794.0, 11513.0, 7961.0, 5476.0, 3835.0, 2599.0, 1802.0, 1260.0, 911.0, 558.0, 441.0, 268.0, 202.0, 123.0, 102.0, 63.0, 29.0, 34.0, 16.0, 18.0, 8.0, 9.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.54833984375, -0.5308380126953125, -0.513336181640625, -0.4958343505859375, -0.47833251953125, -0.4608306884765625, -0.443328857421875, -0.4258270263671875, -0.4083251953125, -0.3908233642578125, -0.373321533203125, -0.3558197021484375, -0.33831787109375, -0.3208160400390625, -0.303314208984375, -0.2858123779296875, -0.268310546875, -0.2508087158203125, -0.233306884765625, -0.2158050537109375, -0.19830322265625, -0.1808013916015625, -0.163299560546875, -0.1457977294921875, -0.1282958984375, -0.1107940673828125, -0.093292236328125, -0.0757904052734375, -0.05828857421875, -0.0407867431640625, -0.023284912109375, -0.0057830810546875, 0.01171875, 0.0292205810546875, 0.046722412109375, 0.0642242431640625, 0.08172607421875, 0.0992279052734375, 0.116729736328125, 0.1342315673828125, 0.1517333984375, 0.1692352294921875, 0.186737060546875, 0.2042388916015625, 0.22174072265625, 0.2392425537109375, 0.256744384765625, 0.2742462158203125, 0.291748046875, 0.3092498779296875, 0.326751708984375, 0.3442535400390625, 0.36175537109375, 0.3792572021484375, 0.396759033203125, 0.4142608642578125, 0.4317626953125, 0.4492645263671875, 0.466766357421875, 0.4842681884765625, 0.50177001953125, 0.5192718505859375, 0.536773681640625, 0.5542755126953125, 0.57177734375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 11.0, 7.0, 16.0, 19.0, 16.0, 36.0, 39.0, 52.0, 56.0, 88.0, 105.0, 80.0, 87.0, 81.0, 56.0, 51.0, 28.0, 35.0, 34.0, 21.0, 22.0, 10.0, 10.0, 8.0, 8.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3486328125, -0.3353767395019531, -0.32212066650390625, -0.3088645935058594, -0.2956085205078125, -0.2823524475097656, -0.26909637451171875, -0.2558403015136719, -0.242584228515625, -0.22932815551757812, -0.21607208251953125, -0.20281600952148438, -0.1895599365234375, -0.17630386352539062, -0.16304779052734375, -0.14979171752929688, -0.13653564453125, -0.12327957153320312, -0.11002349853515625, -0.09676742553710938, -0.0835113525390625, -0.07025527954101562, -0.05699920654296875, -0.043743133544921875, -0.030487060546875, -0.017230987548828125, -0.00397491455078125, 0.009281158447265625, 0.0225372314453125, 0.035793304443359375, 0.04904937744140625, 0.062305450439453125, 0.0755615234375, 0.08881759643554688, 0.10207366943359375, 0.11532974243164062, 0.1285858154296875, 0.14184188842773438, 0.15509796142578125, 0.16835403442382812, 0.181610107421875, 0.19486618041992188, 0.20812225341796875, 0.22137832641601562, 0.2346343994140625, 0.24789047241210938, 0.26114654541015625, 0.2744026184082031, 0.28765869140625, 0.3009147644042969, 0.31417083740234375, 0.3274269104003906, 0.3406829833984375, 0.3539390563964844, 0.36719512939453125, 0.3804512023925781, 0.393707275390625, 0.4069633483886719, 0.42021942138671875, 0.4334754943847656, 0.4467315673828125, 0.4599876403808594, 0.47324371337890625, 0.4864997863769531, 0.499755859375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 8.0, 5.0, 6.0, 12.0, 12.0, 16.0, 24.0, 29.0, 23.0, 37.0, 48.0, 49.0, 63.0, 51.0, 47.0, 47.0, 56.0, 73.0, 53.0, 57.0, 53.0, 30.0, 43.0, 37.0, 25.0, 24.0, 18.0, 14.0, 15.0, 9.0, 6.0, 4.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.340423583984375, -16.648508071899414, -15.95659065246582, -15.264674186706543, -14.572757720947266, -13.880841255187988, -13.188924789428711, -12.49700927734375, -11.805091857910156, -11.113175392150879, -10.421258926391602, -9.729342460632324, -9.037425994873047, -8.34550952911377, -7.65359354019165, -6.961677074432373, -6.269761085510254, -5.577844619750977, -4.885928153991699, -4.194011688232422, -3.5020954608917236, -2.8101789951324463, -2.118262767791748, -1.4263463020324707, -0.7344298362731934, -0.04251343011856079, 0.6494029760360718, 1.3413193225860596, 2.033235788345337, 2.7251522541046143, 3.4170684814453125, 4.10898494720459, 4.800901412963867, 5.4928178787231445, 6.184734344482422, 6.876650810241699, 7.568567276000977, 8.260483741760254, 8.952400207519531, 9.644315719604492, 10.336233139038086, 11.028149604797363, 11.72006607055664, 12.411982536315918, 13.103899002075195, 13.795815467834473, 14.48773193359375, 15.179647445678711, 15.871563911437988, 16.563480377197266, 17.255395889282227, 17.94731330871582, 18.63922882080078, 19.331146240234375, 20.023061752319336, 20.71497917175293, 21.40689468383789, 22.09881019592285, 22.790727615356445, 23.482643127441406, 24.174560546875, 24.86647605895996, 25.558393478393555, 26.250308990478516, 26.94222640991211]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 9.0, 11.0, 18.0, 8.0, 15.0, 25.0, 24.0, 31.0, 37.0, 40.0, 38.0, 52.0, 37.0, 30.0, 45.0, 40.0, 34.0, 46.0, 58.0, 50.0, 39.0, 37.0, 38.0, 36.0, 18.0, 25.0, 21.0, 20.0, 21.0, 20.0, 12.0, 10.0, 16.0, 9.0, 4.0, 8.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.009733200073242, -14.427873611450195, -13.846014022827148, -13.264155387878418, -12.682295799255371, -12.100436210632324, -11.518577575683594, -10.936717987060547, -10.3548583984375, -9.772998809814453, -9.191139221191406, -8.609280586242676, -8.027420997619629, -7.445561408996582, -6.863702297210693, -6.281843185424805, -5.699983596801758, -5.118124008178711, -4.536264896392822, -3.9544055461883545, -3.3725461959838867, -2.790686845779419, -2.208827495574951, -1.6269683837890625, -1.0451087951660156, -0.46324944496154785, 0.11860990524291992, 0.7004692554473877, 1.2823286056518555, 1.8641879558563232, 2.446047306060791, 3.0279064178466797, 3.6097679138183594, 4.191627502441406, 4.773486614227295, 5.355345726013184, 5.9372053146362305, 6.519064903259277, 7.100924015045166, 7.682783126831055, 8.264642715454102, 8.846502304077148, 9.428361892700195, 10.010220527648926, 10.592080116271973, 11.17393970489502, 11.75579833984375, 12.337657928466797, 12.919517517089844, 13.50137710571289, 14.083236694335938, 14.665095329284668, 15.246954917907715, 15.828814506530762, 16.410673141479492, 16.99253273010254, 17.574392318725586, 18.156251907348633, 18.73811149597168, 19.319971084594727, 19.90182876586914, 20.483688354492188, 21.065547943115234, 21.64740753173828, 22.229267120361328]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 10.0, 8.0, 12.0, 26.0, 40.0, 69.0, 112.0, 184.0, 290.0, 454.0, 741.0, 1201.0, 1894.0, 2783.0, 4592.0, 7008.0, 10834.0, 16136.0, 23913.0, 33868.0, 45959.0, 60985.0, 75862.0, 89043.0, 99212.0, 102521.0, 99030.0, 88828.0, 75111.0, 59846.0, 45685.0, 33332.0, 23365.0, 15791.0, 10574.0, 6968.0, 4585.0, 2806.0, 1865.0, 1186.0, 693.0, 450.0, 265.0, 170.0, 100.0, 61.0, 40.0, 25.0, 11.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.21875, -11.83056640625, -11.4423828125, -11.05419921875, -10.666015625, -10.27783203125, -9.8896484375, -9.50146484375, -9.11328125, -8.72509765625, -8.3369140625, -7.94873046875, -7.560546875, -7.17236328125, -6.7841796875, -6.39599609375, -6.0078125, -5.61962890625, -5.2314453125, -4.84326171875, -4.455078125, -4.06689453125, -3.6787109375, -3.29052734375, -2.90234375, -2.51416015625, -2.1259765625, -1.73779296875, -1.349609375, -0.96142578125, -0.5732421875, -0.18505859375, 0.203125, 0.59130859375, 0.9794921875, 1.36767578125, 1.755859375, 2.14404296875, 2.5322265625, 2.92041015625, 3.30859375, 3.69677734375, 4.0849609375, 4.47314453125, 4.861328125, 5.24951171875, 5.6376953125, 6.02587890625, 6.4140625, 6.80224609375, 7.1904296875, 7.57861328125, 7.966796875, 8.35498046875, 8.7431640625, 9.13134765625, 9.51953125, 9.90771484375, 10.2958984375, 10.68408203125, 11.072265625, 11.46044921875, 11.8486328125, 12.23681640625, 12.625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 5.0, 9.0, 13.0, 15.0, 12.0, 14.0, 26.0, 25.0, 31.0, 41.0, 39.0, 36.0, 54.0, 36.0, 31.0, 40.0, 44.0, 36.0, 48.0, 55.0, 46.0, 41.0, 44.0, 39.0, 27.0, 19.0, 28.0, 18.0, 22.0, 20.0, 17.0, 12.0, 10.0, 15.0, 8.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -13.949462890625, -13.38330078125, -12.817138671875, -12.2509765625, -11.684814453125, -11.11865234375, -10.552490234375, -9.986328125, -9.420166015625, -8.85400390625, -8.287841796875, -7.7216796875, -7.155517578125, -6.58935546875, -6.023193359375, -5.45703125, -4.890869140625, -4.32470703125, -3.758544921875, -3.1923828125, -2.626220703125, -2.06005859375, -1.493896484375, -0.927734375, -0.361572265625, 0.20458984375, 0.770751953125, 1.3369140625, 1.903076171875, 2.46923828125, 3.035400390625, 3.6015625, 4.167724609375, 4.73388671875, 5.300048828125, 5.8662109375, 6.432373046875, 6.99853515625, 7.564697265625, 8.130859375, 8.697021484375, 9.26318359375, 9.829345703125, 10.3955078125, 10.961669921875, 11.52783203125, 12.093994140625, 12.66015625, 13.226318359375, 13.79248046875, 14.358642578125, 14.9248046875, 15.490966796875, 16.05712890625, 16.623291015625, 17.189453125, 17.755615234375, 18.32177734375, 18.887939453125, 19.4541015625, 20.020263671875, 20.58642578125, 21.152587890625, 21.71875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 6.0, 18.0, 19.0, 41.0, 82.0, 113.0, 169.0, 311.0, 475.0, 736.0, 1169.0, 1885.0, 2834.0, 4386.0, 6632.0, 9853.0, 14481.0, 20949.0, 29346.0, 39861.0, 52376.0, 66198.0, 79680.0, 90352.0, 96493.0, 96657.0, 91579.0, 80764.0, 67831.0, 53932.0, 41518.0, 30446.0, 22122.0, 15147.0, 10300.0, 6947.0, 4567.0, 3025.0, 1917.0, 1204.0, 817.0, 488.0, 336.0, 179.0, 135.0, 61.0, 32.0, 35.0, 22.0, 11.0, 7.0, 9.0, 3.0, 0.0, 0.0, 1.0], "bins": [-11.453125, -11.106689453125, -10.76025390625, -10.413818359375, -10.0673828125, -9.720947265625, -9.37451171875, -9.028076171875, -8.681640625, -8.335205078125, -7.98876953125, -7.642333984375, -7.2958984375, -6.949462890625, -6.60302734375, -6.256591796875, -5.91015625, -5.563720703125, -5.21728515625, -4.870849609375, -4.5244140625, -4.177978515625, -3.83154296875, -3.485107421875, -3.138671875, -2.792236328125, -2.44580078125, -2.099365234375, -1.7529296875, -1.406494140625, -1.06005859375, -0.713623046875, -0.3671875, -0.020751953125, 0.32568359375, 0.672119140625, 1.0185546875, 1.364990234375, 1.71142578125, 2.057861328125, 2.404296875, 2.750732421875, 3.09716796875, 3.443603515625, 3.7900390625, 4.136474609375, 4.48291015625, 4.829345703125, 5.17578125, 5.522216796875, 5.86865234375, 6.215087890625, 6.5615234375, 6.907958984375, 7.25439453125, 7.600830078125, 7.947265625, 8.293701171875, 8.64013671875, 8.986572265625, 9.3330078125, 9.679443359375, 10.02587890625, 10.372314453125, 10.71875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 3.0, 5.0, 5.0, 5.0, 16.0, 5.0, 24.0, 13.0, 25.0, 26.0, 29.0, 35.0, 27.0, 48.0, 32.0, 45.0, 37.0, 41.0, 44.0, 46.0, 44.0, 42.0, 34.0, 38.0, 42.0, 30.0, 30.0, 37.0, 17.0, 19.0, 20.0, 20.0, 18.0, 10.0, 15.0, 13.0, 11.0, 6.0, 6.0, 3.0, 10.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-11.5546875, -11.2178955078125, -10.881103515625, -10.5443115234375, -10.20751953125, -9.8707275390625, -9.533935546875, -9.1971435546875, -8.8603515625, -8.5235595703125, -8.186767578125, -7.8499755859375, -7.51318359375, -7.1763916015625, -6.839599609375, -6.5028076171875, -6.166015625, -5.8292236328125, -5.492431640625, -5.1556396484375, -4.81884765625, -4.4820556640625, -4.145263671875, -3.8084716796875, -3.4716796875, -3.1348876953125, -2.798095703125, -2.4613037109375, -2.12451171875, -1.7877197265625, -1.450927734375, -1.1141357421875, -0.77734375, -0.4405517578125, -0.103759765625, 0.2330322265625, 0.56982421875, 0.9066162109375, 1.243408203125, 1.5802001953125, 1.9169921875, 2.2537841796875, 2.590576171875, 2.9273681640625, 3.26416015625, 3.6009521484375, 3.937744140625, 4.2745361328125, 4.611328125, 4.9481201171875, 5.284912109375, 5.6217041015625, 5.95849609375, 6.2952880859375, 6.632080078125, 6.9688720703125, 7.3056640625, 7.6424560546875, 7.979248046875, 8.3160400390625, 8.65283203125, 8.9896240234375, 9.326416015625, 9.6632080078125, 10.0]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 10.0, 10.0, 12.0, 23.0, 47.0, 71.0, 115.0, 177.0, 291.0, 407.0, 625.0, 1058.0, 1567.0, 2423.0, 3947.0, 5840.0, 9150.0, 13865.0, 20635.0, 29646.0, 41977.0, 56464.0, 72966.0, 88529.0, 100656.0, 105931.0, 103531.0, 93934.0, 79638.0, 62931.0, 47506.0, 34279.0, 23918.0, 15907.0, 10612.0, 7045.0, 4505.0, 2976.0, 1854.0, 1247.0, 774.0, 489.0, 338.0, 230.0, 143.0, 89.0, 54.0, 41.0, 23.0, 18.0, 15.0, 8.0, 14.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.5078125, -4.35601806640625, -4.2042236328125, -4.05242919921875, -3.900634765625, -3.74884033203125, -3.5970458984375, -3.44525146484375, -3.29345703125, -3.14166259765625, -2.9898681640625, -2.83807373046875, -2.686279296875, -2.53448486328125, -2.3826904296875, -2.23089599609375, -2.0791015625, -1.92730712890625, -1.7755126953125, -1.62371826171875, -1.471923828125, -1.32012939453125, -1.1683349609375, -1.01654052734375, -0.86474609375, -0.71295166015625, -0.5611572265625, -0.40936279296875, -0.257568359375, -0.10577392578125, 0.0460205078125, 0.19781494140625, 0.349609375, 0.50140380859375, 0.6531982421875, 0.80499267578125, 0.956787109375, 1.10858154296875, 1.2603759765625, 1.41217041015625, 1.56396484375, 1.71575927734375, 1.8675537109375, 2.01934814453125, 2.171142578125, 2.32293701171875, 2.4747314453125, 2.62652587890625, 2.7783203125, 2.93011474609375, 3.0819091796875, 3.23370361328125, 3.385498046875, 3.53729248046875, 3.6890869140625, 3.84088134765625, 3.99267578125, 4.14447021484375, 4.2962646484375, 4.44805908203125, 4.599853515625, 4.75164794921875, 4.9034423828125, 5.05523681640625, 5.20703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 3.0, 5.0, 10.0, 8.0, 7.0, 11.0, 11.0, 18.0, 23.0, 23.0, 16.0, 19.0, 27.0, 30.0, 38.0, 30.0, 38.0, 42.0, 29.0, 41.0, 34.0, 39.0, 31.0, 38.0, 45.0, 44.0, 46.0, 22.0, 26.0, 29.0, 27.0, 29.0, 20.0, 14.0, 17.0, 16.0, 20.0, 13.0, 7.0, 8.0, 7.0, 4.0, 2.0, 4.0, 2.0, 5.0, 1.0, 0.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0005383491516113281, -0.0005207434296607971, -0.0005031377077102661, -0.0004855319857597351, -0.0004679262638092041, -0.0004503205418586731, -0.0004327148199081421, -0.0004151090979576111, -0.0003975033760070801, -0.00037989765405654907, -0.00036229193210601807, -0.00034468621015548706, -0.00032708048820495605, -0.00030947476625442505, -0.00029186904430389404, -0.00027426332235336304, -0.00025665760040283203, -0.00023905187845230103, -0.00022144615650177002, -0.00020384043455123901, -0.000186234712600708, -0.000168628990650177, -0.000151023268699646, -0.000133417546749115, -0.00011581182479858398, -9.820610284805298e-05, -8.060038089752197e-05, -6.299465894699097e-05, -4.538893699645996e-05, -2.7783215045928955e-05, -1.017749309539795e-05, 7.428228855133057e-06, 2.5033950805664062e-05, 4.263967275619507e-05, 6.0245394706726074e-05, 7.785111665725708e-05, 9.545683860778809e-05, 0.00011306256055831909, 0.0001306682825088501, 0.0001482740044593811, 0.0001658797264099121, 0.00018348544836044312, 0.00020109117031097412, 0.00021869689226150513, 0.00023630261421203613, 0.00025390833616256714, 0.00027151405811309814, 0.00028911978006362915, 0.00030672550201416016, 0.00032433122396469116, 0.00034193694591522217, 0.0003595426678657532, 0.0003771483898162842, 0.0003947541117668152, 0.0004123598337173462, 0.0004299655556678772, 0.0004475712776184082, 0.0004651769995689392, 0.0004827827215194702, 0.0005003884434700012, 0.0005179941654205322, 0.0005355998873710632, 0.0005532056093215942, 0.0005708113312721252, 0.0005884170532226562]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 11.0, 11.0, 16.0, 18.0, 39.0, 64.0, 104.0, 176.0, 263.0, 393.0, 610.0, 1051.0, 1671.0, 2603.0, 4353.0, 6943.0, 10758.0, 16799.0, 25626.0, 37872.0, 53746.0, 72404.0, 91015.0, 106797.0, 114447.0, 112520.0, 100705.0, 83670.0, 65008.0, 46966.0, 32239.0, 21582.0, 14179.0, 8942.0, 5600.0, 3524.0, 2241.0, 1329.0, 834.0, 529.0, 317.0, 200.0, 144.0, 86.0, 59.0, 39.0, 20.0, 9.0, 8.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.9609375, -5.7791748046875, -5.597412109375, -5.4156494140625, -5.23388671875, -5.0521240234375, -4.870361328125, -4.6885986328125, -4.5068359375, -4.3250732421875, -4.143310546875, -3.9615478515625, -3.77978515625, -3.5980224609375, -3.416259765625, -3.2344970703125, -3.052734375, -2.8709716796875, -2.689208984375, -2.5074462890625, -2.32568359375, -2.1439208984375, -1.962158203125, -1.7803955078125, -1.5986328125, -1.4168701171875, -1.235107421875, -1.0533447265625, -0.87158203125, -0.6898193359375, -0.508056640625, -0.3262939453125, -0.14453125, 0.0372314453125, 0.218994140625, 0.4007568359375, 0.58251953125, 0.7642822265625, 0.946044921875, 1.1278076171875, 1.3095703125, 1.4913330078125, 1.673095703125, 1.8548583984375, 2.03662109375, 2.2183837890625, 2.400146484375, 2.5819091796875, 2.763671875, 2.9454345703125, 3.127197265625, 3.3089599609375, 3.49072265625, 3.6724853515625, 3.854248046875, 4.0360107421875, 4.2177734375, 4.3995361328125, 4.581298828125, 4.7630615234375, 4.94482421875, 5.1265869140625, 5.308349609375, 5.4901123046875, 5.671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 6.0, 3.0, 6.0, 8.0, 6.0, 16.0, 13.0, 23.0, 16.0, 18.0, 22.0, 32.0, 38.0, 40.0, 42.0, 36.0, 55.0, 51.0, 53.0, 48.0, 48.0, 43.0, 41.0, 43.0, 41.0, 45.0, 34.0, 21.0, 19.0, 25.0, 22.0, 14.0, 15.0, 18.0, 7.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.443359375, -2.36602783203125, -2.2886962890625, -2.21136474609375, -2.134033203125, -2.05670166015625, -1.9793701171875, -1.90203857421875, -1.82470703125, -1.74737548828125, -1.6700439453125, -1.59271240234375, -1.515380859375, -1.43804931640625, -1.3607177734375, -1.28338623046875, -1.2060546875, -1.12872314453125, -1.0513916015625, -0.97406005859375, -0.896728515625, -0.81939697265625, -0.7420654296875, -0.66473388671875, -0.58740234375, -0.51007080078125, -0.4327392578125, -0.35540771484375, -0.278076171875, -0.20074462890625, -0.1234130859375, -0.04608154296875, 0.03125, 0.10858154296875, 0.1859130859375, 0.26324462890625, 0.340576171875, 0.41790771484375, 0.4952392578125, 0.57257080078125, 0.64990234375, 0.72723388671875, 0.8045654296875, 0.88189697265625, 0.959228515625, 1.03656005859375, 1.1138916015625, 1.19122314453125, 1.2685546875, 1.34588623046875, 1.4232177734375, 1.50054931640625, 1.577880859375, 1.65521240234375, 1.7325439453125, 1.80987548828125, 1.88720703125, 1.96453857421875, 2.0418701171875, 2.11920166015625, 2.196533203125, 2.27386474609375, 2.3511962890625, 2.42852783203125, 2.505859375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 8.0, 11.0, 11.0, 10.0, 19.0, 26.0, 28.0, 25.0, 26.0, 36.0, 55.0, 54.0, 53.0, 49.0, 42.0, 47.0, 53.0, 45.0, 56.0, 54.0, 41.0, 36.0, 36.0, 33.0, 30.0, 17.0, 24.0, 17.0, 14.0, 6.0, 11.0, 5.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.304317474365234, -15.670007705688477, -15.035696983337402, -14.401386260986328, -13.76707649230957, -13.132766723632812, -12.498456001281738, -11.864145278930664, -11.229835510253906, -10.595525741577148, -9.961215019226074, -9.326904296875, -8.692594528198242, -8.058284759521484, -7.42397403717041, -6.789663791656494, -6.155353546142578, -5.521043300628662, -4.886733055114746, -4.25242280960083, -3.618112564086914, -2.983802318572998, -2.349492073059082, -1.715181827545166, -1.08087158203125, -0.446561336517334, 0.18774890899658203, 0.822059154510498, 1.456369400024414, 2.09067964553833, 2.724989891052246, 3.359300136566162, 3.993612289428711, 4.627922534942627, 5.262232780456543, 5.896543025970459, 6.530853271484375, 7.165163516998291, 7.799473762512207, 8.433784484863281, 9.068094253540039, 9.702404022216797, 10.336714744567871, 10.971025466918945, 11.605335235595703, 12.239645004272461, 12.873955726623535, 13.50826644897461, 14.142576217651367, 14.776885986328125, 15.4111967086792, 16.045507431030273, 16.67981719970703, 17.31412696838379, 17.948436737060547, 18.582748413085938, 19.217058181762695, 19.851367950439453, 20.485679626464844, 21.1199893951416, 21.75429916381836, 22.388608932495117, 23.022918701171875, 23.657230377197266, 24.291540145874023]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 13.0, 6.0, 22.0, 15.0, 17.0, 20.0, 25.0, 28.0, 26.0, 31.0, 32.0, 42.0, 35.0, 41.0, 34.0, 36.0, 33.0, 38.0, 37.0, 49.0, 44.0, 36.0, 36.0, 38.0, 42.0, 33.0, 26.0, 21.0, 27.0, 24.0, 19.0, 13.0, 14.0, 13.0, 9.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.219585418701172, -16.635934829711914, -16.052282333374023, -15.468631744384766, -14.884980201721191, -14.301328659057617, -13.71767807006836, -13.134026527404785, -12.550374984741211, -11.966723442077637, -11.383071899414062, -10.799421310424805, -10.21576976776123, -9.632118225097656, -9.048467636108398, -8.464816093444824, -7.88116455078125, -7.297513008117676, -6.71386194229126, -6.130210876464844, -5.5465593338012695, -4.962907791137695, -4.379256725311279, -3.7956056594848633, -3.211954116821289, -2.628302812576294, -2.044651508331299, -1.4610002040863037, -0.8773488998413086, -0.2936975955963135, 0.28995370864868164, 0.8736047744750977, 1.4572582244873047, 2.0409095287323, 2.624560832977295, 3.20821213722229, 3.791863441467285, 4.375514984130859, 4.959166049957275, 5.542817115783691, 6.126468658447266, 6.71012020111084, 7.293771266937256, 7.877422332763672, 8.461073875427246, 9.04472541809082, 9.628376007080078, 10.212027549743652, 10.795679092407227, 11.3793306350708, 11.962982177734375, 12.546632766723633, 13.130284309387207, 13.713935852050781, 14.297586441040039, 14.881237983703613, 15.464889526367188, 16.048540115356445, 16.632192611694336, 17.215843200683594, 17.799495697021484, 18.383146286010742, 18.966796875, 19.55044937133789, 20.13409996032715]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 6.0, 1.0, 6.0, 19.0, 24.0, 40.0, 59.0, 102.0, 161.0, 277.0, 429.0, 741.0, 1310.0, 2063.0, 3609.0, 5925.0, 10114.0, 17438.0, 29410.0, 49737.0, 83278.0, 134706.0, 210674.0, 310590.0, 418122.0, 509877.0, 548627.0, 516619.0, 430949.0, 323118.0, 221672.0, 143593.0, 87966.0, 53442.0, 32036.0, 18925.0, 11245.0, 6857.0, 4052.0, 2503.0, 1494.0, 881.0, 584.0, 378.0, 233.0, 140.0, 99.0, 60.0, 36.0, 25.0, 15.0, 10.0, 6.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.3046875, -13.8209228515625, -13.337158203125, -12.8533935546875, -12.36962890625, -11.8858642578125, -11.402099609375, -10.9183349609375, -10.4345703125, -9.9508056640625, -9.467041015625, -8.9832763671875, -8.49951171875, -8.0157470703125, -7.531982421875, -7.0482177734375, -6.564453125, -6.0806884765625, -5.596923828125, -5.1131591796875, -4.62939453125, -4.1456298828125, -3.661865234375, -3.1781005859375, -2.6943359375, -2.2105712890625, -1.726806640625, -1.2430419921875, -0.75927734375, -0.2755126953125, 0.208251953125, 0.6920166015625, 1.17578125, 1.6595458984375, 2.143310546875, 2.6270751953125, 3.11083984375, 3.5946044921875, 4.078369140625, 4.5621337890625, 5.0458984375, 5.5296630859375, 6.013427734375, 6.4971923828125, 6.98095703125, 7.4647216796875, 7.948486328125, 8.4322509765625, 8.916015625, 9.3997802734375, 9.883544921875, 10.3673095703125, 10.85107421875, 11.3348388671875, 11.818603515625, 12.3023681640625, 12.7861328125, 13.2698974609375, 13.753662109375, 14.2374267578125, 14.72119140625, 15.2049560546875, 15.688720703125, 16.1724853515625, 16.65625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 7.0, 12.0, 12.0, 16.0, 16.0, 21.0, 28.0, 23.0, 26.0, 25.0, 36.0, 37.0, 34.0, 43.0, 31.0, 36.0, 34.0, 38.0, 40.0, 43.0, 48.0, 41.0, 33.0, 39.0, 36.0, 39.0, 25.0, 33.0, 22.0, 24.0, 21.0, 17.0, 13.0, 14.0, 10.0, 7.0, 4.0, 5.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.59375, -15.0595703125, -14.525390625, -13.9912109375, -13.45703125, -12.9228515625, -12.388671875, -11.8544921875, -11.3203125, -10.7861328125, -10.251953125, -9.7177734375, -9.18359375, -8.6494140625, -8.115234375, -7.5810546875, -7.046875, -6.5126953125, -5.978515625, -5.4443359375, -4.91015625, -4.3759765625, -3.841796875, -3.3076171875, -2.7734375, -2.2392578125, -1.705078125, -1.1708984375, -0.63671875, -0.1025390625, 0.431640625, 0.9658203125, 1.5, 2.0341796875, 2.568359375, 3.1025390625, 3.63671875, 4.1708984375, 4.705078125, 5.2392578125, 5.7734375, 6.3076171875, 6.841796875, 7.3759765625, 7.91015625, 8.4443359375, 8.978515625, 9.5126953125, 10.046875, 10.5810546875, 11.115234375, 11.6494140625, 12.18359375, 12.7177734375, 13.251953125, 13.7861328125, 14.3203125, 14.8544921875, 15.388671875, 15.9228515625, 16.45703125, 16.9912109375, 17.525390625, 18.0595703125, 18.59375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 9.0, 6.0, 13.0, 18.0, 34.0, 72.0, 93.0, 154.0, 260.0, 462.0, 751.0, 1374.0, 2217.0, 4093.0, 6874.0, 12342.0, 22324.0, 39411.0, 69186.0, 116740.0, 189360.0, 290220.0, 404022.0, 510330.0, 564999.0, 546947.0, 462071.0, 348309.0, 237943.0, 151430.0, 90534.0, 52357.0, 30064.0, 17088.0, 9524.0, 5381.0, 2968.0, 1828.0, 972.0, 589.0, 359.0, 233.0, 119.0, 77.0, 42.0, 48.0, 22.0, 12.0, 8.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.46875, -16.918701171875, -16.36865234375, -15.818603515625, -15.2685546875, -14.718505859375, -14.16845703125, -13.618408203125, -13.068359375, -12.518310546875, -11.96826171875, -11.418212890625, -10.8681640625, -10.318115234375, -9.76806640625, -9.218017578125, -8.66796875, -8.117919921875, -7.56787109375, -7.017822265625, -6.4677734375, -5.917724609375, -5.36767578125, -4.817626953125, -4.267578125, -3.717529296875, -3.16748046875, -2.617431640625, -2.0673828125, -1.517333984375, -0.96728515625, -0.417236328125, 0.1328125, 0.682861328125, 1.23291015625, 1.782958984375, 2.3330078125, 2.883056640625, 3.43310546875, 3.983154296875, 4.533203125, 5.083251953125, 5.63330078125, 6.183349609375, 6.7333984375, 7.283447265625, 7.83349609375, 8.383544921875, 8.93359375, 9.483642578125, 10.03369140625, 10.583740234375, 11.1337890625, 11.683837890625, 12.23388671875, 12.783935546875, 13.333984375, 13.884033203125, 14.43408203125, 14.984130859375, 15.5341796875, 16.084228515625, 16.63427734375, 17.184326171875, 17.734375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 4.0, 3.0, 9.0, 13.0, 24.0, 29.0, 26.0, 42.0, 39.0, 58.0, 58.0, 60.0, 73.0, 96.0, 100.0, 111.0, 131.0, 154.0, 145.0, 164.0, 142.0, 181.0, 203.0, 201.0, 195.0, 201.0, 173.0, 165.0, 155.0, 129.0, 143.0, 119.0, 114.0, 111.0, 71.0, 89.0, 69.0, 51.0, 41.0, 37.0, 37.0, 24.0, 23.0, 13.0, 11.0, 10.0, 8.0, 2.0, 8.0, 2.0, 1.0, 3.0, 3.0, 2.0], "bins": [-7.08203125, -6.87255859375, -6.6630859375, -6.45361328125, -6.244140625, -6.03466796875, -5.8251953125, -5.61572265625, -5.40625, -5.19677734375, -4.9873046875, -4.77783203125, -4.568359375, -4.35888671875, -4.1494140625, -3.93994140625, -3.73046875, -3.52099609375, -3.3115234375, -3.10205078125, -2.892578125, -2.68310546875, -2.4736328125, -2.26416015625, -2.0546875, -1.84521484375, -1.6357421875, -1.42626953125, -1.216796875, -1.00732421875, -0.7978515625, -0.58837890625, -0.37890625, -0.16943359375, 0.0400390625, 0.24951171875, 0.458984375, 0.66845703125, 0.8779296875, 1.08740234375, 1.296875, 1.50634765625, 1.7158203125, 1.92529296875, 2.134765625, 2.34423828125, 2.5537109375, 2.76318359375, 2.97265625, 3.18212890625, 3.3916015625, 3.60107421875, 3.810546875, 4.02001953125, 4.2294921875, 4.43896484375, 4.6484375, 4.85791015625, 5.0673828125, 5.27685546875, 5.486328125, 5.69580078125, 5.9052734375, 6.11474609375, 6.32421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 3.0, 3.0, 9.0, 8.0, 10.0, 12.0, 21.0, 19.0, 30.0, 22.0, 31.0, 34.0, 32.0, 40.0, 47.0, 50.0, 42.0, 32.0, 40.0, 50.0, 41.0, 39.0, 48.0, 34.0, 33.0, 40.0, 20.0, 43.0, 22.0, 26.0, 20.0, 21.0, 17.0, 12.0, 4.0, 10.0, 7.0, 4.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.365427017211914, -16.807409286499023, -16.249391555786133, -15.691372871398926, -15.133354187011719, -14.575336456298828, -14.017318725585938, -13.459300994873047, -12.90128231048584, -12.34326457977295, -11.785245895385742, -11.227228164672852, -10.669210433959961, -10.111191749572754, -9.553174018859863, -8.995155334472656, -8.437137603759766, -7.879119396209717, -7.321101188659668, -6.763083457946777, -6.2050652503967285, -5.64704704284668, -5.089029312133789, -4.53101110458374, -3.9729928970336914, -3.4149746894836426, -2.856956720352173, -2.298938751220703, -1.7409205436706543, -1.1829023361206055, -0.6248843669891357, -0.06686639785766602, 0.4911518096923828, 1.049169898033142, 1.6071879863739014, 2.165205955505371, 2.72322416305542, 3.2812423706054688, 3.8392603397369385, 4.397278308868408, 4.955296516418457, 5.513314723968506, 6.071332931518555, 6.629350662231445, 7.187368869781494, 7.745387077331543, 8.303404808044434, 8.86142349243164, 9.419441223144531, 9.977458953857422, 10.535477638244629, 11.09349536895752, 11.651514053344727, 12.209531784057617, 12.767549514770508, 13.325567245483398, 13.883585929870605, 14.441603660583496, 14.999622344970703, 15.557640075683594, 16.115657806396484, 16.673675537109375, 17.2316951751709, 17.78971290588379, 18.34773063659668]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 8.0, 17.0, 19.0, 18.0, 22.0, 36.0, 23.0, 35.0, 39.0, 31.0, 39.0, 35.0, 38.0, 38.0, 47.0, 50.0, 41.0, 45.0, 44.0, 36.0, 33.0, 45.0, 29.0, 35.0, 31.0, 29.0, 24.0, 19.0, 24.0, 15.0, 15.0, 10.0, 5.0, 5.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.64324188232422, -20.98698616027832, -20.330730438232422, -19.674476623535156, -19.018220901489258, -18.36196517944336, -17.70570945739746, -17.049453735351562, -16.393198013305664, -15.736942291259766, -15.080687522888184, -14.424431800842285, -13.768176078796387, -13.111921310424805, -12.455665588378906, -11.799409866333008, -11.143155097961426, -10.486899375915527, -9.830644607543945, -9.174388885498047, -8.518133163452148, -7.861877918243408, -7.205622673034668, -6.5493669509887695, -5.893111705780029, -5.236856460571289, -4.580600738525391, -3.9243454933166504, -3.268090009689331, -2.6118345260620117, -1.9555792808532715, -1.299323558807373, -0.6430683135986328, 0.013187110424041748, 0.6694425344467163, 1.325697898864746, 1.9819533824920654, 2.6382088661193848, 3.294464111328125, 3.9507198333740234, 4.606975078582764, 5.263230323791504, 5.919486045837402, 6.575741291046143, 7.231996536254883, 7.888252258300781, 8.54450798034668, 9.200763702392578, 9.85701847076416, 10.513274192810059, 11.16952896118164, 11.825784683227539, 12.482040405273438, 13.138296127319336, 13.794550895690918, 14.450806617736816, 15.107061386108398, 15.763317108154297, 16.419572830200195, 17.075828552246094, 17.73208236694336, 18.388338088989258, 19.044593811035156, 19.700849533081055, 20.357105255126953]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 11.0, 22.0, 20.0, 37.0, 57.0, 103.0, 169.0, 315.0, 458.0, 830.0, 1378.0, 2333.0, 3888.0, 6692.0, 10742.0, 17758.0, 29311.0, 46079.0, 71009.0, 102248.0, 134077.0, 150610.0, 141282.0, 111604.0, 79406.0, 52601.0, 33245.0, 20572.0, 12616.0, 7840.0, 4604.0, 2712.0, 1662.0, 908.0, 573.0, 318.0, 187.0, 120.0, 49.0, 36.0, 20.0, 14.0, 11.0, 13.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.396484375, -3.2955322265625, -3.194580078125, -3.0936279296875, -2.99267578125, -2.8917236328125, -2.790771484375, -2.6898193359375, -2.5888671875, -2.4879150390625, -2.386962890625, -2.2860107421875, -2.18505859375, -2.0841064453125, -1.983154296875, -1.8822021484375, -1.78125, -1.6802978515625, -1.579345703125, -1.4783935546875, -1.37744140625, -1.2764892578125, -1.175537109375, -1.0745849609375, -0.9736328125, -0.8726806640625, -0.771728515625, -0.6707763671875, -0.56982421875, -0.4688720703125, -0.367919921875, -0.2669677734375, -0.166015625, -0.0650634765625, 0.035888671875, 0.1368408203125, 0.23779296875, 0.3387451171875, 0.439697265625, 0.5406494140625, 0.6416015625, 0.7425537109375, 0.843505859375, 0.9444580078125, 1.04541015625, 1.1463623046875, 1.247314453125, 1.3482666015625, 1.44921875, 1.5501708984375, 1.651123046875, 1.7520751953125, 1.85302734375, 1.9539794921875, 2.054931640625, 2.1558837890625, 2.2568359375, 2.3577880859375, 2.458740234375, 2.5596923828125, 2.66064453125, 2.7615966796875, 2.862548828125, 2.9635009765625, 3.064453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 8.0, 17.0, 19.0, 18.0, 23.0, 37.0, 21.0, 36.0, 39.0, 30.0, 39.0, 33.0, 39.0, 40.0, 47.0, 49.0, 41.0, 45.0, 43.0, 38.0, 34.0, 44.0, 31.0, 33.0, 31.0, 29.0, 23.0, 22.0, 21.0, 15.0, 17.0, 8.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.71875, -21.06005859375, -20.4013671875, -19.74267578125, -19.083984375, -18.42529296875, -17.7666015625, -17.10791015625, -16.44921875, -15.79052734375, -15.1318359375, -14.47314453125, -13.814453125, -13.15576171875, -12.4970703125, -11.83837890625, -11.1796875, -10.52099609375, -9.8623046875, -9.20361328125, -8.544921875, -7.88623046875, -7.2275390625, -6.56884765625, -5.91015625, -5.25146484375, -4.5927734375, -3.93408203125, -3.275390625, -2.61669921875, -1.9580078125, -1.29931640625, -0.640625, 0.01806640625, 0.6767578125, 1.33544921875, 1.994140625, 2.65283203125, 3.3115234375, 3.97021484375, 4.62890625, 5.28759765625, 5.9462890625, 6.60498046875, 7.263671875, 7.92236328125, 8.5810546875, 9.23974609375, 9.8984375, 10.55712890625, 11.2158203125, 11.87451171875, 12.533203125, 13.19189453125, 13.8505859375, 14.50927734375, 15.16796875, 15.82666015625, 16.4853515625, 17.14404296875, 17.802734375, 18.46142578125, 19.1201171875, 19.77880859375, 20.4375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 14.0, 18.0, 24.0, 47.0, 58.0, 84.0, 137.0, 197.0, 338.0, 493.0, 833.0, 1335.0, 2125.0, 3423.0, 5729.0, 9450.0, 16209.0, 31707.0, 295619.0, 597126.0, 38278.0, 18552.0, 10534.0, 6214.0, 3781.0, 2273.0, 1453.0, 898.0, 571.0, 388.0, 210.0, 131.0, 93.0, 68.0, 38.0, 33.0, 18.0, 17.0, 14.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -5.9974365234375, -5.776123046875, -5.5548095703125, -5.33349609375, -5.1121826171875, -4.890869140625, -4.6695556640625, -4.4482421875, -4.2269287109375, -4.005615234375, -3.7843017578125, -3.56298828125, -3.3416748046875, -3.120361328125, -2.8990478515625, -2.677734375, -2.4564208984375, -2.235107421875, -2.0137939453125, -1.79248046875, -1.5711669921875, -1.349853515625, -1.1285400390625, -0.9072265625, -0.6859130859375, -0.464599609375, -0.2432861328125, -0.02197265625, 0.1993408203125, 0.420654296875, 0.6419677734375, 0.86328125, 1.0845947265625, 1.305908203125, 1.5272216796875, 1.74853515625, 1.9698486328125, 2.191162109375, 2.4124755859375, 2.6337890625, 2.8551025390625, 3.076416015625, 3.2977294921875, 3.51904296875, 3.7403564453125, 3.961669921875, 4.1829833984375, 4.404296875, 4.6256103515625, 4.846923828125, 5.0682373046875, 5.28955078125, 5.5108642578125, 5.732177734375, 5.9534912109375, 6.1748046875, 6.3961181640625, 6.617431640625, 6.8387451171875, 7.06005859375, 7.2813720703125, 7.502685546875, 7.7239990234375, 7.9453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 12.0, 8.0, 8.0, 15.0, 12.0, 8.0, 21.0, 29.0, 28.0, 29.0, 45.0, 38.0, 38.0, 45.0, 33.0, 43.0, 53.0, 49.0, 47.0, 50.0, 42.0, 33.0, 27.0, 31.0, 30.0, 38.0, 30.0, 28.0, 24.0, 12.0, 22.0, 17.0, 10.0, 10.0, 3.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.4921875, -14.0631103515625, -13.634033203125, -13.2049560546875, -12.77587890625, -12.3468017578125, -11.917724609375, -11.4886474609375, -11.0595703125, -10.6304931640625, -10.201416015625, -9.7723388671875, -9.34326171875, -8.9141845703125, -8.485107421875, -8.0560302734375, -7.626953125, -7.1978759765625, -6.768798828125, -6.3397216796875, -5.91064453125, -5.4815673828125, -5.052490234375, -4.6234130859375, -4.1943359375, -3.7652587890625, -3.336181640625, -2.9071044921875, -2.47802734375, -2.0489501953125, -1.619873046875, -1.1907958984375, -0.76171875, -0.3326416015625, 0.096435546875, 0.5255126953125, 0.95458984375, 1.3836669921875, 1.812744140625, 2.2418212890625, 2.6708984375, 3.0999755859375, 3.529052734375, 3.9581298828125, 4.38720703125, 4.8162841796875, 5.245361328125, 5.6744384765625, 6.103515625, 6.5325927734375, 6.961669921875, 7.3907470703125, 7.81982421875, 8.2489013671875, 8.677978515625, 9.1070556640625, 9.5361328125, 9.9652099609375, 10.394287109375, 10.8233642578125, 11.25244140625, 11.6815185546875, 12.110595703125, 12.5396728515625, 12.96875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 5.0, 9.0, 11.0, 15.0, 16.0, 34.0, 37.0, 43.0, 62.0, 121.0, 147.0, 199.0, 280.0, 451.0, 616.0, 931.0, 1319.0, 1963.0, 3149.0, 4866.0, 7063.0, 11170.0, 17711.0, 29397.0, 320520.0, 562504.0, 32418.0, 18903.0, 11904.0, 7624.0, 4808.0, 3429.0, 2276.0, 1497.0, 942.0, 642.0, 468.0, 298.0, 198.0, 154.0, 110.0, 72.0, 50.0, 38.0, 17.0, 18.0, 17.0, 13.0, 5.0, 7.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0], "bins": [-0.5634765625, -0.5464401245117188, -0.5294036865234375, -0.5123672485351562, -0.495330810546875, -0.47829437255859375, -0.4612579345703125, -0.44422149658203125, -0.42718505859375, -0.41014862060546875, -0.3931121826171875, -0.37607574462890625, -0.359039306640625, -0.34200286865234375, -0.3249664306640625, -0.30792999267578125, -0.2908935546875, -0.27385711669921875, -0.2568206787109375, -0.23978424072265625, -0.222747802734375, -0.20571136474609375, -0.1886749267578125, -0.17163848876953125, -0.15460205078125, -0.13756561279296875, -0.1205291748046875, -0.10349273681640625, -0.086456298828125, -0.06941986083984375, -0.0523834228515625, -0.03534698486328125, -0.018310546875, -0.00127410888671875, 0.0157623291015625, 0.03279876708984375, 0.049835205078125, 0.06687164306640625, 0.0839080810546875, 0.10094451904296875, 0.11798095703125, 0.13501739501953125, 0.1520538330078125, 0.16909027099609375, 0.186126708984375, 0.20316314697265625, 0.2201995849609375, 0.23723602294921875, 0.2542724609375, 0.27130889892578125, 0.2883453369140625, 0.30538177490234375, 0.322418212890625, 0.33945465087890625, 0.3564910888671875, 0.37352752685546875, 0.39056396484375, 0.40760040283203125, 0.4246368408203125, 0.44167327880859375, 0.458709716796875, 0.47574615478515625, 0.4927825927734375, 0.5098190307617188, 0.52685546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 9.0, 6.0, 14.0, 15.0, 16.0, 26.0, 25.0, 30.0, 40.0, 27.0, 33.0, 43.0, 46.0, 47.0, 65.0, 53.0, 55.0, 53.0, 51.0, 35.0, 36.0, 33.0, 42.0, 31.0, 32.0, 27.0, 16.0, 19.0, 15.0, 13.0, 10.0, 8.0, 4.0, 7.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.806020736694336e-05, -1.7337501049041748e-05, -1.6614794731140137e-05, -1.5892088413238525e-05, -1.5169382095336914e-05, -1.4446675777435303e-05, -1.3723969459533691e-05, -1.300126314163208e-05, -1.2278556823730469e-05, -1.1555850505828857e-05, -1.0833144187927246e-05, -1.0110437870025635e-05, -9.387731552124023e-06, -8.665025234222412e-06, -7.9423189163208e-06, -7.2196125984191895e-06, -6.496906280517578e-06, -5.774199962615967e-06, -5.0514936447143555e-06, -4.328787326812744e-06, -3.606081008911133e-06, -2.8833746910095215e-06, -2.16066837310791e-06, -1.4379620552062988e-06, -7.152557373046875e-07, 7.450580596923828e-09, 7.301568984985352e-07, 1.4528632164001465e-06, 2.175569534301758e-06, 2.898275852203369e-06, 3.6209821701049805e-06, 4.343688488006592e-06, 5.066394805908203e-06, 5.7891011238098145e-06, 6.511807441711426e-06, 7.234513759613037e-06, 7.957220077514648e-06, 8.67992639541626e-06, 9.402632713317871e-06, 1.0125339031219482e-05, 1.0848045349121094e-05, 1.1570751667022705e-05, 1.2293457984924316e-05, 1.3016164302825928e-05, 1.3738870620727539e-05, 1.446157693862915e-05, 1.5184283256530762e-05, 1.5906989574432373e-05, 1.6629695892333984e-05, 1.7352402210235596e-05, 1.8075108528137207e-05, 1.879781484603882e-05, 1.952052116394043e-05, 2.024322748184204e-05, 2.0965933799743652e-05, 2.1688640117645264e-05, 2.2411346435546875e-05, 2.3134052753448486e-05, 2.3856759071350098e-05, 2.457946538925171e-05, 2.530217170715332e-05, 2.602487802505493e-05, 2.6747584342956543e-05, 2.7470290660858154e-05, 2.8192996978759766e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 15.0, 21.0, 16.0, 54.0, 68.0, 98.0, 164.0, 245.0, 395.0, 657.0, 991.0, 1654.0, 2684.0, 4121.0, 6520.0, 10136.0, 16386.0, 25182.0, 39243.0, 60391.0, 89513.0, 125660.0, 155540.0, 151372.0, 118591.0, 83568.0, 55677.0, 36333.0, 23012.0, 14677.0, 9211.0, 6087.0, 3942.0, 2397.0, 1443.0, 940.0, 591.0, 366.0, 203.0, 148.0, 88.0, 47.0, 28.0, 21.0, 15.0, 13.0, 10.0, 1.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.56103515625, -0.5434494018554688, -0.5258636474609375, -0.5082778930664062, -0.490692138671875, -0.47310638427734375, -0.4555206298828125, -0.43793487548828125, -0.42034912109375, -0.40276336669921875, -0.3851776123046875, -0.36759185791015625, -0.350006103515625, -0.33242034912109375, -0.3148345947265625, -0.29724884033203125, -0.2796630859375, -0.26207733154296875, -0.2444915771484375, -0.22690582275390625, -0.209320068359375, -0.19173431396484375, -0.1741485595703125, -0.15656280517578125, -0.13897705078125, -0.12139129638671875, -0.1038055419921875, -0.08621978759765625, -0.068634033203125, -0.05104827880859375, -0.0334625244140625, -0.01587677001953125, 0.001708984375, 0.01929473876953125, 0.0368804931640625, 0.05446624755859375, 0.072052001953125, 0.08963775634765625, 0.1072235107421875, 0.12480926513671875, 0.14239501953125, 0.15998077392578125, 0.1775665283203125, 0.19515228271484375, 0.212738037109375, 0.23032379150390625, 0.2479095458984375, 0.26549530029296875, 0.2830810546875, 0.30066680908203125, 0.3182525634765625, 0.33583831787109375, 0.353424072265625, 0.37100982666015625, 0.3885955810546875, 0.40618133544921875, 0.42376708984375, 0.44135284423828125, 0.4589385986328125, 0.47652435302734375, 0.494110107421875, 0.5116958618164062, 0.5292816162109375, 0.5468673706054688, 0.564453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 3.0, 7.0, 4.0, 7.0, 9.0, 13.0, 22.0, 12.0, 14.0, 29.0, 22.0, 39.0, 39.0, 57.0, 60.0, 56.0, 63.0, 78.0, 70.0, 46.0, 62.0, 38.0, 47.0, 34.0, 32.0, 24.0, 22.0, 19.0, 15.0, 13.0, 7.0, 4.0, 10.0, 3.0, 2.0, 4.0, 3.0, 9.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2327880859375, -0.22540283203125, -0.218017578125, -0.21063232421875, -0.2032470703125, -0.19586181640625, -0.1884765625, -0.18109130859375, -0.1737060546875, -0.16632080078125, -0.158935546875, -0.15155029296875, -0.1441650390625, -0.13677978515625, -0.12939453125, -0.12200927734375, -0.1146240234375, -0.10723876953125, -0.099853515625, -0.09246826171875, -0.0850830078125, -0.07769775390625, -0.0703125, -0.06292724609375, -0.0555419921875, -0.04815673828125, -0.040771484375, -0.03338623046875, -0.0260009765625, -0.01861572265625, -0.01123046875, -0.00384521484375, 0.0035400390625, 0.01092529296875, 0.018310546875, 0.02569580078125, 0.0330810546875, 0.04046630859375, 0.0478515625, 0.05523681640625, 0.0626220703125, 0.07000732421875, 0.077392578125, 0.08477783203125, 0.0921630859375, 0.09954833984375, 0.10693359375, 0.11431884765625, 0.1217041015625, 0.12908935546875, 0.136474609375, 0.14385986328125, 0.1512451171875, 0.15863037109375, 0.166015625, 0.17340087890625, 0.1807861328125, 0.18817138671875, 0.195556640625, 0.20294189453125, 0.2103271484375, 0.21771240234375, 0.22509765625, 0.23248291015625, 0.2398681640625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 3.0, 5.0, 3.0, 11.0, 9.0, 14.0, 13.0, 21.0, 23.0, 22.0, 30.0, 32.0, 29.0, 38.0, 48.0, 40.0, 45.0, 39.0, 39.0, 35.0, 50.0, 33.0, 50.0, 43.0, 30.0, 37.0, 37.0, 33.0, 27.0, 18.0, 27.0, 25.0, 14.0, 17.0, 11.0, 7.0, 11.0, 5.0, 5.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.92188262939453, -16.3713321685791, -15.820782661437988, -15.270232200622559, -14.719682693481445, -14.169132232666016, -13.618581771850586, -13.068031311035156, -12.517481803894043, -11.966931343078613, -11.4163818359375, -10.86583137512207, -10.31528091430664, -9.764731407165527, -9.214180946350098, -8.663631439208984, -8.113080978393555, -7.562530994415283, -7.011981010437012, -6.461430549621582, -5.9108805656433105, -5.360330581665039, -4.809780120849609, -4.259230136871338, -3.7086801528930664, -3.158130168914795, -2.6075799465179443, -2.0570297241210938, -1.5064797401428223, -0.9559297561645508, -0.4053795337677002, 0.1451706886291504, 0.6957187652587891, 1.24626886844635, 1.7968189716339111, 2.3473691940307617, 2.897919178009033, 3.4484691619873047, 3.9990193843841553, 4.549569606781006, 5.100119590759277, 5.650669574737549, 6.20121955871582, 6.75177001953125, 7.3023200035095215, 7.852869987487793, 8.403420448303223, 8.953969955444336, 9.504520416259766, 10.055070877075195, 10.605620384216309, 11.156170845031738, 11.706720352172852, 12.257270812988281, 12.807821273803711, 13.35837173461914, 13.908921241760254, 14.459471702575684, 15.010021209716797, 15.560571670532227, 16.111122131347656, 16.661670684814453, 17.212221145629883, 17.762771606445312, 18.313322067260742]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 9.0, 7.0, 17.0, 19.0, 20.0, 20.0, 38.0, 21.0, 37.0, 38.0, 29.0, 41.0, 32.0, 41.0, 37.0, 43.0, 51.0, 44.0, 45.0, 40.0, 41.0, 34.0, 43.0, 32.0, 31.0, 32.0, 27.0, 24.0, 21.0, 22.0, 16.0, 16.0, 9.0, 6.0, 4.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.68993377685547, -21.03296661376953, -20.375999450683594, -19.719032287597656, -19.06206512451172, -18.40509796142578, -17.748130798339844, -17.091163635253906, -16.43419647216797, -15.777229309082031, -15.120262145996094, -14.463294982910156, -13.806327819824219, -13.149360656738281, -12.492393493652344, -11.835426330566406, -11.178460121154785, -10.521492958068848, -9.86452579498291, -9.207558631896973, -8.550591468811035, -7.893624305725098, -7.236657619476318, -6.579690456390381, -5.922723293304443, -5.265756130218506, -4.608788967132568, -3.95182204246521, -3.2948548793792725, -2.637887716293335, -1.9809207916259766, -1.323953628540039, -0.6669864654541016, -0.010019361972808838, 0.6469477415084839, 1.3039147853851318, 1.9608819484710693, 2.617849111557007, 3.2748160362243652, 3.9317831993103027, 4.58875036239624, 5.245717525482178, 5.902684688568115, 6.5596513748168945, 7.216618537902832, 7.8735857009887695, 8.530552864074707, 9.187520027160645, 9.844487190246582, 10.50145435333252, 11.158421516418457, 11.815388679504395, 12.472355842590332, 13.12932300567627, 13.78628921508789, 14.443256378173828, 15.100223541259766, 15.757190704345703, 16.41415786743164, 17.071125030517578, 17.728092193603516, 18.385059356689453, 19.04202651977539, 19.698993682861328, 20.355960845947266]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 9.0, 14.0, 23.0, 32.0, 55.0, 96.0, 152.0, 226.0, 340.0, 548.0, 1010.0, 1548.0, 2396.0, 3775.0, 5978.0, 9169.0, 13617.0, 19853.0, 28497.0, 38880.0, 52197.0, 66791.0, 80366.0, 91256.0, 97989.0, 97979.0, 93565.0, 82487.0, 68880.0, 54945.0, 41867.0, 30798.0, 21193.0, 14668.0, 9915.0, 6273.0, 4013.0, 2681.0, 1644.0, 1069.0, 672.0, 384.0, 257.0, 165.0, 118.0, 61.0, 36.0, 29.0, 17.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.1015625, -11.71240234375, -11.3232421875, -10.93408203125, -10.544921875, -10.15576171875, -9.7666015625, -9.37744140625, -8.98828125, -8.59912109375, -8.2099609375, -7.82080078125, -7.431640625, -7.04248046875, -6.6533203125, -6.26416015625, -5.875, -5.48583984375, -5.0966796875, -4.70751953125, -4.318359375, -3.92919921875, -3.5400390625, -3.15087890625, -2.76171875, -2.37255859375, -1.9833984375, -1.59423828125, -1.205078125, -0.81591796875, -0.4267578125, -0.03759765625, 0.3515625, 0.74072265625, 1.1298828125, 1.51904296875, 1.908203125, 2.29736328125, 2.6865234375, 3.07568359375, 3.46484375, 3.85400390625, 4.2431640625, 4.63232421875, 5.021484375, 5.41064453125, 5.7998046875, 6.18896484375, 6.578125, 6.96728515625, 7.3564453125, 7.74560546875, 8.134765625, 8.52392578125, 8.9130859375, 9.30224609375, 9.69140625, 10.08056640625, 10.4697265625, 10.85888671875, 11.248046875, 11.63720703125, 12.0263671875, 12.41552734375, 12.8046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 12.0, 12.0, 21.0, 20.0, 20.0, 34.0, 23.0, 35.0, 43.0, 32.0, 38.0, 32.0, 38.0, 42.0, 44.0, 48.0, 47.0, 43.0, 39.0, 40.0, 35.0, 47.0, 29.0, 35.0, 32.0, 24.0, 23.0, 22.0, 22.0, 18.0, 12.0, 11.0, 5.0, 3.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.0, -20.362548828125, -19.72509765625, -19.087646484375, -18.4501953125, -17.812744140625, -17.17529296875, -16.537841796875, -15.900390625, -15.262939453125, -14.62548828125, -13.988037109375, -13.3505859375, -12.713134765625, -12.07568359375, -11.438232421875, -10.80078125, -10.163330078125, -9.52587890625, -8.888427734375, -8.2509765625, -7.613525390625, -6.97607421875, -6.338623046875, -5.701171875, -5.063720703125, -4.42626953125, -3.788818359375, -3.1513671875, -2.513916015625, -1.87646484375, -1.239013671875, -0.6015625, 0.035888671875, 0.67333984375, 1.310791015625, 1.9482421875, 2.585693359375, 3.22314453125, 3.860595703125, 4.498046875, 5.135498046875, 5.77294921875, 6.410400390625, 7.0478515625, 7.685302734375, 8.32275390625, 8.960205078125, 9.59765625, 10.235107421875, 10.87255859375, 11.510009765625, 12.1474609375, 12.784912109375, 13.42236328125, 14.059814453125, 14.697265625, 15.334716796875, 15.97216796875, 16.609619140625, 17.2470703125, 17.884521484375, 18.52197265625, 19.159423828125, 19.796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 12.0, 15.0, 21.0, 40.0, 59.0, 100.0, 170.0, 249.0, 410.0, 648.0, 1127.0, 1728.0, 2995.0, 4523.0, 7190.0, 11108.0, 16643.0, 24416.0, 34742.0, 47413.0, 62172.0, 77512.0, 91386.0, 99675.0, 102630.0, 98197.0, 87870.0, 73960.0, 59360.0, 44927.0, 31962.0, 22310.0, 15347.0, 10065.0, 6528.0, 4137.0, 2554.0, 1683.0, 1087.0, 644.0, 390.0, 219.0, 125.0, 87.0, 52.0, 23.0, 15.0, 14.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.955078125, -11.57421875, -11.193359375, -10.8125, -10.431640625, -10.05078125, -9.669921875, -9.2890625, -8.908203125, -8.52734375, -8.146484375, -7.765625, -7.384765625, -7.00390625, -6.623046875, -6.2421875, -5.861328125, -5.48046875, -5.099609375, -4.71875, -4.337890625, -3.95703125, -3.576171875, -3.1953125, -2.814453125, -2.43359375, -2.052734375, -1.671875, -1.291015625, -0.91015625, -0.529296875, -0.1484375, 0.232421875, 0.61328125, 0.994140625, 1.375, 1.755859375, 2.13671875, 2.517578125, 2.8984375, 3.279296875, 3.66015625, 4.041015625, 4.421875, 4.802734375, 5.18359375, 5.564453125, 5.9453125, 6.326171875, 6.70703125, 7.087890625, 7.46875, 7.849609375, 8.23046875, 8.611328125, 8.9921875, 9.373046875, 9.75390625, 10.134765625, 10.515625, 10.896484375, 11.27734375, 11.658203125, 12.0390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 11.0, 14.0, 15.0, 22.0, 22.0, 22.0, 27.0, 30.0, 32.0, 27.0, 37.0, 43.0, 31.0, 43.0, 49.0, 61.0, 41.0, 36.0, 48.0, 39.0, 37.0, 40.0, 36.0, 24.0, 26.0, 19.0, 27.0, 20.0, 23.0, 16.0, 16.0, 14.0, 10.0, 5.0, 5.0, 3.0, 5.0, 7.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.640625, -11.2449951171875, -10.849365234375, -10.4537353515625, -10.05810546875, -9.6624755859375, -9.266845703125, -8.8712158203125, -8.4755859375, -8.0799560546875, -7.684326171875, -7.2886962890625, -6.89306640625, -6.4974365234375, -6.101806640625, -5.7061767578125, -5.310546875, -4.9149169921875, -4.519287109375, -4.1236572265625, -3.72802734375, -3.3323974609375, -2.936767578125, -2.5411376953125, -2.1455078125, -1.7498779296875, -1.354248046875, -0.9586181640625, -0.56298828125, -0.1673583984375, 0.228271484375, 0.6239013671875, 1.01953125, 1.4151611328125, 1.810791015625, 2.2064208984375, 2.60205078125, 2.9976806640625, 3.393310546875, 3.7889404296875, 4.1845703125, 4.5802001953125, 4.975830078125, 5.3714599609375, 5.76708984375, 6.1627197265625, 6.558349609375, 6.9539794921875, 7.349609375, 7.7452392578125, 8.140869140625, 8.5364990234375, 8.93212890625, 9.3277587890625, 9.723388671875, 10.1190185546875, 10.5146484375, 10.9102783203125, 11.305908203125, 11.7015380859375, 12.09716796875, 12.4927978515625, 12.888427734375, 13.2840576171875, 13.6796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 10.0, 12.0, 20.0, 30.0, 41.0, 62.0, 111.0, 158.0, 321.0, 453.0, 734.0, 1183.0, 1794.0, 2908.0, 4596.0, 7214.0, 10940.0, 16250.0, 24170.0, 34507.0, 47299.0, 62390.0, 77281.0, 91070.0, 100103.0, 103260.0, 99180.0, 87970.0, 73811.0, 59192.0, 44631.0, 32052.0, 22460.0, 14857.0, 9792.0, 6512.0, 4107.0, 2694.0, 1612.0, 1073.0, 647.0, 387.0, 235.0, 162.0, 101.0, 71.0, 38.0, 25.0, 17.0, 7.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.77734375, -4.60906982421875, -4.4407958984375, -4.27252197265625, -4.104248046875, -3.93597412109375, -3.7677001953125, -3.59942626953125, -3.43115234375, -3.26287841796875, -3.0946044921875, -2.92633056640625, -2.758056640625, -2.58978271484375, -2.4215087890625, -2.25323486328125, -2.0849609375, -1.91668701171875, -1.7484130859375, -1.58013916015625, -1.411865234375, -1.24359130859375, -1.0753173828125, -0.90704345703125, -0.73876953125, -0.57049560546875, -0.4022216796875, -0.23394775390625, -0.065673828125, 0.10260009765625, 0.2708740234375, 0.43914794921875, 0.607421875, 0.77569580078125, 0.9439697265625, 1.11224365234375, 1.280517578125, 1.44879150390625, 1.6170654296875, 1.78533935546875, 1.95361328125, 2.12188720703125, 2.2901611328125, 2.45843505859375, 2.626708984375, 2.79498291015625, 2.9632568359375, 3.13153076171875, 3.2998046875, 3.46807861328125, 3.6363525390625, 3.80462646484375, 3.972900390625, 4.14117431640625, 4.3094482421875, 4.47772216796875, 4.64599609375, 4.81427001953125, 4.9825439453125, 5.15081787109375, 5.319091796875, 5.48736572265625, 5.6556396484375, 5.82391357421875, 5.9921875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 9.0, 10.0, 10.0, 8.0, 8.0, 13.0, 9.0, 17.0, 21.0, 25.0, 25.0, 23.0, 33.0, 44.0, 33.0, 37.0, 33.0, 57.0, 49.0, 47.0, 42.0, 49.0, 47.0, 40.0, 43.0, 39.0, 32.0, 28.0, 31.0, 28.0, 20.0, 11.0, 18.0, 10.0, 11.0, 4.0, 8.0, 2.0, 7.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00074005126953125, -0.0007163435220718384, -0.0006926357746124268, -0.0006689280271530151, -0.0006452202796936035, -0.0006215125322341919, -0.0005978047847747803, -0.0005740970373153687, -0.000550389289855957, -0.0005266815423965454, -0.0005029737949371338, -0.00047926604747772217, -0.00045555830001831055, -0.0004318505525588989, -0.0004081428050994873, -0.0003844350576400757, -0.00036072731018066406, -0.00033701956272125244, -0.0003133118152618408, -0.0002896040678024292, -0.0002658963203430176, -0.00024218857288360596, -0.00021848082542419434, -0.00019477307796478271, -0.0001710653305053711, -0.00014735758304595947, -0.00012364983558654785, -9.994208812713623e-05, -7.623434066772461e-05, -5.252659320831299e-05, -2.8818845748901367e-05, -5.111098289489746e-06, 1.8596649169921875e-05, 4.2304396629333496e-05, 6.601214408874512e-05, 8.971989154815674e-05, 0.00011342763900756836, 0.00013713538646697998, 0.0001608431339263916, 0.00018455088138580322, 0.00020825862884521484, 0.00023196637630462646, 0.0002556741237640381, 0.0002793818712234497, 0.00030308961868286133, 0.00032679736614227295, 0.00035050511360168457, 0.0003742128610610962, 0.0003979206085205078, 0.00042162835597991943, 0.00044533610343933105, 0.0004690438508987427, 0.0004927515983581543, 0.0005164593458175659, 0.0005401670932769775, 0.0005638748407363892, 0.0005875825881958008, 0.0006112903356552124, 0.000634998083114624, 0.0006587058305740356, 0.0006824135780334473, 0.0007061213254928589, 0.0007298290729522705, 0.0007535368204116821, 0.0007772445678710938]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 7.0, 6.0, 13.0, 25.0, 24.0, 42.0, 40.0, 84.0, 124.0, 197.0, 334.0, 478.0, 714.0, 1207.0, 1904.0, 3040.0, 4642.0, 7268.0, 10984.0, 16501.0, 24474.0, 34992.0, 47878.0, 62982.0, 78647.0, 92110.0, 101220.0, 103942.0, 98652.0, 87921.0, 73706.0, 57361.0, 43026.0, 30987.0, 21846.0, 14264.0, 9600.0, 6261.0, 4089.0, 2534.0, 1707.0, 1034.0, 618.0, 424.0, 226.0, 149.0, 101.0, 60.0, 37.0, 31.0, 21.0, 10.0, 11.0, 4.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.83203125, -5.6458740234375, -5.459716796875, -5.2735595703125, -5.08740234375, -4.9012451171875, -4.715087890625, -4.5289306640625, -4.3427734375, -4.1566162109375, -3.970458984375, -3.7843017578125, -3.59814453125, -3.4119873046875, -3.225830078125, -3.0396728515625, -2.853515625, -2.6673583984375, -2.481201171875, -2.2950439453125, -2.10888671875, -1.9227294921875, -1.736572265625, -1.5504150390625, -1.3642578125, -1.1781005859375, -0.991943359375, -0.8057861328125, -0.61962890625, -0.4334716796875, -0.247314453125, -0.0611572265625, 0.125, 0.3111572265625, 0.497314453125, 0.6834716796875, 0.86962890625, 1.0557861328125, 1.241943359375, 1.4281005859375, 1.6142578125, 1.8004150390625, 1.986572265625, 2.1727294921875, 2.35888671875, 2.5450439453125, 2.731201171875, 2.9173583984375, 3.103515625, 3.2896728515625, 3.475830078125, 3.6619873046875, 3.84814453125, 4.0343017578125, 4.220458984375, 4.4066162109375, 4.5927734375, 4.7789306640625, 4.965087890625, 5.1512451171875, 5.33740234375, 5.5235595703125, 5.709716796875, 5.8958740234375, 6.08203125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 9.0, 12.0, 8.0, 14.0, 21.0, 21.0, 30.0, 31.0, 42.0, 64.0, 41.0, 58.0, 69.0, 72.0, 55.0, 68.0, 60.0, 64.0, 45.0, 41.0, 36.0, 36.0, 20.0, 25.0, 16.0, 13.0, 7.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.2105712890625, -4.089111328125, -3.9676513671875, -3.84619140625, -3.7247314453125, -3.603271484375, -3.4818115234375, -3.3603515625, -3.2388916015625, -3.117431640625, -2.9959716796875, -2.87451171875, -2.7530517578125, -2.631591796875, -2.5101318359375, -2.388671875, -2.2672119140625, -2.145751953125, -2.0242919921875, -1.90283203125, -1.7813720703125, -1.659912109375, -1.5384521484375, -1.4169921875, -1.2955322265625, -1.174072265625, -1.0526123046875, -0.93115234375, -0.8096923828125, -0.688232421875, -0.5667724609375, -0.4453125, -0.3238525390625, -0.202392578125, -0.0809326171875, 0.04052734375, 0.1619873046875, 0.283447265625, 0.4049072265625, 0.5263671875, 0.6478271484375, 0.769287109375, 0.8907470703125, 1.01220703125, 1.1336669921875, 1.255126953125, 1.3765869140625, 1.498046875, 1.6195068359375, 1.740966796875, 1.8624267578125, 1.98388671875, 2.1053466796875, 2.226806640625, 2.3482666015625, 2.4697265625, 2.5911865234375, 2.712646484375, 2.8341064453125, 2.95556640625, 3.0770263671875, 3.198486328125, 3.3199462890625, 3.44140625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 2.0, 5.0, 6.0, 8.0, 12.0, 14.0, 15.0, 21.0, 12.0, 27.0, 25.0, 27.0, 31.0, 41.0, 35.0, 31.0, 33.0, 43.0, 48.0, 34.0, 46.0, 35.0, 39.0, 35.0, 38.0, 42.0, 32.0, 33.0, 29.0, 25.0, 22.0, 26.0, 17.0, 13.0, 10.0, 23.0, 16.0, 9.0, 7.0, 7.0, 7.0, 5.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.4219970703125, -14.90878677368164, -14.395577430725098, -13.882367134094238, -13.369157791137695, -12.855947494506836, -12.342737197875977, -11.829526901245117, -11.316317558288574, -10.803107261657715, -10.289897918701172, -9.776687622070312, -9.263477325439453, -8.75026798248291, -8.23705768585205, -7.72384786605835, -7.210638046264648, -6.697428226470947, -6.184218406677246, -5.671008110046387, -5.1577982902526855, -4.644588470458984, -4.131378173828125, -3.618168354034424, -3.1049585342407227, -2.5917487144470215, -2.078538656234741, -1.5653287172317505, -1.0521187782287598, -0.5389089584350586, -0.02569890022277832, 0.48751115798950195, 1.0007190704345703, 1.513929009437561, 2.0271389484405518, 2.540349006652832, 3.053558826446533, 3.5667686462402344, 4.079978942871094, 4.593188762664795, 5.106398582458496, 5.619608402252197, 6.132818222045898, 6.646028518676758, 7.159238338470459, 7.67244815826416, 8.18565845489502, 8.698867797851562, 9.212078094482422, 9.725288391113281, 10.238497734069824, 10.751708030700684, 11.264917373657227, 11.778127670288086, 12.291337966918945, 12.804548263549805, 13.317757606506348, 13.830967903137207, 14.34417724609375, 14.85738754272461, 15.370597839355469, 15.883807182312012, 16.397016525268555, 16.910226821899414, 17.423437118530273]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 9.0, 13.0, 14.0, 17.0, 25.0, 22.0, 25.0, 24.0, 28.0, 30.0, 42.0, 33.0, 32.0, 29.0, 43.0, 53.0, 35.0, 41.0, 41.0, 41.0, 44.0, 40.0, 42.0, 23.0, 35.0, 22.0, 32.0, 33.0, 22.0, 24.0, 12.0, 10.0, 13.0, 14.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.436277389526367, -20.79283332824707, -20.149389266967773, -19.505943298339844, -18.862499237060547, -18.21905517578125, -17.575611114501953, -16.932167053222656, -16.28872299194336, -15.645278930664062, -15.00183391571045, -14.358389854431152, -13.714944839477539, -13.071500778198242, -12.428056716918945, -11.784612655639648, -11.141166687011719, -10.497722625732422, -9.854277610778809, -9.210833549499512, -8.567388534545898, -7.923944473266602, -7.280500411987305, -6.63705587387085, -5.9936113357543945, -5.3501667976379395, -4.706722259521484, -4.0632781982421875, -3.4198336601257324, -2.7763891220092773, -2.1329448223114014, -1.4895005226135254, -0.8460559844970703, -0.20261156558990479, 0.44083285331726074, 1.0842772722244263, 1.7277216911315918, 2.371166229248047, 3.014610528945923, 3.658054828643799, 4.301499366760254, 4.944943904876709, 5.588388442993164, 6.231832504272461, 6.875277042388916, 7.518721580505371, 8.162165641784668, 8.805610656738281, 9.449054718017578, 10.092498779296875, 10.735943794250488, 11.379387855529785, 12.022832870483398, 12.666276931762695, 13.309720993041992, 13.953165054321289, 14.596610069274902, 15.2400541305542, 15.883499145507812, 16.52694320678711, 17.170387268066406, 17.813831329345703, 18.457277297973633, 19.10072135925293, 19.744165420532227]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 6.0, 11.0, 22.0, 45.0, 61.0, 92.0, 125.0, 198.0, 342.0, 559.0, 981.0, 1673.0, 3041.0, 5272.0, 9436.0, 17040.0, 30958.0, 54510.0, 96254.0, 162769.0, 262390.0, 389506.0, 517816.0, 595921.0, 587387.0, 496229.0, 365946.0, 242342.0, 149431.0, 87441.0, 50190.0, 28201.0, 16191.0, 9286.0, 5233.0, 3001.0, 1757.0, 1040.0, 609.0, 356.0, 216.0, 122.0, 99.0, 55.0, 36.0, 29.0, 21.0, 6.0, 11.0, 6.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-16.1875, -15.646484375, -15.10546875, -14.564453125, -14.0234375, -13.482421875, -12.94140625, -12.400390625, -11.859375, -11.318359375, -10.77734375, -10.236328125, -9.6953125, -9.154296875, -8.61328125, -8.072265625, -7.53125, -6.990234375, -6.44921875, -5.908203125, -5.3671875, -4.826171875, -4.28515625, -3.744140625, -3.203125, -2.662109375, -2.12109375, -1.580078125, -1.0390625, -0.498046875, 0.04296875, 0.583984375, 1.125, 1.666015625, 2.20703125, 2.748046875, 3.2890625, 3.830078125, 4.37109375, 4.912109375, 5.453125, 5.994140625, 6.53515625, 7.076171875, 7.6171875, 8.158203125, 8.69921875, 9.240234375, 9.78125, 10.322265625, 10.86328125, 11.404296875, 11.9453125, 12.486328125, 13.02734375, 13.568359375, 14.109375, 14.650390625, 15.19140625, 15.732421875, 16.2734375, 16.814453125, 17.35546875, 17.896484375, 18.4375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 3.0, 6.0, 7.0, 11.0, 12.0, 16.0, 14.0, 26.0, 21.0, 25.0, 26.0, 25.0, 36.0, 33.0, 34.0, 31.0, 34.0, 43.0, 49.0, 37.0, 43.0, 40.0, 42.0, 42.0, 38.0, 41.0, 25.0, 30.0, 28.0, 27.0, 37.0, 25.0, 22.0, 10.0, 12.0, 13.0, 11.0, 7.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.53125, -19.914794921875, -19.29833984375, -18.681884765625, -18.0654296875, -17.448974609375, -16.83251953125, -16.216064453125, -15.599609375, -14.983154296875, -14.36669921875, -13.750244140625, -13.1337890625, -12.517333984375, -11.90087890625, -11.284423828125, -10.66796875, -10.051513671875, -9.43505859375, -8.818603515625, -8.2021484375, -7.585693359375, -6.96923828125, -6.352783203125, -5.736328125, -5.119873046875, -4.50341796875, -3.886962890625, -3.2705078125, -2.654052734375, -2.03759765625, -1.421142578125, -0.8046875, -0.188232421875, 0.42822265625, 1.044677734375, 1.6611328125, 2.277587890625, 2.89404296875, 3.510498046875, 4.126953125, 4.743408203125, 5.35986328125, 5.976318359375, 6.5927734375, 7.209228515625, 7.82568359375, 8.442138671875, 9.05859375, 9.675048828125, 10.29150390625, 10.907958984375, 11.5244140625, 12.140869140625, 12.75732421875, 13.373779296875, 13.990234375, 14.606689453125, 15.22314453125, 15.839599609375, 16.4560546875, 17.072509765625, 17.68896484375, 18.305419921875, 18.921875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 13.0, 3.0, 8.0, 23.0, 22.0, 57.0, 83.0, 145.0, 197.0, 314.0, 557.0, 833.0, 1429.0, 2373.0, 4040.0, 7020.0, 11800.0, 20326.0, 34082.0, 56699.0, 91825.0, 145176.0, 218497.0, 308582.0, 405191.0, 480023.0, 514580.0, 491176.0, 422178.0, 328311.0, 235137.0, 157857.0, 100700.0, 62319.0, 37673.0, 22568.0, 13219.0, 7820.0, 4620.0, 2684.0, 1648.0, 986.0, 562.0, 358.0, 229.0, 127.0, 85.0, 49.0, 41.0, 23.0, 8.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.015625, -16.49365234375, -15.9716796875, -15.44970703125, -14.927734375, -14.40576171875, -13.8837890625, -13.36181640625, -12.83984375, -12.31787109375, -11.7958984375, -11.27392578125, -10.751953125, -10.22998046875, -9.7080078125, -9.18603515625, -8.6640625, -8.14208984375, -7.6201171875, -7.09814453125, -6.576171875, -6.05419921875, -5.5322265625, -5.01025390625, -4.48828125, -3.96630859375, -3.4443359375, -2.92236328125, -2.400390625, -1.87841796875, -1.3564453125, -0.83447265625, -0.3125, 0.20947265625, 0.7314453125, 1.25341796875, 1.775390625, 2.29736328125, 2.8193359375, 3.34130859375, 3.86328125, 4.38525390625, 4.9072265625, 5.42919921875, 5.951171875, 6.47314453125, 6.9951171875, 7.51708984375, 8.0390625, 8.56103515625, 9.0830078125, 9.60498046875, 10.126953125, 10.64892578125, 11.1708984375, 11.69287109375, 12.21484375, 12.73681640625, 13.2587890625, 13.78076171875, 14.302734375, 14.82470703125, 15.3466796875, 15.86865234375, 16.390625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 8.0, 7.0, 18.0, 18.0, 23.0, 33.0, 35.0, 55.0, 57.0, 64.0, 89.0, 91.0, 106.0, 117.0, 152.0, 138.0, 154.0, 191.0, 183.0, 210.0, 207.0, 190.0, 206.0, 197.0, 155.0, 194.0, 193.0, 141.0, 166.0, 114.0, 102.0, 89.0, 70.0, 53.0, 45.0, 39.0, 35.0, 28.0, 23.0, 16.0, 15.0, 10.0, 11.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0], "bins": [-8.828125, -8.57293701171875, -8.3177490234375, -8.06256103515625, -7.807373046875, -7.55218505859375, -7.2969970703125, -7.04180908203125, -6.78662109375, -6.53143310546875, -6.2762451171875, -6.02105712890625, -5.765869140625, -5.51068115234375, -5.2554931640625, -5.00030517578125, -4.7451171875, -4.48992919921875, -4.2347412109375, -3.97955322265625, -3.724365234375, -3.46917724609375, -3.2139892578125, -2.95880126953125, -2.70361328125, -2.44842529296875, -2.1932373046875, -1.93804931640625, -1.682861328125, -1.42767333984375, -1.1724853515625, -0.91729736328125, -0.662109375, -0.40692138671875, -0.1517333984375, 0.10345458984375, 0.358642578125, 0.61383056640625, 0.8690185546875, 1.12420654296875, 1.37939453125, 1.63458251953125, 1.8897705078125, 2.14495849609375, 2.400146484375, 2.65533447265625, 2.9105224609375, 3.16571044921875, 3.4208984375, 3.67608642578125, 3.9312744140625, 4.18646240234375, 4.441650390625, 4.69683837890625, 4.9520263671875, 5.20721435546875, 5.46240234375, 5.71759033203125, 5.9727783203125, 6.22796630859375, 6.483154296875, 6.73834228515625, 6.9935302734375, 7.24871826171875, 7.50390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 6.0, 9.0, 5.0, 14.0, 19.0, 17.0, 23.0, 17.0, 24.0, 18.0, 28.0, 27.0, 27.0, 31.0, 43.0, 34.0, 43.0, 30.0, 39.0, 40.0, 49.0, 41.0, 40.0, 45.0, 37.0, 30.0, 29.0, 33.0, 30.0, 28.0, 19.0, 22.0, 16.0, 9.0, 10.0, 9.0, 8.0, 10.0, 9.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.20712661743164, -16.641019821166992, -16.074913024902344, -15.508807182312012, -14.94270133972168, -14.376594543457031, -13.810487747192383, -13.244380950927734, -12.678275108337402, -12.112168312072754, -11.546062469482422, -10.979955673217773, -10.413848876953125, -9.847743034362793, -9.281636238098145, -8.715530395507812, -8.149423599243164, -7.583317279815674, -7.017210960388184, -6.451104164123535, -5.884997844696045, -5.318891525268555, -4.752784729003906, -4.186678409576416, -3.620572090148926, -3.0544657707214355, -2.488359212875366, -1.9222527742385864, -1.3561463356018066, -0.7900400161743164, -0.22393345832824707, 0.34217309951782227, 0.9082794189453125, 1.4743858575820923, 2.040492296218872, 2.6065988540649414, 3.1727051734924316, 3.738811492919922, 4.30491828918457, 4.8710246086120605, 5.437130928039551, 6.003237247467041, 6.569343566894531, 7.13545036315918, 7.70155668258667, 8.26766300201416, 8.833769798278809, 9.39987564086914, 9.965982437133789, 10.532089233398438, 11.09819507598877, 11.664301872253418, 12.23040771484375, 12.796514511108398, 13.362621307373047, 13.928728103637695, 14.494833946228027, 15.060940742492676, 15.627046585083008, 16.193153381347656, 16.759260177612305, 17.325366973876953, 17.89147186279297, 18.457578659057617, 19.023685455322266]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 7.0, 11.0, 15.0, 14.0, 17.0, 20.0, 25.0, 19.0, 19.0, 26.0, 36.0, 29.0, 27.0, 32.0, 28.0, 53.0, 54.0, 41.0, 43.0, 42.0, 30.0, 34.0, 42.0, 39.0, 35.0, 31.0, 39.0, 31.0, 35.0, 27.0, 10.0, 15.0, 15.0, 8.0, 17.0, 6.0, 7.0, 12.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.807043075561523, -20.106842041015625, -19.406641006469727, -18.706439971923828, -18.006237030029297, -17.3060359954834, -16.6058349609375, -15.905633926391602, -15.205431938171387, -14.505230903625488, -13.805028915405273, -13.104827880859375, -12.404626846313477, -11.704424858093262, -11.004223823547363, -10.304021835327148, -9.60382080078125, -8.903619766235352, -8.203417778015137, -7.503216743469238, -6.803015232086182, -6.102813720703125, -5.402612686157227, -4.70241117477417, -4.002209663391113, -3.3020081520080566, -2.601806879043579, -1.9016056060791016, -1.201404094696045, -0.5012025833129883, 0.19899845123291016, 0.8991999626159668, 1.5994014739990234, 2.29960298538208, 2.9998042583465576, 3.700005531311035, 4.400207042694092, 5.100408554077148, 5.800609588623047, 6.5008111000061035, 7.20101261138916, 7.901214122772217, 8.601415634155273, 9.301616668701172, 10.00181770324707, 10.702019691467285, 11.402220726013184, 12.102422714233398, 12.802623748779297, 13.502824783325195, 14.20302677154541, 14.903227806091309, 15.603429794311523, 16.303630828857422, 17.00383186340332, 17.70403289794922, 18.40423583984375, 19.10443687438965, 19.804637908935547, 20.504840850830078, 21.205041885375977, 21.905242919921875, 22.605443954467773, 23.305644989013672, 24.00584602355957]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 11.0, 13.0, 16.0, 29.0, 46.0, 61.0, 144.0, 138.0, 275.0, 477.0, 676.0, 1151.0, 1905.0, 2937.0, 4686.0, 7504.0, 12225.0, 19777.0, 31052.0, 49292.0, 74998.0, 108021.0, 138145.0, 150413.0, 136343.0, 105495.0, 73734.0, 48176.0, 30477.0, 19148.0, 11694.0, 7244.0, 4490.0, 2835.0, 1758.0, 1080.0, 765.0, 465.0, 311.0, 177.0, 126.0, 80.0, 50.0, 43.0, 32.0, 14.0, 9.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.2890625, -4.160919189453125, -4.03277587890625, -3.904632568359375, -3.7764892578125, -3.648345947265625, -3.52020263671875, -3.392059326171875, -3.263916015625, -3.135772705078125, -3.00762939453125, -2.879486083984375, -2.7513427734375, -2.623199462890625, -2.49505615234375, -2.366912841796875, -2.23876953125, -2.110626220703125, -1.98248291015625, -1.854339599609375, -1.7261962890625, -1.598052978515625, -1.46990966796875, -1.341766357421875, -1.213623046875, -1.085479736328125, -0.95733642578125, -0.829193115234375, -0.7010498046875, -0.572906494140625, -0.44476318359375, -0.316619873046875, -0.1884765625, -0.060333251953125, 0.06781005859375, 0.195953369140625, 0.3240966796875, 0.452239990234375, 0.58038330078125, 0.708526611328125, 0.836669921875, 0.964813232421875, 1.09295654296875, 1.221099853515625, 1.3492431640625, 1.477386474609375, 1.60552978515625, 1.733673095703125, 1.86181640625, 1.989959716796875, 2.11810302734375, 2.246246337890625, 2.3743896484375, 2.502532958984375, 2.63067626953125, 2.758819580078125, 2.886962890625, 3.015106201171875, 3.14324951171875, 3.271392822265625, 3.3995361328125, 3.527679443359375, 3.65582275390625, 3.783966064453125, 3.912109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 5.0, 5.0, 14.0, 13.0, 18.0, 14.0, 22.0, 21.0, 20.0, 19.0, 27.0, 38.0, 28.0, 27.0, 34.0, 25.0, 55.0, 53.0, 46.0, 41.0, 39.0, 33.0, 32.0, 44.0, 34.0, 38.0, 31.0, 38.0, 29.0, 36.0, 27.0, 10.0, 15.0, 14.0, 7.0, 19.0, 4.0, 8.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.921875, -20.218994140625, -19.51611328125, -18.813232421875, -18.1103515625, -17.407470703125, -16.70458984375, -16.001708984375, -15.298828125, -14.595947265625, -13.89306640625, -13.190185546875, -12.4873046875, -11.784423828125, -11.08154296875, -10.378662109375, -9.67578125, -8.972900390625, -8.27001953125, -7.567138671875, -6.8642578125, -6.161376953125, -5.45849609375, -4.755615234375, -4.052734375, -3.349853515625, -2.64697265625, -1.944091796875, -1.2412109375, -0.538330078125, 0.16455078125, 0.867431640625, 1.5703125, 2.273193359375, 2.97607421875, 3.678955078125, 4.3818359375, 5.084716796875, 5.78759765625, 6.490478515625, 7.193359375, 7.896240234375, 8.59912109375, 9.302001953125, 10.0048828125, 10.707763671875, 11.41064453125, 12.113525390625, 12.81640625, 13.519287109375, 14.22216796875, 14.925048828125, 15.6279296875, 16.330810546875, 17.03369140625, 17.736572265625, 18.439453125, 19.142333984375, 19.84521484375, 20.548095703125, 21.2509765625, 21.953857421875, 22.65673828125, 23.359619140625, 24.0625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 2.0, 13.0, 12.0, 25.0, 35.0, 49.0, 68.0, 115.0, 171.0, 246.0, 421.0, 684.0, 1209.0, 1959.0, 3392.0, 5883.0, 10292.0, 18899.0, 41664.0, 765946.0, 138174.0, 26777.0, 13933.0, 7670.0, 4351.0, 2576.0, 1515.0, 922.0, 572.0, 328.0, 237.0, 136.0, 92.0, 52.0, 35.0, 36.0, 16.0, 11.0, 16.0, 10.0, 2.0, 1.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.6171875, -9.3143310546875, -9.011474609375, -8.7086181640625, -8.40576171875, -8.1029052734375, -7.800048828125, -7.4971923828125, -7.1943359375, -6.8914794921875, -6.588623046875, -6.2857666015625, -5.98291015625, -5.6800537109375, -5.377197265625, -5.0743408203125, -4.771484375, -4.4686279296875, -4.165771484375, -3.8629150390625, -3.56005859375, -3.2572021484375, -2.954345703125, -2.6514892578125, -2.3486328125, -2.0457763671875, -1.742919921875, -1.4400634765625, -1.13720703125, -0.8343505859375, -0.531494140625, -0.2286376953125, 0.07421875, 0.3770751953125, 0.679931640625, 0.9827880859375, 1.28564453125, 1.5885009765625, 1.891357421875, 2.1942138671875, 2.4970703125, 2.7999267578125, 3.102783203125, 3.4056396484375, 3.70849609375, 4.0113525390625, 4.314208984375, 4.6170654296875, 4.919921875, 5.2227783203125, 5.525634765625, 5.8284912109375, 6.13134765625, 6.4342041015625, 6.737060546875, 7.0399169921875, 7.3427734375, 7.6456298828125, 7.948486328125, 8.2513427734375, 8.55419921875, 8.8570556640625, 9.159912109375, 9.4627685546875, 9.765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 9.0, 12.0, 7.0, 13.0, 11.0, 22.0, 16.0, 24.0, 22.0, 29.0, 23.0, 38.0, 37.0, 36.0, 40.0, 31.0, 54.0, 47.0, 48.0, 46.0, 38.0, 34.0, 42.0, 36.0, 39.0, 22.0, 26.0, 34.0, 29.0, 18.0, 26.0, 19.0, 18.0, 14.0, 8.0, 13.0, 4.0, 2.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2265625, -11.7576904296875, -11.288818359375, -10.8199462890625, -10.35107421875, -9.8822021484375, -9.413330078125, -8.9444580078125, -8.4755859375, -8.0067138671875, -7.537841796875, -7.0689697265625, -6.60009765625, -6.1312255859375, -5.662353515625, -5.1934814453125, -4.724609375, -4.2557373046875, -3.786865234375, -3.3179931640625, -2.84912109375, -2.3802490234375, -1.911376953125, -1.4425048828125, -0.9736328125, -0.5047607421875, -0.035888671875, 0.4329833984375, 0.90185546875, 1.3707275390625, 1.839599609375, 2.3084716796875, 2.77734375, 3.2462158203125, 3.715087890625, 4.1839599609375, 4.65283203125, 5.1217041015625, 5.590576171875, 6.0594482421875, 6.5283203125, 6.9971923828125, 7.466064453125, 7.9349365234375, 8.40380859375, 8.8726806640625, 9.341552734375, 9.8104248046875, 10.279296875, 10.7481689453125, 11.217041015625, 11.6859130859375, 12.15478515625, 12.6236572265625, 13.092529296875, 13.5614013671875, 14.0302734375, 14.4991455078125, 14.968017578125, 15.4368896484375, 15.90576171875, 16.3746337890625, 16.843505859375, 17.3123779296875, 17.78125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 11.0, 5.0, 9.0, 24.0, 18.0, 38.0, 44.0, 53.0, 82.0, 123.0, 155.0, 231.0, 307.0, 537.0, 713.0, 1134.0, 1753.0, 2678.0, 4029.0, 6191.0, 9914.0, 15974.0, 25998.0, 103052.0, 775691.0, 41311.0, 21390.0, 13177.0, 8392.0, 5311.0, 3530.0, 2272.0, 1465.0, 950.0, 598.0, 434.0, 290.0, 203.0, 138.0, 90.0, 55.0, 60.0, 21.0, 23.0, 25.0, 14.0, 10.0, 7.0, 5.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6513671875, -0.6312103271484375, -0.611053466796875, -0.5908966064453125, -0.57073974609375, -0.5505828857421875, -0.530426025390625, -0.5102691650390625, -0.4901123046875, -0.4699554443359375, -0.449798583984375, -0.4296417236328125, -0.40948486328125, -0.3893280029296875, -0.369171142578125, -0.3490142822265625, -0.328857421875, -0.3087005615234375, -0.288543701171875, -0.2683868408203125, -0.24822998046875, -0.2280731201171875, -0.207916259765625, -0.1877593994140625, -0.1676025390625, -0.1474456787109375, -0.127288818359375, -0.1071319580078125, -0.08697509765625, -0.0668182373046875, -0.046661376953125, -0.0265045166015625, -0.00634765625, 0.0138092041015625, 0.033966064453125, 0.0541229248046875, 0.07427978515625, 0.0944366455078125, 0.114593505859375, 0.1347503662109375, 0.1549072265625, 0.1750640869140625, 0.195220947265625, 0.2153778076171875, 0.23553466796875, 0.2556915283203125, 0.275848388671875, 0.2960052490234375, 0.316162109375, 0.3363189697265625, 0.356475830078125, 0.3766326904296875, 0.39678955078125, 0.4169464111328125, 0.437103271484375, 0.4572601318359375, 0.4774169921875, 0.4975738525390625, 0.517730712890625, 0.5378875732421875, 0.55804443359375, 0.5782012939453125, 0.598358154296875, 0.6185150146484375, 0.638671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 9.0, 8.0, 6.0, 8.0, 28.0, 28.0, 30.0, 23.0, 38.0, 37.0, 28.0, 52.0, 45.0, 51.0, 59.0, 47.0, 49.0, 58.0, 48.0, 52.0, 51.0, 29.0, 39.0, 35.0, 29.0, 24.0, 17.0, 14.0, 16.0, 12.0, 5.0, 9.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.0219554901123047e-05, -2.932269126176834e-05, -2.8425827622413635e-05, -2.752896398305893e-05, -2.6632100343704224e-05, -2.5735236704349518e-05, -2.4838373064994812e-05, -2.3941509425640106e-05, -2.30446457862854e-05, -2.2147782146930695e-05, -2.125091850757599e-05, -2.0354054868221283e-05, -1.9457191228866577e-05, -1.856032758951187e-05, -1.7663463950157166e-05, -1.676660031080246e-05, -1.5869736671447754e-05, -1.4972873032093048e-05, -1.4076009392738342e-05, -1.3179145753383636e-05, -1.228228211402893e-05, -1.1385418474674225e-05, -1.0488554835319519e-05, -9.591691195964813e-06, -8.694827556610107e-06, -7.797963917255402e-06, -6.901100277900696e-06, -6.00423663854599e-06, -5.107372999191284e-06, -4.210509359836578e-06, -3.3136457204818726e-06, -2.4167820811271667e-06, -1.519918441772461e-06, -6.230548024177551e-07, 2.738088369369507e-07, 1.1706724762916565e-06, 2.0675361156463623e-06, 2.964399755001068e-06, 3.861263394355774e-06, 4.75812703371048e-06, 5.6549906730651855e-06, 6.551854312419891e-06, 7.448717951774597e-06, 8.345581591129303e-06, 9.242445230484009e-06, 1.0139308869838715e-05, 1.103617250919342e-05, 1.1933036148548126e-05, 1.2829899787902832e-05, 1.3726763427257538e-05, 1.4623627066612244e-05, 1.552049070596695e-05, 1.6417354345321655e-05, 1.731421798467636e-05, 1.8211081624031067e-05, 1.9107945263385773e-05, 2.000480890274048e-05, 2.0901672542095184e-05, 2.179853618144989e-05, 2.2695399820804596e-05, 2.3592263460159302e-05, 2.4489127099514008e-05, 2.5385990738868713e-05, 2.628285437822342e-05, 2.7179718017578125e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 5.0, 6.0, 13.0, 12.0, 20.0, 40.0, 40.0, 78.0, 94.0, 150.0, 273.0, 384.0, 575.0, 968.0, 1489.0, 2215.0, 3426.0, 5435.0, 8790.0, 13571.0, 21474.0, 33863.0, 51044.0, 76645.0, 108109.0, 139964.0, 152411.0, 132421.0, 98713.0, 68310.0, 45486.0, 29976.0, 19183.0, 12142.0, 7720.0, 4847.0, 3095.0, 1947.0, 1256.0, 821.0, 539.0, 361.0, 200.0, 152.0, 91.0, 69.0, 45.0, 37.0, 18.0, 18.0, 8.0, 3.0, 3.0, 6.0, 3.0, 0.0, 1.0], "bins": [-0.5859375, -0.5683746337890625, -0.550811767578125, -0.5332489013671875, -0.51568603515625, -0.4981231689453125, -0.480560302734375, -0.4629974365234375, -0.4454345703125, -0.4278717041015625, -0.410308837890625, -0.3927459716796875, -0.37518310546875, -0.3576202392578125, -0.340057373046875, -0.3224945068359375, -0.304931640625, -0.2873687744140625, -0.269805908203125, -0.2522430419921875, -0.23468017578125, -0.2171173095703125, -0.199554443359375, -0.1819915771484375, -0.1644287109375, -0.1468658447265625, -0.129302978515625, -0.1117401123046875, -0.09417724609375, -0.0766143798828125, -0.059051513671875, -0.0414886474609375, -0.02392578125, -0.0063629150390625, 0.011199951171875, 0.0287628173828125, 0.04632568359375, 0.0638885498046875, 0.081451416015625, 0.0990142822265625, 0.1165771484375, 0.1341400146484375, 0.151702880859375, 0.1692657470703125, 0.18682861328125, 0.2043914794921875, 0.221954345703125, 0.2395172119140625, 0.257080078125, 0.2746429443359375, 0.292205810546875, 0.3097686767578125, 0.32733154296875, 0.3448944091796875, 0.362457275390625, 0.3800201416015625, 0.3975830078125, 0.4151458740234375, 0.432708740234375, 0.4502716064453125, 0.46783447265625, 0.4853973388671875, 0.502960205078125, 0.5205230712890625, 0.5380859375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 8.0, 4.0, 7.0, 8.0, 10.0, 15.0, 13.0, 15.0, 22.0, 33.0, 26.0, 27.0, 49.0, 40.0, 60.0, 52.0, 33.0, 66.0, 51.0, 55.0, 57.0, 46.0, 53.0, 40.0, 29.0, 32.0, 30.0, 31.0, 26.0, 15.0, 16.0, 14.0, 11.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.260009765625, -0.25142669677734375, -0.2428436279296875, -0.23426055908203125, -0.225677490234375, -0.21709442138671875, -0.2085113525390625, -0.19992828369140625, -0.19134521484375, -0.18276214599609375, -0.1741790771484375, -0.16559600830078125, -0.157012939453125, -0.14842987060546875, -0.1398468017578125, -0.13126373291015625, -0.1226806640625, -0.11409759521484375, -0.1055145263671875, -0.09693145751953125, -0.088348388671875, -0.07976531982421875, -0.0711822509765625, -0.06259918212890625, -0.05401611328125, -0.04543304443359375, -0.0368499755859375, -0.02826690673828125, -0.019683837890625, -0.01110076904296875, -0.0025177001953125, 0.00606536865234375, 0.0146484375, 0.02323150634765625, 0.0318145751953125, 0.04039764404296875, 0.048980712890625, 0.05756378173828125, 0.0661468505859375, 0.07472991943359375, 0.08331298828125, 0.09189605712890625, 0.1004791259765625, 0.10906219482421875, 0.117645263671875, 0.12622833251953125, 0.1348114013671875, 0.14339447021484375, 0.1519775390625, 0.16056060791015625, 0.1691436767578125, 0.17772674560546875, 0.186309814453125, 0.19489288330078125, 0.2034759521484375, 0.21205902099609375, 0.22064208984375, 0.22922515869140625, 0.2378082275390625, 0.24639129638671875, 0.254974365234375, 0.26355743408203125, 0.2721405029296875, 0.28072357177734375, 0.289306640625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 7.0, 3.0, 10.0, 12.0, 15.0, 16.0, 22.0, 19.0, 20.0, 22.0, 25.0, 28.0, 32.0, 29.0, 38.0, 32.0, 39.0, 38.0, 43.0, 40.0, 42.0, 49.0, 29.0, 47.0, 37.0, 41.0, 27.0, 34.0, 35.0, 30.0, 21.0, 18.0, 19.0, 8.0, 10.0, 12.0, 9.0, 11.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.923259735107422, -17.339920043945312, -16.756580352783203, -16.173240661621094, -15.589900970458984, -15.006561279296875, -14.423221588134766, -13.839881896972656, -13.256542205810547, -12.673202514648438, -12.089862823486328, -11.506523132324219, -10.92318344116211, -10.33984375, -9.75650405883789, -9.173164367675781, -8.589823722839355, -8.006484031677246, -7.423144340515137, -6.839804649353027, -6.256464958190918, -5.673125267028809, -5.089785099029541, -4.506445407867432, -3.9231057167053223, -3.339766025543213, -2.7564263343811035, -2.173086404800415, -1.5897467136383057, -1.0064070224761963, -0.4230670928955078, 0.16027259826660156, 0.7436122894287109, 1.3269519805908203, 1.9102917909622192, 2.493631601333618, 3.0769712924957275, 3.660310983657837, 4.243650913238525, 4.826990604400635, 5.410330295562744, 5.9936699867248535, 6.577009677886963, 7.1603498458862305, 7.74368953704834, 8.32702922821045, 8.910368919372559, 9.493708610534668, 10.077048301696777, 10.660387992858887, 11.243727684020996, 11.827067375183105, 12.410407066345215, 12.993746757507324, 13.57708740234375, 14.16042709350586, 14.743766784667969, 15.327106475830078, 15.910446166992188, 16.493785858154297, 17.077125549316406, 17.660465240478516, 18.243804931640625, 18.827144622802734, 19.410484313964844]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 6.0, 5.0, 14.0, 12.0, 19.0, 14.0, 19.0, 23.0, 20.0, 19.0, 28.0, 38.0, 26.0, 32.0, 30.0, 29.0, 53.0, 51.0, 44.0, 43.0, 39.0, 33.0, 34.0, 41.0, 37.0, 35.0, 31.0, 37.0, 32.0, 32.0, 29.0, 10.0, 15.0, 15.0, 9.0, 15.0, 6.0, 7.0, 11.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.86855125427246, -20.16748809814453, -19.466426849365234, -18.765363693237305, -18.064302444458008, -17.363239288330078, -16.66217803955078, -15.961114883422852, -15.260052680969238, -14.558990478515625, -13.857928276062012, -13.156866073608398, -12.455802917480469, -11.754741668701172, -11.053678512573242, -10.352616310119629, -9.651554107666016, -8.950491905212402, -8.249429702758789, -7.548367023468018, -6.847304821014404, -6.146242618560791, -5.4451799392700195, -4.744117736816406, -4.043055534362793, -3.3419933319091797, -2.6409308910369873, -1.939868450164795, -1.2388062477111816, -0.5377440452575684, 0.16331863403320312, 0.8643808364868164, 1.5654449462890625, 2.266507148742676, 2.967569589614868, 3.6686320304870605, 4.369694232940674, 5.070756435394287, 5.771819114685059, 6.472881317138672, 7.173943519592285, 7.875005722045898, 8.576067924499512, 9.277130126953125, 9.978193283081055, 10.679254531860352, 11.380317687988281, 12.081379890441895, 12.782442092895508, 13.483504295349121, 14.184566497802734, 14.885629653930664, 15.586690902709961, 16.28775405883789, 16.988815307617188, 17.689878463745117, 18.390941619873047, 19.092004776000977, 19.793066024780273, 20.494129180908203, 21.1951904296875, 21.89625358581543, 22.59731674194336, 23.298377990722656, 23.999439239501953]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 10.0, 16.0, 19.0, 29.0, 49.0, 95.0, 126.0, 226.0, 434.0, 700.0, 1214.0, 1972.0, 3396.0, 5905.0, 9873.0, 16053.0, 25774.0, 39737.0, 57834.0, 79255.0, 100430.0, 117281.0, 123303.0, 117319.0, 101544.0, 80627.0, 58080.0, 40200.0, 25937.0, 16447.0, 9983.0, 6011.0, 3663.0, 2085.0, 1222.0, 731.0, 389.0, 238.0, 143.0, 80.0, 46.0, 37.0, 23.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.90625, -16.40185546875, -15.8974609375, -15.39306640625, -14.888671875, -14.38427734375, -13.8798828125, -13.37548828125, -12.87109375, -12.36669921875, -11.8623046875, -11.35791015625, -10.853515625, -10.34912109375, -9.8447265625, -9.34033203125, -8.8359375, -8.33154296875, -7.8271484375, -7.32275390625, -6.818359375, -6.31396484375, -5.8095703125, -5.30517578125, -4.80078125, -4.29638671875, -3.7919921875, -3.28759765625, -2.783203125, -2.27880859375, -1.7744140625, -1.27001953125, -0.765625, -0.26123046875, 0.2431640625, 0.74755859375, 1.251953125, 1.75634765625, 2.2607421875, 2.76513671875, 3.26953125, 3.77392578125, 4.2783203125, 4.78271484375, 5.287109375, 5.79150390625, 6.2958984375, 6.80029296875, 7.3046875, 7.80908203125, 8.3134765625, 8.81787109375, 9.322265625, 9.82666015625, 10.3310546875, 10.83544921875, 11.33984375, 11.84423828125, 12.3486328125, 12.85302734375, 13.357421875, 13.86181640625, 14.3662109375, 14.87060546875, 15.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 6.0, 6.0, 14.0, 11.0, 19.0, 14.0, 21.0, 23.0, 23.0, 15.0, 30.0, 36.0, 28.0, 29.0, 32.0, 27.0, 54.0, 53.0, 45.0, 40.0, 41.0, 36.0, 31.0, 42.0, 40.0, 30.0, 34.0, 38.0, 28.0, 36.0, 26.0, 9.0, 13.0, 18.0, 9.0, 14.0, 5.0, 7.0, 12.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.609375, -19.916015625, -19.22265625, -18.529296875, -17.8359375, -17.142578125, -16.44921875, -15.755859375, -15.0625, -14.369140625, -13.67578125, -12.982421875, -12.2890625, -11.595703125, -10.90234375, -10.208984375, -9.515625, -8.822265625, -8.12890625, -7.435546875, -6.7421875, -6.048828125, -5.35546875, -4.662109375, -3.96875, -3.275390625, -2.58203125, -1.888671875, -1.1953125, -0.501953125, 0.19140625, 0.884765625, 1.578125, 2.271484375, 2.96484375, 3.658203125, 4.3515625, 5.044921875, 5.73828125, 6.431640625, 7.125, 7.818359375, 8.51171875, 9.205078125, 9.8984375, 10.591796875, 11.28515625, 11.978515625, 12.671875, 13.365234375, 14.05859375, 14.751953125, 15.4453125, 16.138671875, 16.83203125, 17.525390625, 18.21875, 18.912109375, 19.60546875, 20.298828125, 20.9921875, 21.685546875, 22.37890625, 23.072265625, 23.765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 24.0, 27.0, 38.0, 60.0, 101.0, 166.0, 293.0, 431.0, 730.0, 1155.0, 1790.0, 3060.0, 4604.0, 7235.0, 11312.0, 17103.0, 25168.0, 36787.0, 50290.0, 66685.0, 82447.0, 97054.0, 105956.0, 106267.0, 99000.0, 86963.0, 70293.0, 53601.0, 39332.0, 27639.0, 18644.0, 12295.0, 8106.0, 5133.0, 3287.0, 2113.0, 1273.0, 814.0, 468.0, 327.0, 192.0, 87.0, 69.0, 52.0, 23.0, 31.0, 10.0, 10.0, 7.0, 2.0, 5.0, 2.0], "bins": [-16.96875, -16.4854736328125, -16.002197265625, -15.5189208984375, -15.03564453125, -14.5523681640625, -14.069091796875, -13.5858154296875, -13.1025390625, -12.6192626953125, -12.135986328125, -11.6527099609375, -11.16943359375, -10.6861572265625, -10.202880859375, -9.7196044921875, -9.236328125, -8.7530517578125, -8.269775390625, -7.7864990234375, -7.30322265625, -6.8199462890625, -6.336669921875, -5.8533935546875, -5.3701171875, -4.8868408203125, -4.403564453125, -3.9202880859375, -3.43701171875, -2.9537353515625, -2.470458984375, -1.9871826171875, -1.50390625, -1.0206298828125, -0.537353515625, -0.0540771484375, 0.42919921875, 0.9124755859375, 1.395751953125, 1.8790283203125, 2.3623046875, 2.8455810546875, 3.328857421875, 3.8121337890625, 4.29541015625, 4.7786865234375, 5.261962890625, 5.7452392578125, 6.228515625, 6.7117919921875, 7.195068359375, 7.6783447265625, 8.16162109375, 8.6448974609375, 9.128173828125, 9.6114501953125, 10.0947265625, 10.5780029296875, 11.061279296875, 11.5445556640625, 12.02783203125, 12.5111083984375, 12.994384765625, 13.4776611328125, 13.9609375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 8.0, 3.0, 13.0, 9.0, 16.0, 23.0, 24.0, 16.0, 24.0, 34.0, 27.0, 45.0, 25.0, 28.0, 31.0, 27.0, 33.0, 46.0, 48.0, 53.0, 46.0, 42.0, 29.0, 41.0, 44.0, 39.0, 43.0, 19.0, 27.0, 13.0, 22.0, 18.0, 12.0, 14.0, 13.0, 7.0, 13.0, 9.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2734375, -11.8204345703125, -11.367431640625, -10.9144287109375, -10.46142578125, -10.0084228515625, -9.555419921875, -9.1024169921875, -8.6494140625, -8.1964111328125, -7.743408203125, -7.2904052734375, -6.83740234375, -6.3843994140625, -5.931396484375, -5.4783935546875, -5.025390625, -4.5723876953125, -4.119384765625, -3.6663818359375, -3.21337890625, -2.7603759765625, -2.307373046875, -1.8543701171875, -1.4013671875, -0.9483642578125, -0.495361328125, -0.0423583984375, 0.41064453125, 0.8636474609375, 1.316650390625, 1.7696533203125, 2.22265625, 2.6756591796875, 3.128662109375, 3.5816650390625, 4.03466796875, 4.4876708984375, 4.940673828125, 5.3936767578125, 5.8466796875, 6.2996826171875, 6.752685546875, 7.2056884765625, 7.65869140625, 8.1116943359375, 8.564697265625, 9.0177001953125, 9.470703125, 9.9237060546875, 10.376708984375, 10.8297119140625, 11.28271484375, 11.7357177734375, 12.188720703125, 12.6417236328125, 13.0947265625, 13.5477294921875, 14.000732421875, 14.4537353515625, 14.90673828125, 15.3597412109375, 15.812744140625, 16.2657470703125, 16.71875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 10.0, 2.0, 10.0, 17.0, 43.0, 49.0, 96.0, 127.0, 223.0, 289.0, 468.0, 912.0, 1441.0, 2394.0, 4206.0, 7177.0, 12147.0, 20908.0, 34526.0, 54341.0, 79368.0, 108510.0, 131995.0, 139951.0, 130184.0, 106356.0, 78432.0, 52826.0, 32872.0, 20153.0, 11713.0, 6764.0, 4080.0, 2352.0, 1388.0, 848.0, 531.0, 331.0, 183.0, 115.0, 72.0, 43.0, 34.0, 27.0, 14.0, 8.0, 10.0, 7.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.5078125, -7.27655029296875, -7.0452880859375, -6.81402587890625, -6.582763671875, -6.35150146484375, -6.1202392578125, -5.88897705078125, -5.65771484375, -5.42645263671875, -5.1951904296875, -4.96392822265625, -4.732666015625, -4.50140380859375, -4.2701416015625, -4.03887939453125, -3.8076171875, -3.57635498046875, -3.3450927734375, -3.11383056640625, -2.882568359375, -2.65130615234375, -2.4200439453125, -2.18878173828125, -1.95751953125, -1.72625732421875, -1.4949951171875, -1.26373291015625, -1.032470703125, -0.80120849609375, -0.5699462890625, -0.33868408203125, -0.107421875, 0.12384033203125, 0.3551025390625, 0.58636474609375, 0.817626953125, 1.04888916015625, 1.2801513671875, 1.51141357421875, 1.74267578125, 1.97393798828125, 2.2052001953125, 2.43646240234375, 2.667724609375, 2.89898681640625, 3.1302490234375, 3.36151123046875, 3.5927734375, 3.82403564453125, 4.0552978515625, 4.28656005859375, 4.517822265625, 4.74908447265625, 4.9803466796875, 5.21160888671875, 5.44287109375, 5.67413330078125, 5.9053955078125, 6.13665771484375, 6.367919921875, 6.59918212890625, 6.8304443359375, 7.06170654296875, 7.29296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 5.0, 2.0, 3.0, 6.0, 2.0, 3.0, 6.0, 10.0, 13.0, 21.0, 22.0, 26.0, 37.0, 34.0, 47.0, 58.0, 64.0, 53.0, 63.0, 64.0, 54.0, 63.0, 59.0, 53.0, 59.0, 33.0, 28.0, 15.0, 18.0, 19.0, 10.0, 16.0, 10.0, 13.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00115966796875, -0.0011275634169578552, -0.0010954588651657104, -0.0010633543133735657, -0.001031249761581421, -0.0009991452097892761, -0.0009670406579971313, -0.0009349361062049866, -0.0009028315544128418, -0.000870727002620697, -0.0008386224508285522, -0.0008065178990364075, -0.0007744133472442627, -0.0007423087954521179, -0.0007102042436599731, -0.0006780996918678284, -0.0006459951400756836, -0.0006138905882835388, -0.000581786036491394, -0.0005496814846992493, -0.0005175769329071045, -0.0004854723811149597, -0.00045336782932281494, -0.00042126327753067017, -0.0003891587257385254, -0.0003570541739463806, -0.00032494962215423584, -0.00029284507036209106, -0.0002607405185699463, -0.00022863596677780151, -0.00019653141498565674, -0.00016442686319351196, -0.0001323223114013672, -0.00010021775960922241, -6.811320781707764e-05, -3.600865602493286e-05, -3.904104232788086e-06, 2.820044755935669e-05, 6.0304999351501465e-05, 9.240955114364624e-05, 0.00012451410293579102, 0.0001566186547279358, 0.00018872320652008057, 0.00022082775831222534, 0.0002529323101043701, 0.0002850368618965149, 0.00031714141368865967, 0.00034924596548080444, 0.0003813505172729492, 0.000413455069065094, 0.00044555962085723877, 0.00047766417264938354, 0.0005097687244415283, 0.0005418732762336731, 0.0005739778280258179, 0.0006060823798179626, 0.0006381869316101074, 0.0006702914834022522, 0.000702396035194397, 0.0007345005869865417, 0.0007666051387786865, 0.0007987096905708313, 0.0008308142423629761, 0.0008629187941551208, 0.0008950233459472656]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 8.0, 13.0, 20.0, 24.0, 42.0, 38.0, 80.0, 107.0, 179.0, 260.0, 416.0, 629.0, 1104.0, 1673.0, 2874.0, 4584.0, 7591.0, 12383.0, 19987.0, 31777.0, 48718.0, 70055.0, 94365.0, 115835.0, 127541.0, 125653.0, 110428.0, 88466.0, 64429.0, 44144.0, 28890.0, 17780.0, 11131.0, 6778.0, 4049.0, 2449.0, 1516.0, 923.0, 608.0, 342.0, 219.0, 167.0, 87.0, 67.0, 39.0, 27.0, 21.0, 15.0, 10.0, 8.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.1328125, -6.9090576171875, -6.685302734375, -6.4615478515625, -6.23779296875, -6.0140380859375, -5.790283203125, -5.5665283203125, -5.3427734375, -5.1190185546875, -4.895263671875, -4.6715087890625, -4.44775390625, -4.2239990234375, -4.000244140625, -3.7764892578125, -3.552734375, -3.3289794921875, -3.105224609375, -2.8814697265625, -2.65771484375, -2.4339599609375, -2.210205078125, -1.9864501953125, -1.7626953125, -1.5389404296875, -1.315185546875, -1.0914306640625, -0.86767578125, -0.6439208984375, -0.420166015625, -0.1964111328125, 0.02734375, 0.2510986328125, 0.474853515625, 0.6986083984375, 0.92236328125, 1.1461181640625, 1.369873046875, 1.5936279296875, 1.8173828125, 2.0411376953125, 2.264892578125, 2.4886474609375, 2.71240234375, 2.9361572265625, 3.159912109375, 3.3836669921875, 3.607421875, 3.8311767578125, 4.054931640625, 4.2786865234375, 4.50244140625, 4.7261962890625, 4.949951171875, 5.1737060546875, 5.3974609375, 5.6212158203125, 5.844970703125, 6.0687255859375, 6.29248046875, 6.5162353515625, 6.739990234375, 6.9637451171875, 7.1875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 6.0, 7.0, 5.0, 9.0, 7.0, 14.0, 13.0, 16.0, 20.0, 18.0, 32.0, 37.0, 33.0, 42.0, 43.0, 50.0, 57.0, 54.0, 37.0, 52.0, 51.0, 43.0, 43.0, 40.0, 33.0, 37.0, 40.0, 23.0, 23.0, 18.0, 21.0, 12.0, 19.0, 11.0, 7.0, 7.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.849609375, -2.754730224609375, -2.65985107421875, -2.564971923828125, -2.4700927734375, -2.375213623046875, -2.28033447265625, -2.185455322265625, -2.090576171875, -1.995697021484375, -1.90081787109375, -1.805938720703125, -1.7110595703125, -1.616180419921875, -1.52130126953125, -1.426422119140625, -1.33154296875, -1.236663818359375, -1.14178466796875, -1.046905517578125, -0.9520263671875, -0.857147216796875, -0.76226806640625, -0.667388916015625, -0.572509765625, -0.477630615234375, -0.38275146484375, -0.287872314453125, -0.1929931640625, -0.098114013671875, -0.00323486328125, 0.091644287109375, 0.1865234375, 0.281402587890625, 0.37628173828125, 0.471160888671875, 0.5660400390625, 0.660919189453125, 0.75579833984375, 0.850677490234375, 0.945556640625, 1.040435791015625, 1.13531494140625, 1.230194091796875, 1.3250732421875, 1.419952392578125, 1.51483154296875, 1.609710693359375, 1.70458984375, 1.799468994140625, 1.89434814453125, 1.989227294921875, 2.0841064453125, 2.178985595703125, 2.27386474609375, 2.368743896484375, 2.463623046875, 2.558502197265625, 2.65338134765625, 2.748260498046875, 2.8431396484375, 2.938018798828125, 3.03289794921875, 3.127777099609375, 3.22265625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 3.0, 1.0, 14.0, 10.0, 14.0, 5.0, 23.0, 20.0, 10.0, 16.0, 32.0, 24.0, 28.0, 20.0, 40.0, 23.0, 32.0, 44.0, 32.0, 48.0, 30.0, 27.0, 39.0, 45.0, 37.0, 39.0, 33.0, 36.0, 29.0, 34.0, 36.0, 28.0, 33.0, 16.0, 11.0, 16.0, 12.0, 7.0, 11.0, 5.0, 8.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.452930450439453, -15.895241737365723, -15.337553024291992, -14.779863357543945, -14.222174644470215, -13.664485931396484, -13.106797218322754, -12.549108505249023, -11.991418838500977, -11.433730125427246, -10.876041412353516, -10.318351745605469, -9.760663032531738, -9.202974319458008, -8.645285606384277, -8.087596893310547, -7.529908180236816, -6.972219467163086, -6.414530277252197, -5.856841564178467, -5.299152374267578, -4.741463661193848, -4.183774948120117, -3.6260859966278076, -3.068397045135498, -2.5107080936431885, -1.9530192613601685, -1.3953304290771484, -0.8376414775848389, -0.2799525260925293, 0.27773618698120117, 0.8354251384735107, 1.3931140899658203, 1.9508030414581299, 2.5084919929504395, 3.06618070602417, 3.6238696575164795, 4.181558609008789, 4.7392473220825195, 5.29693603515625, 5.854625225067139, 6.412313938140869, 6.970003128051758, 7.527691841125488, 8.085380554199219, 8.643070220947266, 9.20075798034668, 9.758447647094727, 10.316136360168457, 10.873825073242188, 11.431513786315918, 11.989202499389648, 12.546892166137695, 13.104580879211426, 13.662269592285156, 14.219958305358887, 14.777647018432617, 15.335335731506348, 15.893024444580078, 16.450714111328125, 17.00840187072754, 17.566091537475586, 18.123779296875, 18.681468963623047, 19.239158630371094]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 8.0, 9.0, 8.0, 7.0, 11.0, 16.0, 14.0, 12.0, 20.0, 26.0, 21.0, 30.0, 28.0, 32.0, 30.0, 34.0, 30.0, 42.0, 41.0, 35.0, 31.0, 38.0, 32.0, 43.0, 35.0, 35.0, 35.0, 37.0, 37.0, 31.0, 33.0, 27.0, 17.0, 20.0, 13.0, 20.0, 13.0, 16.0, 11.0, 7.0, 4.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-22.683317184448242, -21.936798095703125, -21.190277099609375, -20.443758010864258, -19.697237014770508, -18.95071792602539, -18.20419692993164, -17.457677841186523, -16.711158752441406, -15.964638710021973, -15.218118667602539, -14.471599578857422, -13.725079536437988, -12.978559494018555, -12.232039451599121, -11.485519409179688, -10.738999366760254, -9.99247932434082, -9.245959281921387, -8.499439239501953, -7.752920150756836, -7.006400108337402, -6.259880065917969, -5.513360500335693, -4.76684045791626, -4.020320415496826, -3.273800849914551, -2.527280807495117, -1.7807610034942627, -1.0342411994934082, -0.2877211570739746, 0.4587984085083008, 1.2053184509277344, 1.9518382549285889, 2.6983580589294434, 3.444878101348877, 4.191397666931152, 4.937917709350586, 5.6844377517700195, 6.430957317352295, 7.1774773597717285, 7.923997402191162, 8.670516967773438, 9.417037010192871, 10.163557052612305, 10.910076141357422, 11.656597137451172, 12.403116226196289, 13.149636268615723, 13.896156311035156, 14.64267635345459, 15.389196395874023, 16.13571548461914, 16.88223648071289, 17.628755569458008, 18.375274658203125, 19.121795654296875, 19.868314743041992, 20.614835739135742, 21.36135482788086, 22.10787582397461, 22.854394912719727, 23.600914001464844, 24.347434997558594, 25.09395408630371]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 1.0, 7.0, 3.0, 11.0, 13.0, 11.0, 13.0, 27.0, 31.0, 39.0, 57.0, 74.0, 92.0, 142.0, 225.0, 260.0, 435.0, 660.0, 1042.0, 1433.0, 2065.0, 2873.0, 3630.0, 1025480.0, 3391.0, 2465.0, 1929.0, 1324.0, 886.0, 619.0, 411.0, 272.0, 164.0, 123.0, 82.0, 77.0, 56.0, 42.0, 25.0, 26.0, 21.0, 20.0, 8.0, 12.0, 10.0, 8.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-258.6935119628906, -250.44822692871094, -242.2029266357422, -233.9576416015625, -225.7123565673828, -217.46707153320312, -209.22177124023438, -200.9764862060547, -192.731201171875, -184.4859161376953, -176.24061584472656, -167.99533081054688, -159.7500457763672, -151.5047607421875, -143.25946044921875, -135.01417541503906, -126.76887512207031, -118.5235824584961, -110.2782974243164, -102.03300476074219, -93.7877197265625, -85.54242706298828, -77.29713439941406, -69.05184936523438, -60.806556701660156, -52.5612678527832, -44.31597900390625, -36.07068634033203, -27.825397491455078, -19.580108642578125, -11.334815979003906, -3.089527130126953, 5.15576171875, 13.40105152130127, 21.64634132385254, 29.891632080078125, 38.13692092895508, 46.38220977783203, 54.62750244140625, 62.8727912902832, 71.11808013916016, 79.36337280273438, 87.60865783691406, 95.85395050048828, 104.0992431640625, 112.34452819824219, 120.5898208618164, 128.83511352539062, 137.0803985595703, 145.32568359375, 153.57098388671875, 161.81626892089844, 170.06155395507812, 178.30685424804688, 186.55213928222656, 194.79742431640625, 203.042724609375, 211.2880096435547, 219.53330993652344, 227.77859497070312, 236.0238800048828, 244.2691650390625, 252.51446533203125, 260.759765625, 269.0050354003906]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 5.0, 11.0, 6.0, 9.0, 16.0, 14.0, 19.0, 31.0, 34.0, 30.0, 44.0, 76.0, 76.0, 106.0, 112.0, 167.0, 221.0, 247.0, 338.0, 485.0, 725.0, 1048.0, 1631.0, 2549.0, 4371.0, 8141.0, 18064.0, 51362288.0, 42859.0, 11473.0, 5912.0, 3471.0, 2130.0, 1288.0, 879.0, 601.0, 401.0, 335.0, 253.0, 181.0, 161.0, 114.0, 99.0, 65.0, 61.0, 45.0, 39.0, 25.0, 20.0, 16.0, 13.0, 10.0, 9.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 4.0], "bins": [-255.2211151123047, -247.1879425048828, -239.15478515625, -231.12161254882812, -223.08843994140625, -215.05526733398438, -207.02210998535156, -198.9889373779297, -190.95578002929688, -182.922607421875, -174.8894500732422, -166.8562774658203, -158.82310485839844, -150.78994750976562, -142.75677490234375, -134.72360229492188, -126.6904296875, -118.65726470947266, -110.62409210205078, -102.59092712402344, -94.55775451660156, -86.52458953857422, -78.49142456054688, -70.458251953125, -62.425086975097656, -54.39191818237305, -46.35874938964844, -38.325584411621094, -30.292415618896484, -22.259246826171875, -14.226081848144531, -6.192913055419922, 1.840240478515625, 9.873408317565918, 17.90657615661621, 25.939743041992188, 33.9729118347168, 42.006080627441406, 50.03924560546875, 58.07241439819336, 66.10558319091797, 74.13874816894531, 82.17192077636719, 90.20508575439453, 98.23825073242188, 106.27142333984375, 114.3045883178711, 122.33775329589844, 130.3709259033203, 138.4040985107422, 146.437255859375, 154.47042846679688, 162.50360107421875, 170.53677368164062, 178.56993103027344, 186.6031036376953, 194.63626098632812, 202.66943359375, 210.7025909423828, 218.7357635498047, 226.76893615722656, 234.80209350585938, 242.83526611328125, 250.86843872070312, 258.901611328125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 7.0, 13.0, 10.0, 13.0, 25.0, 30.0, 42.0, 39.0, 57.0, 70.0, 81.0, 96.0, 75.0, 90.0, 74.0, 67.0, 51.0, 32.0, 39.0, 22.0, 15.0, 12.0, 11.0, 7.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.27764892578125, -109.9367904663086, -103.59593200683594, -97.25507354736328, -90.91421508789062, -84.57335662841797, -78.23249816894531, -71.89164733886719, -65.55078125, -59.209922790527344, -52.86906433105469, -46.52820587158203, -40.187347412109375, -33.84648895263672, -27.505634307861328, -21.164775848388672, -14.823921203613281, -8.483062744140625, -2.142205238342285, 4.198652267456055, 10.539510726928711, 16.880369186401367, 23.22122573852539, 29.562084197998047, 35.9029426574707, 42.24380111694336, 48.584659576416016, 54.925514221191406, 61.26637268066406, 67.60723114013672, 73.94808959960938, 80.28894805908203, 86.62980651855469, 92.97066497802734, 99.3115234375, 105.65238189697266, 111.99324035644531, 118.33409881591797, 124.67495727539062, 131.01580810546875, 137.35667419433594, 143.69752502441406, 150.03839111328125, 156.37924194335938, 162.72010803222656, 169.0609588623047, 175.40182495117188, 181.74267578125, 188.08352661132812, 194.42437744140625, 200.76524353027344, 207.10609436035156, 213.44696044921875, 219.78781127929688, 226.12867736816406, 232.4695281982422, 238.81039428710938, 245.1512451171875, 251.4921112060547, 257.8329772949219, 264.173828125, 270.5146789550781, 276.85552978515625, 283.1964111328125, 289.5372619628906]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 7.0, 18.0, 13.0, 15.0, 23.0, 33.0, 24.0, 27.0, 35.0, 43.0, 66.0, 56.0, 74.0, 86.0, 69.0, 66.0, 66.0, 41.0, 36.0, 28.0, 26.0, 26.0, 23.0, 21.0, 16.0, 16.0, 8.0, 7.0, 5.0, 6.0, 1.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-242.6728515625, -235.62342834472656, -228.57400512695312, -221.5245819091797, -214.47515869140625, -207.4257354736328, -200.37631225585938, -193.326904296875, -186.2774658203125, -179.22804260253906, -172.17861938476562, -165.1291961669922, -158.07977294921875, -151.0303497314453, -143.98092651367188, -136.9315185546875, -129.88209533691406, -122.83267211914062, -115.78324890136719, -108.73382568359375, -101.68440246582031, -94.63497924804688, -87.58556365966797, -80.53614044189453, -73.4867172241211, -66.43729400634766, -59.38787078857422, -52.33845138549805, -45.28902816772461, -38.23960494995117, -31.190185546875, -24.140762329101562, -17.091354370117188, -10.041932106018066, -2.9925098419189453, 4.056911468505859, 11.106334686279297, 18.155757904052734, 25.205177307128906, 32.254600524902344, 39.30402374267578, 46.35344696044922, 53.402870178222656, 60.45228958129883, 67.501708984375, 74.55113220214844, 81.60055541992188, 88.64997863769531, 95.69940185546875, 102.74882507324219, 109.79824829101562, 116.84767150878906, 123.8970947265625, 130.94651794433594, 137.99594116210938, 145.04534912109375, 152.09478759765625, 159.1442108154297, 166.19363403320312, 173.24305725097656, 180.29248046875, 187.34190368652344, 194.39132690429688, 201.44073486328125, 208.4901580810547]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 9.0, 9.0, 14.0, 14.0, 20.0, 29.0, 61.0, 92.0, 140.0, 237.0, 357.0, 641.0, 1060.0, 2000.0, 3972.0, 8654.0, 21970.0, 76550.0, 542762.0, 3292057.0, 184971.0, 36598.0, 12070.0, 4868.0, 2250.0, 1203.0, 662.0, 375.0, 237.0, 135.0, 81.0, 76.0, 38.0, 27.0, 16.0, 12.0, 5.0, 9.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.7265625, -10.4306640625, -10.134765625, -9.8388671875, -9.54296875, -9.2470703125, -8.951171875, -8.6552734375, -8.359375, -8.0634765625, -7.767578125, -7.4716796875, -7.17578125, -6.8798828125, -6.583984375, -6.2880859375, -5.9921875, -5.6962890625, -5.400390625, -5.1044921875, -4.80859375, -4.5126953125, -4.216796875, -3.9208984375, -3.625, -3.3291015625, -3.033203125, -2.7373046875, -2.44140625, -2.1455078125, -1.849609375, -1.5537109375, -1.2578125, -0.9619140625, -0.666015625, -0.3701171875, -0.07421875, 0.2216796875, 0.517578125, 0.8134765625, 1.109375, 1.4052734375, 1.701171875, 1.9970703125, 2.29296875, 2.5888671875, 2.884765625, 3.1806640625, 3.4765625, 3.7724609375, 4.068359375, 4.3642578125, 4.66015625, 4.9560546875, 5.251953125, 5.5478515625, 5.84375, 6.1396484375, 6.435546875, 6.7314453125, 7.02734375, 7.3232421875, 7.619140625, 7.9150390625, 8.2109375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 2.0, 2.0, 5.0, 8.0, 8.0, 10.0, 11.0, 29.0, 35.0, 51.0, 70.0, 81.0, 118.0, 130.0, 109.0, 93.0, 87.0, 54.0, 24.0, 19.0, 16.0, 13.0, 10.0, 3.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.669921875, -0.6478500366210938, -0.6257781982421875, -0.6037063598632812, -0.581634521484375, -0.5595626831054688, -0.5374908447265625, -0.5154190063476562, -0.49334716796875, -0.47127532958984375, -0.4492034912109375, -0.42713165283203125, -0.405059814453125, -0.38298797607421875, -0.3609161376953125, -0.33884429931640625, -0.3167724609375, -0.29470062255859375, -0.2726287841796875, -0.25055694580078125, -0.228485107421875, -0.20641326904296875, -0.1843414306640625, -0.16226959228515625, -0.14019775390625, -0.11812591552734375, -0.0960540771484375, -0.07398223876953125, -0.051910400390625, -0.02983856201171875, -0.0077667236328125, 0.01430511474609375, 0.036376953125, 0.05844879150390625, 0.0805206298828125, 0.10259246826171875, 0.124664306640625, 0.14673614501953125, 0.1688079833984375, 0.19087982177734375, 0.21295166015625, 0.23502349853515625, 0.2570953369140625, 0.27916717529296875, 0.301239013671875, 0.32331085205078125, 0.3453826904296875, 0.36745452880859375, 0.3895263671875, 0.41159820556640625, 0.4336700439453125, 0.45574188232421875, 0.477813720703125, 0.49988555908203125, 0.5219573974609375, 0.5440292358398438, 0.56610107421875, 0.5881729125976562, 0.6102447509765625, 0.6323165893554688, 0.654388427734375, 0.6764602661132812, 0.6985321044921875, 0.7206039428710938, 0.74267578125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 9.0, 16.0, 13.0, 27.0, 25.0, 43.0, 69.0, 91.0, 128.0, 177.0, 295.0, 523.0, 816.0, 1431.0, 2564.0, 4426.0, 8846.0, 18549.0, 41679.0, 106765.0, 336810.0, 2249787.0, 1037100.0, 238927.0, 80710.0, 32861.0, 15003.0, 7337.0, 3859.0, 2104.0, 1203.0, 763.0, 460.0, 277.0, 176.0, 107.0, 82.0, 61.0, 46.0, 26.0, 22.0, 21.0, 11.0, 12.0, 8.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.73046875, -4.57720947265625, -4.4239501953125, -4.27069091796875, -4.117431640625, -3.96417236328125, -3.8109130859375, -3.65765380859375, -3.50439453125, -3.35113525390625, -3.1978759765625, -3.04461669921875, -2.891357421875, -2.73809814453125, -2.5848388671875, -2.43157958984375, -2.2783203125, -2.12506103515625, -1.9718017578125, -1.81854248046875, -1.665283203125, -1.51202392578125, -1.3587646484375, -1.20550537109375, -1.05224609375, -0.89898681640625, -0.7457275390625, -0.59246826171875, -0.439208984375, -0.28594970703125, -0.1326904296875, 0.02056884765625, 0.173828125, 0.32708740234375, 0.4803466796875, 0.63360595703125, 0.786865234375, 0.94012451171875, 1.0933837890625, 1.24664306640625, 1.39990234375, 1.55316162109375, 1.7064208984375, 1.85968017578125, 2.012939453125, 2.16619873046875, 2.3194580078125, 2.47271728515625, 2.6259765625, 2.77923583984375, 2.9324951171875, 3.08575439453125, 3.239013671875, 3.39227294921875, 3.5455322265625, 3.69879150390625, 3.85205078125, 4.00531005859375, 4.1585693359375, 4.31182861328125, 4.465087890625, 4.61834716796875, 4.7716064453125, 4.92486572265625, 5.078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 9.0, 7.0, 8.0, 15.0, 17.0, 17.0, 21.0, 27.0, 35.0, 50.0, 47.0, 90.0, 93.0, 121.0, 157.0, 196.0, 245.0, 434.0, 966.0, 382.0, 278.0, 182.0, 146.0, 126.0, 89.0, 73.0, 47.0, 32.0, 34.0, 19.0, 21.0, 14.0, 14.0, 4.0, 9.0, 15.0, 7.0, 5.0, 7.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.3349609375, -1.28961181640625, -1.2442626953125, -1.19891357421875, -1.153564453125, -1.10821533203125, -1.0628662109375, -1.01751708984375, -0.97216796875, -0.92681884765625, -0.8814697265625, -0.83612060546875, -0.790771484375, -0.74542236328125, -0.7000732421875, -0.65472412109375, -0.609375, -0.56402587890625, -0.5186767578125, -0.47332763671875, -0.427978515625, -0.38262939453125, -0.3372802734375, -0.29193115234375, -0.24658203125, -0.20123291015625, -0.1558837890625, -0.11053466796875, -0.065185546875, -0.01983642578125, 0.0255126953125, 0.07086181640625, 0.1162109375, 0.16156005859375, 0.2069091796875, 0.25225830078125, 0.297607421875, 0.34295654296875, 0.3883056640625, 0.43365478515625, 0.47900390625, 0.52435302734375, 0.5697021484375, 0.61505126953125, 0.660400390625, 0.70574951171875, 0.7510986328125, 0.79644775390625, 0.841796875, 0.88714599609375, 0.9324951171875, 0.97784423828125, 1.023193359375, 1.06854248046875, 1.1138916015625, 1.15924072265625, 1.20458984375, 1.24993896484375, 1.2952880859375, 1.34063720703125, 1.385986328125, 1.43133544921875, 1.4766845703125, 1.52203369140625, 1.5673828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 8.0, 8.0, 13.0, 12.0, 25.0, 23.0, 20.0, 21.0, 33.0, 36.0, 46.0, 57.0, 59.0, 60.0, 61.0, 53.0, 59.0, 57.0, 58.0, 42.0, 51.0, 39.0, 27.0, 24.0, 19.0, 19.0, 8.0, 19.0, 6.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.321364402770996, -6.098531723022461, -5.875699520111084, -5.652866840362549, -5.430034637451172, -5.207201957702637, -4.984369277954102, -4.761537075042725, -4.538704872131348, -4.3158721923828125, -4.0930399894714355, -3.8702073097229004, -3.6473751068115234, -3.4245424270629883, -3.2017099857330322, -2.978877544403076, -2.756044864654541, -2.533212423324585, -2.310379981994629, -2.0875473022460938, -1.8647149801254272, -1.6418825387954712, -1.4190499782562256, -1.1962175369262695, -0.9733850955963135, -0.7505526542663574, -0.5277201533317566, -0.30488765239715576, -0.08205521106719971, 0.14077723026275635, 0.36360979080200195, 0.586442232131958, 0.8092751502990723, 1.0321075916290283, 1.2549400329589844, 1.47777259349823, 1.700605034828186, 1.923437476158142, 2.1462700366973877, 2.3691024780273438, 2.5919349193573, 2.814767360687256, 3.037599802017212, 3.260432243347168, 3.483264923095703, 3.70609712600708, 3.9289298057556152, 4.151762008666992, 4.374594688415527, 4.5974273681640625, 4.8202595710754395, 5.043092250823975, 5.265924453735352, 5.488757133483887, 5.711589813232422, 5.934422016143799, 6.157254219055176, 6.380086898803711, 6.602919101715088, 6.825751781463623, 7.048583984375, 7.271416664123535, 7.49424934387207, 7.717081546783447, 7.939914226531982]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 7.0, 2.0, 7.0, 7.0, 9.0, 14.0, 15.0, 13.0, 25.0, 15.0, 19.0, 32.0, 28.0, 26.0, 37.0, 41.0, 47.0, 48.0, 48.0, 48.0, 51.0, 53.0, 49.0, 45.0, 36.0, 34.0, 30.0, 38.0, 29.0, 23.0, 24.0, 15.0, 12.0, 16.0, 12.0, 12.0, 3.0, 8.0, 5.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.141359329223633, -6.920445442199707, -6.699531555175781, -6.4786176681518555, -6.25770378112793, -6.036789894104004, -5.81587553024292, -5.594961643218994, -5.374047756195068, -5.153133869171143, -4.932219982147217, -4.711306095123291, -4.490391731262207, -4.269477844238281, -4.0485639572143555, -3.8276500701904297, -3.606736183166504, -3.385822296142578, -3.1649084091186523, -2.9439942836761475, -2.7230803966522217, -2.502166509628296, -2.281252384185791, -2.0603384971618652, -1.8394246101379395, -1.6185107231140137, -1.3975967168807983, -1.176682710647583, -0.9557688236236572, -0.7348549365997314, -0.5139409303665161, -0.2930269241333008, -0.072113037109375, 0.14880090951919556, 0.3697148561477661, 0.5906288027763367, 0.8115427494049072, 1.032456636428833, 1.2533706426620483, 1.4742846488952637, 1.6951985359191895, 1.9161124229431152, 2.137026309967041, 2.357940435409546, 2.5788543224334717, 2.7997682094573975, 3.0206823348999023, 3.241596221923828, 3.462510108947754, 3.6834239959716797, 3.9043378829956055, 4.125251770019531, 4.346165657043457, 4.567079544067383, 4.787993907928467, 5.008907794952393, 5.229821681976318, 5.450735569000244, 5.67164945602417, 5.892563343048096, 6.11347770690918, 6.3343915939331055, 6.555305480957031, 6.776219367980957, 6.997133255004883]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 6.0, 5.0, 11.0, 13.0, 15.0, 31.0, 36.0, 54.0, 92.0, 141.0, 176.0, 295.0, 513.0, 885.0, 1598.0, 3057.0, 6733.0, 17393.0, 57782.0, 268119.0, 514631.0, 124566.0, 31743.0, 10825.0, 4618.0, 2213.0, 1207.0, 652.0, 365.0, 257.0, 170.0, 109.0, 74.0, 44.0, 29.0, 24.0, 18.0, 13.0, 9.0, 6.0, 6.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.9765625, -8.689453125, -8.40234375, -8.115234375, -7.828125, -7.541015625, -7.25390625, -6.966796875, -6.6796875, -6.392578125, -6.10546875, -5.818359375, -5.53125, -5.244140625, -4.95703125, -4.669921875, -4.3828125, -4.095703125, -3.80859375, -3.521484375, -3.234375, -2.947265625, -2.66015625, -2.373046875, -2.0859375, -1.798828125, -1.51171875, -1.224609375, -0.9375, -0.650390625, -0.36328125, -0.076171875, 0.2109375, 0.498046875, 0.78515625, 1.072265625, 1.359375, 1.646484375, 1.93359375, 2.220703125, 2.5078125, 2.794921875, 3.08203125, 3.369140625, 3.65625, 3.943359375, 4.23046875, 4.517578125, 4.8046875, 5.091796875, 5.37890625, 5.666015625, 5.953125, 6.240234375, 6.52734375, 6.814453125, 7.1015625, 7.388671875, 7.67578125, 7.962890625, 8.25, 8.537109375, 8.82421875, 9.111328125, 9.3984375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 6.0, 2.0, 4.0, 9.0, 13.0, 16.0, 22.0, 22.0, 58.0, 44.0, 58.0, 66.0, 94.0, 98.0, 99.0, 101.0, 78.0, 54.0, 36.0, 33.0, 28.0, 20.0, 16.0, 8.0, 5.0, 3.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6953125, -0.6726303100585938, -0.6499481201171875, -0.6272659301757812, -0.604583740234375, -0.5819015502929688, -0.5592193603515625, -0.5365371704101562, -0.51385498046875, -0.49117279052734375, -0.4684906005859375, -0.44580841064453125, -0.423126220703125, -0.40044403076171875, -0.3777618408203125, -0.35507965087890625, -0.3323974609375, -0.30971527099609375, -0.2870330810546875, -0.26435089111328125, -0.241668701171875, -0.21898651123046875, -0.1963043212890625, -0.17362213134765625, -0.15093994140625, -0.12825775146484375, -0.1055755615234375, -0.08289337158203125, -0.060211181640625, -0.03752899169921875, -0.0148468017578125, 0.00783538818359375, 0.030517578125, 0.05319976806640625, 0.0758819580078125, 0.09856414794921875, 0.121246337890625, 0.14392852783203125, 0.1666107177734375, 0.18929290771484375, 0.21197509765625, 0.23465728759765625, 0.2573394775390625, 0.28002166748046875, 0.302703857421875, 0.32538604736328125, 0.3480682373046875, 0.37075042724609375, 0.3934326171875, 0.41611480712890625, 0.4387969970703125, 0.46147918701171875, 0.484161376953125, 0.5068435668945312, 0.5295257568359375, 0.5522079467773438, 0.57489013671875, 0.5975723266601562, 0.6202545166015625, 0.6429367065429688, 0.665618896484375, 0.6883010864257812, 0.7109832763671875, 0.7336654663085938, 0.75634765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 11.0, 11.0, 13.0, 26.0, 20.0, 37.0, 61.0, 85.0, 120.0, 190.0, 293.0, 447.0, 815.0, 1401.0, 2399.0, 4462.0, 8661.0, 19865.0, 67595.0, 417823.0, 417746.0, 67624.0, 19704.0, 8771.0, 4363.0, 2470.0, 1335.0, 852.0, 470.0, 316.0, 190.0, 131.0, 74.0, 51.0, 41.0, 15.0, 15.0, 13.0, 16.0, 10.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.515625, -8.24951171875, -7.9833984375, -7.71728515625, -7.451171875, -7.18505859375, -6.9189453125, -6.65283203125, -6.38671875, -6.12060546875, -5.8544921875, -5.58837890625, -5.322265625, -5.05615234375, -4.7900390625, -4.52392578125, -4.2578125, -3.99169921875, -3.7255859375, -3.45947265625, -3.193359375, -2.92724609375, -2.6611328125, -2.39501953125, -2.12890625, -1.86279296875, -1.5966796875, -1.33056640625, -1.064453125, -0.79833984375, -0.5322265625, -0.26611328125, 0.0, 0.26611328125, 0.5322265625, 0.79833984375, 1.064453125, 1.33056640625, 1.5966796875, 1.86279296875, 2.12890625, 2.39501953125, 2.6611328125, 2.92724609375, 3.193359375, 3.45947265625, 3.7255859375, 3.99169921875, 4.2578125, 4.52392578125, 4.7900390625, 5.05615234375, 5.322265625, 5.58837890625, 5.8544921875, 6.12060546875, 6.38671875, 6.65283203125, 6.9189453125, 7.18505859375, 7.451171875, 7.71728515625, 7.9833984375, 8.24951171875, 8.515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 10.0, 6.0, 12.0, 7.0, 6.0, 17.0, 16.0, 21.0, 23.0, 17.0, 27.0, 28.0, 36.0, 38.0, 33.0, 43.0, 37.0, 45.0, 35.0, 38.0, 53.0, 42.0, 40.0, 49.0, 33.0, 31.0, 40.0, 33.0, 26.0, 25.0, 25.0, 14.0, 17.0, 23.0, 12.0, 13.0, 12.0, 1.0, 8.0, 2.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4921875, -3.376800537109375, -3.26141357421875, -3.146026611328125, -3.0306396484375, -2.915252685546875, -2.79986572265625, -2.684478759765625, -2.569091796875, -2.453704833984375, -2.33831787109375, -2.222930908203125, -2.1075439453125, -1.992156982421875, -1.87677001953125, -1.761383056640625, -1.64599609375, -1.530609130859375, -1.41522216796875, -1.299835205078125, -1.1844482421875, -1.069061279296875, -0.95367431640625, -0.838287353515625, -0.722900390625, -0.607513427734375, -0.49212646484375, -0.376739501953125, -0.2613525390625, -0.145965576171875, -0.03057861328125, 0.084808349609375, 0.2001953125, 0.315582275390625, 0.43096923828125, 0.546356201171875, 0.6617431640625, 0.777130126953125, 0.89251708984375, 1.007904052734375, 1.123291015625, 1.238677978515625, 1.35406494140625, 1.469451904296875, 1.5848388671875, 1.700225830078125, 1.81561279296875, 1.930999755859375, 2.04638671875, 2.161773681640625, 2.27716064453125, 2.392547607421875, 2.5079345703125, 2.623321533203125, 2.73870849609375, 2.854095458984375, 2.969482421875, 3.084869384765625, 3.20025634765625, 3.315643310546875, 3.4310302734375, 3.546417236328125, 3.66180419921875, 3.777191162109375, 3.892578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 6.0, 8.0, 4.0, 10.0, 8.0, 13.0, 19.0, 34.0, 47.0, 60.0, 94.0, 122.0, 197.0, 301.0, 445.0, 742.0, 1204.0, 2062.0, 3860.0, 7645.0, 17715.0, 49692.0, 225096.0, 548921.0, 128798.0, 34309.0, 13243.0, 6157.0, 3134.0, 1682.0, 1013.0, 629.0, 418.0, 266.0, 183.0, 133.0, 90.0, 69.0, 44.0, 29.0, 15.0, 15.0, 5.0, 6.0, 4.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-5.99609375, -5.8106689453125, -5.625244140625, -5.4398193359375, -5.25439453125, -5.0689697265625, -4.883544921875, -4.6981201171875, -4.5126953125, -4.3272705078125, -4.141845703125, -3.9564208984375, -3.77099609375, -3.5855712890625, -3.400146484375, -3.2147216796875, -3.029296875, -2.8438720703125, -2.658447265625, -2.4730224609375, -2.28759765625, -2.1021728515625, -1.916748046875, -1.7313232421875, -1.5458984375, -1.3604736328125, -1.175048828125, -0.9896240234375, -0.80419921875, -0.6187744140625, -0.433349609375, -0.2479248046875, -0.0625, 0.1229248046875, 0.308349609375, 0.4937744140625, 0.67919921875, 0.8646240234375, 1.050048828125, 1.2354736328125, 1.4208984375, 1.6063232421875, 1.791748046875, 1.9771728515625, 2.16259765625, 2.3480224609375, 2.533447265625, 2.7188720703125, 2.904296875, 3.0897216796875, 3.275146484375, 3.4605712890625, 3.64599609375, 3.8314208984375, 4.016845703125, 4.2022705078125, 4.3876953125, 4.5731201171875, 4.758544921875, 4.9439697265625, 5.12939453125, 5.3148193359375, 5.500244140625, 5.6856689453125, 5.87109375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 6.0, 12.0, 12.0, 19.0, 27.0, 29.0, 57.0, 72.0, 133.0, 155.0, 147.0, 105.0, 60.0, 46.0, 27.0, 21.0, 14.0, 9.0, 6.0, 10.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010309219360351562, -0.0009960383176803589, -0.0009611546993255615, -0.0009262710809707642, -0.0008913874626159668, -0.0008565038442611694, -0.0008216202259063721, -0.0007867366075515747, -0.0007518529891967773, -0.00071696937084198, -0.0006820857524871826, -0.0006472021341323853, -0.0006123185157775879, -0.0005774348974227905, -0.0005425512790679932, -0.0005076676607131958, -0.00047278404235839844, -0.0004379004240036011, -0.0004030168056488037, -0.00036813318729400635, -0.000333249568939209, -0.0002983659505844116, -0.00026348233222961426, -0.0002285987138748169, -0.00019371509552001953, -0.00015883147716522217, -0.0001239478588104248, -8.906424045562744e-05, -5.418062210083008e-05, -1.9297003746032715e-05, 1.558661460876465e-05, 5.047023296356201e-05, 8.535385131835938e-05, 0.00012023746967315674, 0.0001551210880279541, 0.00019000470638275146, 0.00022488832473754883, 0.0002597719430923462, 0.00029465556144714355, 0.0003295391798019409, 0.0003644227981567383, 0.00039930641651153564, 0.000434190034866333, 0.00046907365322113037, 0.0005039572715759277, 0.0005388408899307251, 0.0005737245082855225, 0.0006086081266403198, 0.0006434917449951172, 0.0006783753633499146, 0.0007132589817047119, 0.0007481426000595093, 0.0007830262184143066, 0.000817909836769104, 0.0008527934551239014, 0.0008876770734786987, 0.0009225606918334961, 0.0009574443101882935, 0.0009923279285430908, 0.0010272115468978882, 0.0010620951652526855, 0.001096978783607483, 0.0011318624019622803, 0.0011667460203170776, 0.001201629638671875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 10.0, 7.0, 15.0, 26.0, 30.0, 33.0, 51.0, 84.0, 107.0, 164.0, 237.0, 348.0, 549.0, 803.0, 1348.0, 2226.0, 3938.0, 6998.0, 14465.0, 36453.0, 144708.0, 544082.0, 208674.0, 46821.0, 17113.0, 8262.0, 4181.0, 2570.0, 1506.0, 922.0, 583.0, 376.0, 245.0, 183.0, 117.0, 99.0, 56.0, 42.0, 33.0, 24.0, 18.0, 17.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.974609375, -3.840362548828125, -3.70611572265625, -3.571868896484375, -3.4376220703125, -3.303375244140625, -3.16912841796875, -3.034881591796875, -2.900634765625, -2.766387939453125, -2.63214111328125, -2.497894287109375, -2.3636474609375, -2.229400634765625, -2.09515380859375, -1.960906982421875, -1.82666015625, -1.692413330078125, -1.55816650390625, -1.423919677734375, -1.2896728515625, -1.155426025390625, -1.02117919921875, -0.886932373046875, -0.752685546875, -0.618438720703125, -0.48419189453125, -0.349945068359375, -0.2156982421875, -0.081451416015625, 0.05279541015625, 0.187042236328125, 0.3212890625, 0.455535888671875, 0.58978271484375, 0.724029541015625, 0.8582763671875, 0.992523193359375, 1.12677001953125, 1.261016845703125, 1.395263671875, 1.529510498046875, 1.66375732421875, 1.798004150390625, 1.9322509765625, 2.066497802734375, 2.20074462890625, 2.334991455078125, 2.46923828125, 2.603485107421875, 2.73773193359375, 2.871978759765625, 3.0062255859375, 3.140472412109375, 3.27471923828125, 3.408966064453125, 3.543212890625, 3.677459716796875, 3.81170654296875, 3.945953369140625, 4.0802001953125, 4.214447021484375, 4.34869384765625, 4.482940673828125, 4.6171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 4.0, 4.0, 4.0, 3.0, 11.0, 8.0, 14.0, 12.0, 10.0, 12.0, 20.0, 19.0, 22.0, 28.0, 43.0, 46.0, 33.0, 46.0, 45.0, 63.0, 48.0, 51.0, 52.0, 63.0, 52.0, 44.0, 37.0, 26.0, 34.0, 29.0, 20.0, 22.0, 13.0, 15.0, 8.0, 9.0, 13.0, 9.0, 3.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.671875, -1.61285400390625, -1.5538330078125, -1.49481201171875, -1.435791015625, -1.37677001953125, -1.3177490234375, -1.25872802734375, -1.19970703125, -1.14068603515625, -1.0816650390625, -1.02264404296875, -0.963623046875, -0.90460205078125, -0.8455810546875, -0.78656005859375, -0.7275390625, -0.66851806640625, -0.6094970703125, -0.55047607421875, -0.491455078125, -0.43243408203125, -0.3734130859375, -0.31439208984375, -0.25537109375, -0.19635009765625, -0.1373291015625, -0.07830810546875, -0.019287109375, 0.03973388671875, 0.0987548828125, 0.15777587890625, 0.216796875, 0.27581787109375, 0.3348388671875, 0.39385986328125, 0.452880859375, 0.51190185546875, 0.5709228515625, 0.62994384765625, 0.68896484375, 0.74798583984375, 0.8070068359375, 0.86602783203125, 0.925048828125, 0.98406982421875, 1.0430908203125, 1.10211181640625, 1.1611328125, 1.22015380859375, 1.2791748046875, 1.33819580078125, 1.397216796875, 1.45623779296875, 1.5152587890625, 1.57427978515625, 1.63330078125, 1.69232177734375, 1.7513427734375, 1.81036376953125, 1.869384765625, 1.92840576171875, 1.9874267578125, 2.04644775390625, 2.10546875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 13.0, 14.0, 37.0, 121.0, 318.0, 272.0, 106.0, 23.0, 16.0, 15.0, 9.0, 7.0, 2.0, 6.0, 3.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.59197998046875, -153.92050170898438, -150.24903869628906, -146.5775604248047, -142.90609741210938, -139.234619140625, -135.5631561279297, -131.8916778564453, -128.22021484375, -124.54874420166016, -120.87727355957031, -117.20580291748047, -113.53433227539062, -109.86286163330078, -106.19139099121094, -102.51991271972656, -98.84844207763672, -95.17697143554688, -91.50550079345703, -87.83403015136719, -84.16255950927734, -80.4910888671875, -76.81961059570312, -73.14814758300781, -69.47666931152344, -65.8051986694336, -62.13372802734375, -58.462257385253906, -54.79078674316406, -51.11931610107422, -47.44784164428711, -43.776371002197266, -40.10490417480469, -36.433433532714844, -32.761962890625, -29.090490341186523, -25.41901969909668, -21.747549057006836, -18.07607650756836, -14.404605865478516, -10.733135223388672, -7.06166410446167, -3.390192985534668, 0.2812786102294922, 3.952749252319336, 7.62421989440918, 11.295692443847656, 14.9671630859375, 18.638633728027344, 22.310104370117188, 25.98157501220703, 29.653047561645508, 33.32451629638672, 36.99598693847656, 40.66746139526367, 44.338932037353516, 48.01040267944336, 51.6818733215332, 55.35334396362305, 59.024818420410156, 62.6962890625, 66.36775970458984, 70.03923034667969, 73.71070098876953, 77.38217163085938]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 8.0, 8.0, 10.0, 15.0, 24.0, 45.0, 73.0, 121.0, 147.0, 172.0, 131.0, 86.0, 50.0, 35.0, 16.0, 4.0, 12.0, 10.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-83.10597229003906, -80.67865753173828, -78.2513427734375, -75.82402801513672, -73.39671325683594, -70.96940612792969, -68.54208374023438, -66.11477661132812, -63.687461853027344, -61.26014709472656, -58.83283233642578, -56.405517578125, -53.978206634521484, -51.5508918762207, -49.12357711791992, -46.696266174316406, -44.26894760131836, -41.84163284301758, -39.4143180847168, -36.98700714111328, -34.5596923828125, -32.13237762451172, -29.705062866210938, -27.27775001525879, -24.850435256958008, -22.423120498657227, -19.995807647705078, -17.568492889404297, -15.141179084777832, -12.713865280151367, -10.286550521850586, -7.8592376708984375, -5.431922912597656, -3.0046088695526123, -0.5772948265075684, 1.8500194549560547, 4.2773332595825195, 6.704647064208984, 9.131961822509766, 11.559274673461914, 13.986589431762695, 16.413904190063477, 18.841217041015625, 21.268531799316406, 23.695846557617188, 26.123159408569336, 28.550474166870117, 30.977787017822266, 33.40510177612305, 35.83241653442383, 38.25973129272461, 40.687042236328125, 43.114356994628906, 45.54167175292969, 47.96898651123047, 50.39630126953125, 52.82361602783203, 55.25093078613281, 57.678245544433594, 60.105560302734375, 62.53287124633789, 64.96018981933594, 67.38749694824219, 69.81481170654297, 72.24212646484375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 7.0, 7.0, 11.0, 6.0, 15.0, 23.0, 28.0, 40.0, 47.0, 83.0, 106.0, 168.0, 262.0, 394.0, 664.0, 1203.0, 2230.0, 4730.0, 12543.0, 40005.0, 209370.0, 3663699.0, 197786.0, 38761.0, 11980.0, 4759.0, 2212.0, 1223.0, 663.0, 377.0, 289.0, 177.0, 124.0, 86.0, 44.0, 40.0, 34.0, 19.0, 15.0, 16.0, 7.0, 8.0, 7.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.15625, -19.51611328125, -18.8759765625, -18.23583984375, -17.595703125, -16.95556640625, -16.3154296875, -15.67529296875, -15.03515625, -14.39501953125, -13.7548828125, -13.11474609375, -12.474609375, -11.83447265625, -11.1943359375, -10.55419921875, -9.9140625, -9.27392578125, -8.6337890625, -7.99365234375, -7.353515625, -6.71337890625, -6.0732421875, -5.43310546875, -4.79296875, -4.15283203125, -3.5126953125, -2.87255859375, -2.232421875, -1.59228515625, -0.9521484375, -0.31201171875, 0.328125, 0.96826171875, 1.6083984375, 2.24853515625, 2.888671875, 3.52880859375, 4.1689453125, 4.80908203125, 5.44921875, 6.08935546875, 6.7294921875, 7.36962890625, 8.009765625, 8.64990234375, 9.2900390625, 9.93017578125, 10.5703125, 11.21044921875, 11.8505859375, 12.49072265625, 13.130859375, 13.77099609375, 14.4111328125, 15.05126953125, 15.69140625, 16.33154296875, 16.9716796875, 17.61181640625, 18.251953125, 18.89208984375, 19.5322265625, 20.17236328125, 20.8125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 14.0, 9.0, 13.0, 18.0, 32.0, 34.0, 50.0, 75.0, 64.0, 78.0, 83.0, 106.0, 78.0, 89.0, 59.0, 47.0, 37.0, 22.0, 22.0, 18.0, 11.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80859375, -0.7841110229492188, -0.7596282958984375, -0.7351455688476562, -0.710662841796875, -0.6861801147460938, -0.6616973876953125, -0.6372146606445312, -0.61273193359375, -0.5882492065429688, -0.5637664794921875, -0.5392837524414062, -0.514801025390625, -0.49031829833984375, -0.4658355712890625, -0.44135284423828125, -0.4168701171875, -0.39238739013671875, -0.3679046630859375, -0.34342193603515625, -0.318939208984375, -0.29445648193359375, -0.2699737548828125, -0.24549102783203125, -0.22100830078125, -0.19652557373046875, -0.1720428466796875, -0.14756011962890625, -0.123077392578125, -0.09859466552734375, -0.0741119384765625, -0.04962921142578125, -0.025146484375, -0.00066375732421875, 0.0238189697265625, 0.04830169677734375, 0.072784423828125, 0.09726715087890625, 0.1217498779296875, 0.14623260498046875, 0.17071533203125, 0.19519805908203125, 0.2196807861328125, 0.24416351318359375, 0.268646240234375, 0.29312896728515625, 0.3176116943359375, 0.34209442138671875, 0.3665771484375, 0.39105987548828125, 0.4155426025390625, 0.44002532958984375, 0.464508056640625, 0.48899078369140625, 0.5134735107421875, 0.5379562377929688, 0.56243896484375, 0.5869216918945312, 0.6114044189453125, 0.6358871459960938, 0.660369873046875, 0.6848526000976562, 0.7093353271484375, 0.7338180541992188, 0.75830078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 7.0, 7.0, 9.0, 17.0, 25.0, 42.0, 66.0, 89.0, 164.0, 302.0, 580.0, 1249.0, 2884.0, 7858.0, 27418.0, 140164.0, 2571778.0, 1292205.0, 114104.0, 23532.0, 6930.0, 2507.0, 1138.0, 517.0, 287.0, 147.0, 88.0, 55.0, 37.0, 20.0, 21.0, 8.0, 6.0, 1.0, 6.0, 7.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.546875, -18.0308837890625, -17.514892578125, -16.9989013671875, -16.48291015625, -15.9669189453125, -15.450927734375, -14.9349365234375, -14.4189453125, -13.9029541015625, -13.386962890625, -12.8709716796875, -12.35498046875, -11.8389892578125, -11.322998046875, -10.8070068359375, -10.291015625, -9.7750244140625, -9.259033203125, -8.7430419921875, -8.22705078125, -7.7110595703125, -7.195068359375, -6.6790771484375, -6.1630859375, -5.6470947265625, -5.131103515625, -4.6151123046875, -4.09912109375, -3.5831298828125, -3.067138671875, -2.5511474609375, -2.03515625, -1.5191650390625, -1.003173828125, -0.4871826171875, 0.02880859375, 0.5447998046875, 1.060791015625, 1.5767822265625, 2.0927734375, 2.6087646484375, 3.124755859375, 3.6407470703125, 4.15673828125, 4.6727294921875, 5.188720703125, 5.7047119140625, 6.220703125, 6.7366943359375, 7.252685546875, 7.7686767578125, 8.28466796875, 8.8006591796875, 9.316650390625, 9.8326416015625, 10.3486328125, 10.8646240234375, 11.380615234375, 11.8966064453125, 12.41259765625, 12.9285888671875, 13.444580078125, 13.9605712890625, 14.4765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 9.0, 9.0, 10.0, 20.0, 25.0, 43.0, 77.0, 102.0, 171.0, 291.0, 634.0, 1549.0, 480.0, 225.0, 151.0, 100.0, 49.0, 51.0, 26.0, 19.0, 9.0, 7.0, 8.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.35546875, -2.275177001953125, -2.19488525390625, -2.114593505859375, -2.0343017578125, -1.954010009765625, -1.87371826171875, -1.793426513671875, -1.713134765625, -1.632843017578125, -1.55255126953125, -1.472259521484375, -1.3919677734375, -1.311676025390625, -1.23138427734375, -1.151092529296875, -1.07080078125, -0.990509033203125, -0.91021728515625, -0.829925537109375, -0.7496337890625, -0.669342041015625, -0.58905029296875, -0.508758544921875, -0.428466796875, -0.348175048828125, -0.26788330078125, -0.187591552734375, -0.1072998046875, -0.027008056640625, 0.05328369140625, 0.133575439453125, 0.2138671875, 0.294158935546875, 0.37445068359375, 0.454742431640625, 0.5350341796875, 0.615325927734375, 0.69561767578125, 0.775909423828125, 0.856201171875, 0.936492919921875, 1.01678466796875, 1.097076416015625, 1.1773681640625, 1.257659912109375, 1.33795166015625, 1.418243408203125, 1.49853515625, 1.578826904296875, 1.65911865234375, 1.739410400390625, 1.8197021484375, 1.899993896484375, 1.98028564453125, 2.060577392578125, 2.140869140625, 2.221160888671875, 2.30145263671875, 2.381744384765625, 2.4620361328125, 2.542327880859375, 2.62261962890625, 2.702911376953125, 2.783203125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 15.0, 35.0, 63.0, 145.0, 251.0, 254.0, 121.0, 67.0, 28.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.80404281616211, -28.002899169921875, -27.20175552368164, -26.400611877441406, -25.599468231201172, -24.798324584960938, -23.99717903137207, -23.196035385131836, -22.3948917388916, -21.593748092651367, -20.792604446411133, -19.9914608001709, -19.19031524658203, -18.389171600341797, -17.588027954101562, -16.786884307861328, -15.985740661621094, -15.18459701538086, -14.383453369140625, -13.582308769226074, -12.78116512298584, -11.980021476745605, -11.178876876831055, -10.37773323059082, -9.576589584350586, -8.775445938110352, -7.974301815032959, -7.173157691955566, -6.372014045715332, -5.570870399475098, -4.769726276397705, -3.9685821533203125, -3.167438507080078, -2.3662946224212646, -1.5651507377624512, -0.7640068531036377, 0.03713703155517578, 0.8382806777954102, 1.6394248008728027, 2.4405689239501953, 3.2417125701904297, 4.042856216430664, 4.844000339508057, 5.645144462585449, 6.446288108825684, 7.247431755065918, 8.048576354980469, 8.849720001220703, 9.650863647460938, 10.452007293701172, 11.253150939941406, 12.054295539855957, 12.855439186096191, 13.656582832336426, 14.457727432250977, 15.258871078491211, 16.060014724731445, 16.86115837097168, 17.662302017211914, 18.46344566345215, 19.264591217041016, 20.06573486328125, 20.866878509521484, 21.66802215576172, 22.469165802001953]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 2.0, 5.0, 3.0, 4.0, 10.0, 7.0, 20.0, 19.0, 26.0, 28.0, 39.0, 44.0, 49.0, 68.0, 72.0, 86.0, 77.0, 77.0, 85.0, 58.0, 56.0, 46.0, 30.0, 23.0, 17.0, 11.0, 12.0, 9.0, 10.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.719928741455078, -7.384385108947754, -7.0488409996032715, -6.713296890258789, -6.377753257751465, -6.042209625244141, -5.706665515899658, -5.371121406555176, -5.035577774047852, -4.700034141540527, -4.364490032196045, -4.0289459228515625, -3.6934022903442383, -3.357858419418335, -3.0223145484924316, -2.6867706775665283, -2.351226806640625, -2.0156829357147217, -1.6801390647888184, -1.344595193862915, -1.0090513229370117, -0.6735074520111084, -0.3379635810852051, -0.002419710159301758, 0.33312416076660156, 0.6686680316925049, 1.0042119026184082, 1.3397557735443115, 1.6752996444702148, 2.010843515396118, 2.3463873863220215, 2.681931257247925, 3.0174760818481445, 3.353019952774048, 3.688563823699951, 4.024107933044434, 4.359651565551758, 4.695195198059082, 5.0307393074035645, 5.366283416748047, 5.701827049255371, 6.037370681762695, 6.372914791107178, 6.70845890045166, 7.044002532958984, 7.379546165466309, 7.715090274810791, 8.050634384155273, 8.386178016662598, 8.721721649169922, 9.057266235351562, 9.392809867858887, 9.728353500366211, 10.063897132873535, 10.39944076538086, 10.7349853515625, 11.070528984069824, 11.406072616577148, 11.741617202758789, 12.077160835266113, 12.412704467773438, 12.748248100280762, 13.083791732788086, 13.419336318969727, 13.75487995147705]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 7.0, 3.0, 9.0, 9.0, 14.0, 17.0, 28.0, 49.0, 38.0, 130.0, 203.0, 423.0, 939.0, 2343.0, 6224.0, 18476.0, 65047.0, 287830.0, 494146.0, 124560.0, 31833.0, 9972.0, 3577.0, 1401.0, 613.0, 275.0, 152.0, 68.0, 33.0, 36.0, 24.0, 13.0, 14.0, 6.0, 10.0, 4.0, 7.0, 7.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.4453125, -9.1522216796875, -8.859130859375, -8.5660400390625, -8.27294921875, -7.9798583984375, -7.686767578125, -7.3936767578125, -7.1005859375, -6.8074951171875, -6.514404296875, -6.2213134765625, -5.92822265625, -5.6351318359375, -5.342041015625, -5.0489501953125, -4.755859375, -4.4627685546875, -4.169677734375, -3.8765869140625, -3.58349609375, -3.2904052734375, -2.997314453125, -2.7042236328125, -2.4111328125, -2.1180419921875, -1.824951171875, -1.5318603515625, -1.23876953125, -0.9456787109375, -0.652587890625, -0.3594970703125, -0.06640625, 0.2266845703125, 0.519775390625, 0.8128662109375, 1.10595703125, 1.3990478515625, 1.692138671875, 1.9852294921875, 2.2783203125, 2.5714111328125, 2.864501953125, 3.1575927734375, 3.45068359375, 3.7437744140625, 4.036865234375, 4.3299560546875, 4.623046875, 4.9161376953125, 5.209228515625, 5.5023193359375, 5.79541015625, 6.0885009765625, 6.381591796875, 6.6746826171875, 6.9677734375, 7.2608642578125, 7.553955078125, 7.8470458984375, 8.14013671875, 8.4332275390625, 8.726318359375, 9.0194091796875, 9.3125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 10.0, 4.0, 11.0, 7.0, 16.0, 28.0, 28.0, 25.0, 33.0, 52.0, 62.0, 77.0, 74.0, 75.0, 93.0, 77.0, 78.0, 58.0, 45.0, 40.0, 27.0, 24.0, 13.0, 16.0, 10.0, 9.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50048828125, -0.47760009765625, -0.4547119140625, -0.43182373046875, -0.408935546875, -0.38604736328125, -0.3631591796875, -0.34027099609375, -0.3173828125, -0.29449462890625, -0.2716064453125, -0.24871826171875, -0.225830078125, -0.20294189453125, -0.1800537109375, -0.15716552734375, -0.13427734375, -0.11138916015625, -0.0885009765625, -0.06561279296875, -0.042724609375, -0.01983642578125, 0.0030517578125, 0.02593994140625, 0.048828125, 0.07171630859375, 0.0946044921875, 0.11749267578125, 0.140380859375, 0.16326904296875, 0.1861572265625, 0.20904541015625, 0.23193359375, 0.25482177734375, 0.2777099609375, 0.30059814453125, 0.323486328125, 0.34637451171875, 0.3692626953125, 0.39215087890625, 0.4150390625, 0.43792724609375, 0.4608154296875, 0.48370361328125, 0.506591796875, 0.52947998046875, 0.5523681640625, 0.57525634765625, 0.59814453125, 0.62103271484375, 0.6439208984375, 0.66680908203125, 0.689697265625, 0.71258544921875, 0.7354736328125, 0.75836181640625, 0.78125, 0.80413818359375, 0.8270263671875, 0.84991455078125, 0.872802734375, 0.89569091796875, 0.9185791015625, 0.94146728515625, 0.96435546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 6.0, 7.0, 16.0, 16.0, 16.0, 36.0, 47.0, 64.0, 126.0, 195.0, 388.0, 692.0, 1501.0, 3176.0, 7638.0, 20674.0, 65834.0, 262238.0, 485806.0, 139342.0, 38647.0, 12982.0, 4823.0, 2114.0, 1004.0, 512.0, 275.0, 127.0, 76.0, 52.0, 39.0, 25.0, 15.0, 11.0, 9.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.3203125, -6.135986328125, -5.95166015625, -5.767333984375, -5.5830078125, -5.398681640625, -5.21435546875, -5.030029296875, -4.845703125, -4.661376953125, -4.47705078125, -4.292724609375, -4.1083984375, -3.924072265625, -3.73974609375, -3.555419921875, -3.37109375, -3.186767578125, -3.00244140625, -2.818115234375, -2.6337890625, -2.449462890625, -2.26513671875, -2.080810546875, -1.896484375, -1.712158203125, -1.52783203125, -1.343505859375, -1.1591796875, -0.974853515625, -0.79052734375, -0.606201171875, -0.421875, -0.237548828125, -0.05322265625, 0.131103515625, 0.3154296875, 0.499755859375, 0.68408203125, 0.868408203125, 1.052734375, 1.237060546875, 1.42138671875, 1.605712890625, 1.7900390625, 1.974365234375, 2.15869140625, 2.343017578125, 2.52734375, 2.711669921875, 2.89599609375, 3.080322265625, 3.2646484375, 3.448974609375, 3.63330078125, 3.817626953125, 4.001953125, 4.186279296875, 4.37060546875, 4.554931640625, 4.7392578125, 4.923583984375, 5.10791015625, 5.292236328125, 5.4765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 7.0, 4.0, 8.0, 4.0, 6.0, 4.0, 10.0, 8.0, 7.0, 18.0, 16.0, 19.0, 21.0, 24.0, 22.0, 31.0, 29.0, 29.0, 29.0, 31.0, 39.0, 36.0, 48.0, 42.0, 41.0, 43.0, 36.0, 37.0, 33.0, 39.0, 27.0, 33.0, 27.0, 28.0, 23.0, 19.0, 14.0, 19.0, 14.0, 15.0, 14.0, 11.0, 5.0, 8.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0], "bins": [-2.423828125, -2.35198974609375, -2.2801513671875, -2.20831298828125, -2.136474609375, -2.06463623046875, -1.9927978515625, -1.92095947265625, -1.84912109375, -1.77728271484375, -1.7054443359375, -1.63360595703125, -1.561767578125, -1.48992919921875, -1.4180908203125, -1.34625244140625, -1.2744140625, -1.20257568359375, -1.1307373046875, -1.05889892578125, -0.987060546875, -0.91522216796875, -0.8433837890625, -0.77154541015625, -0.69970703125, -0.62786865234375, -0.5560302734375, -0.48419189453125, -0.412353515625, -0.34051513671875, -0.2686767578125, -0.19683837890625, -0.125, -0.05316162109375, 0.0186767578125, 0.09051513671875, 0.162353515625, 0.23419189453125, 0.3060302734375, 0.37786865234375, 0.44970703125, 0.52154541015625, 0.5933837890625, 0.66522216796875, 0.737060546875, 0.80889892578125, 0.8807373046875, 0.95257568359375, 1.0244140625, 1.09625244140625, 1.1680908203125, 1.23992919921875, 1.311767578125, 1.38360595703125, 1.4554443359375, 1.52728271484375, 1.59912109375, 1.67095947265625, 1.7427978515625, 1.81463623046875, 1.886474609375, 1.95831298828125, 2.0301513671875, 2.10198974609375, 2.173828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 3.0, 6.0, 10.0, 12.0, 13.0, 41.0, 37.0, 45.0, 62.0, 82.0, 141.0, 201.0, 258.0, 458.0, 790.0, 1546.0, 3457.0, 9309.0, 37145.0, 283059.0, 606944.0, 78971.0, 15912.0, 5257.0, 2131.0, 1023.0, 571.0, 402.0, 229.0, 108.0, 97.0, 65.0, 40.0, 38.0, 29.0, 23.0, 10.0, 3.0, 4.0, 3.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.515625, -8.2427978515625, -7.969970703125, -7.6971435546875, -7.42431640625, -7.1514892578125, -6.878662109375, -6.6058349609375, -6.3330078125, -6.0601806640625, -5.787353515625, -5.5145263671875, -5.24169921875, -4.9688720703125, -4.696044921875, -4.4232177734375, -4.150390625, -3.8775634765625, -3.604736328125, -3.3319091796875, -3.05908203125, -2.7862548828125, -2.513427734375, -2.2406005859375, -1.9677734375, -1.6949462890625, -1.422119140625, -1.1492919921875, -0.87646484375, -0.6036376953125, -0.330810546875, -0.0579833984375, 0.21484375, 0.4876708984375, 0.760498046875, 1.0333251953125, 1.30615234375, 1.5789794921875, 1.851806640625, 2.1246337890625, 2.3974609375, 2.6702880859375, 2.943115234375, 3.2159423828125, 3.48876953125, 3.7615966796875, 4.034423828125, 4.3072509765625, 4.580078125, 4.8529052734375, 5.125732421875, 5.3985595703125, 5.67138671875, 5.9442138671875, 6.217041015625, 6.4898681640625, 6.7626953125, 7.0355224609375, 7.308349609375, 7.5811767578125, 7.85400390625, 8.1268310546875, 8.399658203125, 8.6724853515625, 8.9453125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 8.0, 10.0, 22.0, 56.0, 185.0, 342.0, 234.0, 77.0, 37.0, 14.0, 12.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0019779205322265625, -0.0019325986504554749, -0.0018872767686843872, -0.0018419548869132996, -0.001796633005142212, -0.0017513111233711243, -0.0017059892416000366, -0.001660667359828949, -0.0016153454780578613, -0.0015700235962867737, -0.001524701714515686, -0.0014793798327445984, -0.0014340579509735107, -0.001388736069202423, -0.0013434141874313354, -0.0012980923056602478, -0.0012527704238891602, -0.0012074485421180725, -0.0011621266603469849, -0.0011168047785758972, -0.0010714828968048096, -0.001026161015033722, -0.0009808391332626343, -0.0009355172514915466, -0.000890195369720459, -0.0008448734879493713, -0.0007995516061782837, -0.000754229724407196, -0.0007089078426361084, -0.0006635859608650208, -0.0006182640790939331, -0.0005729421973228455, -0.0005276203155517578, -0.00048229843378067017, -0.0004369765520095825, -0.0003916546702384949, -0.0003463327884674072, -0.0003010109066963196, -0.00025568902492523193, -0.0002103671431541443, -0.00016504526138305664, -0.000119723379611969, -7.440149784088135e-05, -2.90796160697937e-05, 1.6242265701293945e-05, 6.156414747238159e-05, 0.00010688602924346924, 0.00015220791101455688, 0.00019752979278564453, 0.00024285167455673218, 0.0002881735563278198, 0.00033349543809890747, 0.0003788173198699951, 0.00042413920164108276, 0.0004694610834121704, 0.0005147829651832581, 0.0005601048469543457, 0.0006054267287254333, 0.000650748610496521, 0.0006960704922676086, 0.0007413923740386963, 0.0007867142558097839, 0.0008320361375808716, 0.0008773580193519592, 0.0009226799011230469]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 6.0, 17.0, 21.0, 51.0, 110.0, 191.0, 460.0, 1321.0, 4698.0, 28655.0, 625975.0, 363208.0, 18576.0, 3441.0, 1082.0, 376.0, 160.0, 99.0, 48.0, 27.0, 9.0, 9.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5234375, -15.0369873046875, -14.550537109375, -14.0640869140625, -13.57763671875, -13.0911865234375, -12.604736328125, -12.1182861328125, -11.6318359375, -11.1453857421875, -10.658935546875, -10.1724853515625, -9.68603515625, -9.1995849609375, -8.713134765625, -8.2266845703125, -7.740234375, -7.2537841796875, -6.767333984375, -6.2808837890625, -5.79443359375, -5.3079833984375, -4.821533203125, -4.3350830078125, -3.8486328125, -3.3621826171875, -2.875732421875, -2.3892822265625, -1.90283203125, -1.4163818359375, -0.929931640625, -0.4434814453125, 0.04296875, 0.5294189453125, 1.015869140625, 1.5023193359375, 1.98876953125, 2.4752197265625, 2.961669921875, 3.4481201171875, 3.9345703125, 4.4210205078125, 4.907470703125, 5.3939208984375, 5.88037109375, 6.3668212890625, 6.853271484375, 7.3397216796875, 7.826171875, 8.3126220703125, 8.799072265625, 9.2855224609375, 9.77197265625, 10.2584228515625, 10.744873046875, 11.2313232421875, 11.7177734375, 12.2042236328125, 12.690673828125, 13.1771240234375, 13.66357421875, 14.1500244140625, 14.636474609375, 15.1229248046875, 15.609375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 3.0, 8.0, 9.0, 16.0, 15.0, 11.0, 35.0, 39.0, 57.0, 75.0, 107.0, 129.0, 131.0, 99.0, 87.0, 50.0, 42.0, 26.0, 15.0, 10.0, 10.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1796875, -4.040283203125, -3.90087890625, -3.761474609375, -3.6220703125, -3.482666015625, -3.34326171875, -3.203857421875, -3.064453125, -2.925048828125, -2.78564453125, -2.646240234375, -2.5068359375, -2.367431640625, -2.22802734375, -2.088623046875, -1.94921875, -1.809814453125, -1.67041015625, -1.531005859375, -1.3916015625, -1.252197265625, -1.11279296875, -0.973388671875, -0.833984375, -0.694580078125, -0.55517578125, -0.415771484375, -0.2763671875, -0.136962890625, 0.00244140625, 0.141845703125, 0.28125, 0.420654296875, 0.56005859375, 0.699462890625, 0.8388671875, 0.978271484375, 1.11767578125, 1.257080078125, 1.396484375, 1.535888671875, 1.67529296875, 1.814697265625, 1.9541015625, 2.093505859375, 2.23291015625, 2.372314453125, 2.51171875, 2.651123046875, 2.79052734375, 2.929931640625, 3.0693359375, 3.208740234375, 3.34814453125, 3.487548828125, 3.626953125, 3.766357421875, 3.90576171875, 4.045166015625, 4.1845703125, 4.323974609375, 4.46337890625, 4.602783203125, 4.7421875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 7.0, 14.0, 39.0, 72.0, 154.0, 234.0, 237.0, 121.0, 63.0, 24.0, 11.0, 8.0, 8.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.095191955566406, -58.200523376464844, -56.305850982666016, -54.41118240356445, -52.516510009765625, -50.62184143066406, -48.7271728515625, -46.83250045776367, -44.93783187866211, -43.04316329956055, -41.14849090576172, -39.253822326660156, -37.35914993286133, -35.464481353759766, -33.56980895996094, -31.675140380859375, -29.78046989440918, -27.885799407958984, -25.99112892150879, -24.096458435058594, -22.20178985595703, -20.307119369506836, -18.41244888305664, -16.517780303955078, -14.623108863830566, -12.728438377380371, -10.833768844604492, -8.939098358154297, -7.04442834854126, -5.149758338928223, -3.2550878524780273, -1.3604183197021484, 0.5342521667480469, 2.428922176361084, 4.323592185974121, 6.218262672424316, 8.112932205200195, 10.00760269165039, 11.902273178100586, 13.796942710876465, 15.69161319732666, 17.58628273010254, 19.480953216552734, 21.37562370300293, 23.270294189453125, 25.164962768554688, 27.059635162353516, 28.954303741455078, 30.848974227905273, 32.74364471435547, 34.63831329345703, 36.53298568725586, 38.42765426635742, 40.32232666015625, 42.21699523925781, 44.111663818359375, 46.0063362121582, 47.901004791259766, 49.795677185058594, 51.690345764160156, 53.585018157958984, 55.47968673706055, 57.374359130859375, 59.26902770996094, 61.1636962890625]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 9.0, 9.0, 9.0, 17.0, 29.0, 37.0, 56.0, 93.0, 114.0, 128.0, 124.0, 102.0, 85.0, 72.0, 39.0, 26.0, 13.0, 16.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.74987030029297, -65.2035903930664, -63.657310485839844, -62.11103057861328, -60.56474685668945, -59.01846694946289, -57.47218704223633, -55.925907135009766, -54.37962341308594, -52.833343505859375, -51.28706359863281, -49.74078369140625, -48.19449996948242, -46.64822006225586, -45.1019401550293, -43.555660247802734, -42.00938034057617, -40.46310043334961, -38.91682052612305, -37.37053680419922, -35.824256896972656, -34.277976989746094, -32.73169708251953, -31.18541717529297, -29.639135360717773, -28.09285545349121, -26.546573638916016, -25.000293731689453, -23.45401382446289, -21.907732009887695, -20.361452102661133, -18.815170288085938, -17.26888656616211, -15.72260570526123, -14.176324844360352, -12.630044937133789, -11.08376407623291, -9.537483215332031, -7.991203308105469, -6.44492244720459, -4.898641586303711, -3.352360963821411, -1.8060803413391113, -0.2597999572753906, 1.2864809036254883, 2.832761764526367, 4.37904167175293, 5.925322532653809, 7.4716033935546875, 9.017884254455566, 10.564165115356445, 12.110445022583008, 13.656725883483887, 15.203006744384766, 16.749286651611328, 18.29556655883789, 19.841848373413086, 21.38812828063965, 22.934410095214844, 24.480690002441406, 26.02696990966797, 27.573251724243164, 29.119531631469727, 30.665813446044922, 32.212093353271484]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 10.0, 11.0, 17.0, 13.0, 23.0, 18.0, 18.0, 24.0, 45.0, 43.0, 66.0, 119.0, 157.0, 318.0, 570.0, 1188.0, 2494.0, 5887.0, 15898.0, 55828.0, 472342.0, 3502374.0, 98632.0, 23247.0, 8085.0, 3339.0, 1662.0, 799.0, 384.0, 268.0, 140.0, 92.0, 58.0, 31.0, 33.0, 12.0, 6.0, 8.0, 5.0, 1.0, 3.0, 2.0], "bins": [-25.640625, -25.0467529296875, -24.452880859375, -23.8590087890625, -23.26513671875, -22.6712646484375, -22.077392578125, -21.4835205078125, -20.8896484375, -20.2957763671875, -19.701904296875, -19.1080322265625, -18.51416015625, -17.9202880859375, -17.326416015625, -16.7325439453125, -16.138671875, -15.5447998046875, -14.950927734375, -14.3570556640625, -13.76318359375, -13.1693115234375, -12.575439453125, -11.9815673828125, -11.3876953125, -10.7938232421875, -10.199951171875, -9.6060791015625, -9.01220703125, -8.4183349609375, -7.824462890625, -7.2305908203125, -6.63671875, -6.0428466796875, -5.448974609375, -4.8551025390625, -4.26123046875, -3.6673583984375, -3.073486328125, -2.4796142578125, -1.8857421875, -1.2918701171875, -0.697998046875, -0.1041259765625, 0.48974609375, 1.0836181640625, 1.677490234375, 2.2713623046875, 2.865234375, 3.4591064453125, 4.052978515625, 4.6468505859375, 5.24072265625, 5.8345947265625, 6.428466796875, 7.0223388671875, 7.6162109375, 8.2100830078125, 8.803955078125, 9.3978271484375, 9.99169921875, 10.5855712890625, 11.179443359375, 11.7733154296875, 12.3671875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 2.0, 5.0, 15.0, 23.0, 26.0, 36.0, 51.0, 53.0, 68.0, 83.0, 105.0, 96.0, 104.0, 79.0, 67.0, 58.0, 41.0, 25.0, 20.0, 18.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.11328125, -1.0841827392578125, -1.055084228515625, -1.0259857177734375, -0.99688720703125, -0.9677886962890625, -0.938690185546875, -0.9095916748046875, -0.8804931640625, -0.8513946533203125, -0.822296142578125, -0.7931976318359375, -0.76409912109375, -0.7350006103515625, -0.705902099609375, -0.6768035888671875, -0.647705078125, -0.6186065673828125, -0.589508056640625, -0.5604095458984375, -0.53131103515625, -0.5022125244140625, -0.473114013671875, -0.4440155029296875, -0.4149169921875, -0.3858184814453125, -0.356719970703125, -0.3276214599609375, -0.29852294921875, -0.2694244384765625, -0.240325927734375, -0.2112274169921875, -0.18212890625, -0.1530303955078125, -0.123931884765625, -0.0948333740234375, -0.06573486328125, -0.0366363525390625, -0.007537841796875, 0.0215606689453125, 0.0506591796875, 0.0797576904296875, 0.108856201171875, 0.1379547119140625, 0.16705322265625, 0.1961517333984375, 0.225250244140625, 0.2543487548828125, 0.283447265625, 0.3125457763671875, 0.341644287109375, 0.3707427978515625, 0.39984130859375, 0.4289398193359375, 0.458038330078125, 0.4871368408203125, 0.5162353515625, 0.5453338623046875, 0.574432373046875, 0.6035308837890625, 0.63262939453125, 0.6617279052734375, 0.690826416015625, 0.7199249267578125, 0.7490234375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 5.0, 8.0, 9.0, 7.0, 12.0, 18.0, 16.0, 19.0, 28.0, 50.0, 103.0, 107.0, 235.0, 495.0, 1201.0, 3448.0, 13301.0, 71063.0, 875539.0, 3093012.0, 109327.0, 18882.0, 4655.0, 1465.0, 562.0, 265.0, 161.0, 99.0, 58.0, 38.0, 28.0, 21.0, 15.0, 8.0, 9.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.015625, -17.396728515625, -16.77783203125, -16.158935546875, -15.5400390625, -14.921142578125, -14.30224609375, -13.683349609375, -13.064453125, -12.445556640625, -11.82666015625, -11.207763671875, -10.5888671875, -9.969970703125, -9.35107421875, -8.732177734375, -8.11328125, -7.494384765625, -6.87548828125, -6.256591796875, -5.6376953125, -5.018798828125, -4.39990234375, -3.781005859375, -3.162109375, -2.543212890625, -1.92431640625, -1.305419921875, -0.6865234375, -0.067626953125, 0.55126953125, 1.170166015625, 1.7890625, 2.407958984375, 3.02685546875, 3.645751953125, 4.2646484375, 4.883544921875, 5.50244140625, 6.121337890625, 6.740234375, 7.359130859375, 7.97802734375, 8.596923828125, 9.2158203125, 9.834716796875, 10.45361328125, 11.072509765625, 11.69140625, 12.310302734375, 12.92919921875, 13.548095703125, 14.1669921875, 14.785888671875, 15.40478515625, 16.023681640625, 16.642578125, 17.261474609375, 17.88037109375, 18.499267578125, 19.1181640625, 19.737060546875, 20.35595703125, 20.974853515625, 21.59375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 11.0, 13.0, 10.0, 22.0, 26.0, 35.0, 40.0, 50.0, 71.0, 87.0, 136.0, 210.0, 372.0, 1331.0, 693.0, 300.0, 184.0, 103.0, 65.0, 70.0, 41.0, 37.0, 35.0, 31.0, 13.0, 21.0, 14.0, 12.0, 5.0, 6.0, 3.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.482421875, -1.4291839599609375, -1.375946044921875, -1.3227081298828125, -1.26947021484375, -1.2162322998046875, -1.162994384765625, -1.1097564697265625, -1.0565185546875, -1.0032806396484375, -0.950042724609375, -0.8968048095703125, -0.84356689453125, -0.7903289794921875, -0.737091064453125, -0.6838531494140625, -0.630615234375, -0.5773773193359375, -0.524139404296875, -0.4709014892578125, -0.41766357421875, -0.3644256591796875, -0.311187744140625, -0.2579498291015625, -0.2047119140625, -0.1514739990234375, -0.098236083984375, -0.0449981689453125, 0.00823974609375, 0.0614776611328125, 0.114715576171875, 0.1679534912109375, 0.22119140625, 0.2744293212890625, 0.327667236328125, 0.3809051513671875, 0.43414306640625, 0.4873809814453125, 0.540618896484375, 0.5938568115234375, 0.6470947265625, 0.7003326416015625, 0.753570556640625, 0.8068084716796875, 0.86004638671875, 0.9132843017578125, 0.966522216796875, 1.0197601318359375, 1.072998046875, 1.1262359619140625, 1.179473876953125, 1.2327117919921875, 1.28594970703125, 1.3391876220703125, 1.392425537109375, 1.4456634521484375, 1.4989013671875, 1.5521392822265625, 1.605377197265625, 1.6586151123046875, 1.71185302734375, 1.7650909423828125, 1.818328857421875, 1.8715667724609375, 1.9248046875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 11.0, 20.0, 22.0, 35.0, 39.0, 72.0, 81.0, 106.0, 113.0, 126.0, 115.0, 65.0, 68.0, 29.0, 23.0, 21.0, 12.0, 14.0, 9.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.629003524780273, -13.258279800415039, -12.887555122375488, -12.516831398010254, -12.14610767364502, -11.775382995605469, -11.404659271240234, -11.033935546875, -10.663211822509766, -10.292488098144531, -9.92176342010498, -9.551039695739746, -9.180315971374512, -8.809591293334961, -8.438867568969727, -8.068143844604492, -7.697419166564941, -7.326694965362549, -6.9559712409973145, -6.585247039794922, -6.2145233154296875, -5.843799114227295, -5.473074913024902, -5.102351188659668, -4.731626987457275, -4.360902786254883, -3.9901790618896484, -3.619454860687256, -3.2487308979034424, -2.878006935119629, -2.5072827339172363, -2.136558771133423, -1.7658357620239258, -1.3951117992401123, -1.0243877172470093, -0.6536636352539062, -0.2829396724700928, 0.0877842903137207, 0.4585084915161133, 0.8292324542999268, 1.1999564170837402, 1.5706803798675537, 1.9414044618606567, 2.3121285438537598, 2.6828525066375732, 3.0535764694213867, 3.4243006706237793, 3.7950246334075928, 4.165748596191406, 4.536472797393799, 4.907196521759033, 5.277920722961426, 5.64864444732666, 6.019368648529053, 6.390092849731445, 6.76081657409668, 7.131540775299072, 7.502264976501465, 7.872988700866699, 8.24371337890625, 8.614437103271484, 8.985160827636719, 9.355884552001953, 9.726609230041504, 10.097332954406738]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 8.0, 13.0, 11.0, 20.0, 26.0, 37.0, 40.0, 54.0, 62.0, 78.0, 94.0, 107.0, 97.0, 74.0, 64.0, 62.0, 57.0, 28.0, 28.0, 21.0, 4.0, 11.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.148794174194336, -7.771350860595703, -7.3939080238342285, -7.016464710235596, -6.639021873474121, -6.261578559875488, -5.8841352462768555, -5.506691932678223, -5.129249095916748, -4.751805782318115, -4.374362945556641, -3.996919631958008, -3.619476556777954, -3.2420334815979004, -2.8645901679992676, -2.487147092819214, -2.10970401763916, -1.7322609424591064, -1.3548177480697632, -0.9773745536804199, -0.5999314785003662, -0.2224884033203125, 0.1549549102783203, 0.532397985458374, 0.9098410606384277, 1.2872841358184814, 1.6647273302078247, 2.042170524597168, 2.4196135997772217, 2.7970566749572754, 3.174499988555908, 3.551943063735962, 3.9293861389160156, 4.306829452514648, 4.684272289276123, 5.061715602874756, 5.4391584396362305, 5.816601753234863, 6.194045066833496, 6.571488380432129, 6.9489312171936035, 7.326374530792236, 7.703817367553711, 8.081260681152344, 8.458703994750977, 8.83614730834961, 9.213590621948242, 9.591032981872559, 9.968476295471191, 10.345919609069824, 10.723362922668457, 11.100805282592773, 11.478248596191406, 11.855691909790039, 12.233135223388672, 12.610578536987305, 12.988021850585938, 13.36546516418457, 13.742908477783203, 14.120351791381836, 14.497794151306152, 14.875237464904785, 15.252680778503418, 15.63012409210205, 16.007566452026367]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 10.0, 11.0, 26.0, 28.0, 45.0, 63.0, 107.0, 138.0, 210.0, 473.0, 756.0, 1245.0, 2383.0, 4601.0, 9067.0, 19114.0, 42414.0, 98154.0, 214601.0, 305201.0, 191964.0, 86757.0, 37034.0, 16891.0, 8033.0, 4099.0, 2248.0, 1205.0, 647.0, 385.0, 234.0, 131.0, 81.0, 61.0, 34.0, 28.0, 20.0, 7.0, 12.0, 8.0, 5.0, 3.0, 2.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.85546875, -4.6904296875, -4.525390625, -4.3603515625, -4.1953125, -4.0302734375, -3.865234375, -3.7001953125, -3.53515625, -3.3701171875, -3.205078125, -3.0400390625, -2.875, -2.7099609375, -2.544921875, -2.3798828125, -2.21484375, -2.0498046875, -1.884765625, -1.7197265625, -1.5546875, -1.3896484375, -1.224609375, -1.0595703125, -0.89453125, -0.7294921875, -0.564453125, -0.3994140625, -0.234375, -0.0693359375, 0.095703125, 0.2607421875, 0.42578125, 0.5908203125, 0.755859375, 0.9208984375, 1.0859375, 1.2509765625, 1.416015625, 1.5810546875, 1.74609375, 1.9111328125, 2.076171875, 2.2412109375, 2.40625, 2.5712890625, 2.736328125, 2.9013671875, 3.06640625, 3.2314453125, 3.396484375, 3.5615234375, 3.7265625, 3.8916015625, 4.056640625, 4.2216796875, 4.38671875, 4.5517578125, 4.716796875, 4.8818359375, 5.046875, 5.2119140625, 5.376953125, 5.5419921875, 5.70703125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 8.0, 8.0, 8.0, 8.0, 5.0, 10.0, 14.0, 20.0, 15.0, 16.0, 38.0, 25.0, 41.0, 32.0, 50.0, 61.0, 41.0, 53.0, 52.0, 53.0, 53.0, 50.0, 44.0, 50.0, 31.0, 33.0, 29.0, 22.0, 25.0, 25.0, 13.0, 15.0, 10.0, 7.0, 7.0, 4.0, 3.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44091796875, -0.42612457275390625, -0.4113311767578125, -0.39653778076171875, -0.381744384765625, -0.36695098876953125, -0.3521575927734375, -0.33736419677734375, -0.32257080078125, -0.30777740478515625, -0.2929840087890625, -0.27819061279296875, -0.263397216796875, -0.24860382080078125, -0.2338104248046875, -0.21901702880859375, -0.2042236328125, -0.18943023681640625, -0.1746368408203125, -0.15984344482421875, -0.145050048828125, -0.13025665283203125, -0.1154632568359375, -0.10066986083984375, -0.08587646484375, -0.07108306884765625, -0.0562896728515625, -0.04149627685546875, -0.026702880859375, -0.01190948486328125, 0.0028839111328125, 0.01767730712890625, 0.032470703125, 0.04726409912109375, 0.0620574951171875, 0.07685089111328125, 0.091644287109375, 0.10643768310546875, 0.1212310791015625, 0.13602447509765625, 0.15081787109375, 0.16561126708984375, 0.1804046630859375, 0.19519805908203125, 0.209991455078125, 0.22478485107421875, 0.2395782470703125, 0.25437164306640625, 0.2691650390625, 0.28395843505859375, 0.2987518310546875, 0.31354522705078125, 0.328338623046875, 0.34313201904296875, 0.3579254150390625, 0.37271881103515625, 0.38751220703125, 0.40230560302734375, 0.4170989990234375, 0.43189239501953125, 0.446685791015625, 0.46147918701171875, 0.4762725830078125, 0.49106597900390625, 0.505859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 7.0, 4.0, 10.0, 14.0, 19.0, 21.0, 12.0, 35.0, 48.0, 78.0, 87.0, 161.0, 285.0, 400.0, 684.0, 1569.0, 4677.0, 20253.0, 123772.0, 531548.0, 302360.0, 48402.0, 9136.0, 2522.0, 1054.0, 512.0, 289.0, 175.0, 128.0, 100.0, 51.0, 37.0, 32.0, 24.0, 14.0, 10.0, 9.0, 2.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-10.390625, -10.0633544921875, -9.736083984375, -9.4088134765625, -9.08154296875, -8.7542724609375, -8.427001953125, -8.0997314453125, -7.7724609375, -7.4451904296875, -7.117919921875, -6.7906494140625, -6.46337890625, -6.1361083984375, -5.808837890625, -5.4815673828125, -5.154296875, -4.8270263671875, -4.499755859375, -4.1724853515625, -3.84521484375, -3.5179443359375, -3.190673828125, -2.8634033203125, -2.5361328125, -2.2088623046875, -1.881591796875, -1.5543212890625, -1.22705078125, -0.8997802734375, -0.572509765625, -0.2452392578125, 0.08203125, 0.4093017578125, 0.736572265625, 1.0638427734375, 1.39111328125, 1.7183837890625, 2.045654296875, 2.3729248046875, 2.7001953125, 3.0274658203125, 3.354736328125, 3.6820068359375, 4.00927734375, 4.3365478515625, 4.663818359375, 4.9910888671875, 5.318359375, 5.6456298828125, 5.972900390625, 6.3001708984375, 6.62744140625, 6.9547119140625, 7.281982421875, 7.6092529296875, 7.9365234375, 8.2637939453125, 8.591064453125, 8.9183349609375, 9.24560546875, 9.5728759765625, 9.900146484375, 10.2274169921875, 10.5546875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 6.0, 9.0, 8.0, 6.0, 12.0, 14.0, 11.0, 15.0, 22.0, 17.0, 22.0, 26.0, 20.0, 40.0, 23.0, 32.0, 30.0, 37.0, 42.0, 35.0, 60.0, 49.0, 52.0, 47.0, 43.0, 43.0, 34.0, 32.0, 33.0, 28.0, 15.0, 25.0, 16.0, 20.0, 19.0, 10.0, 9.0, 5.0, 9.0, 9.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.482421875, -2.39593505859375, -2.3094482421875, -2.22296142578125, -2.136474609375, -2.04998779296875, -1.9635009765625, -1.87701416015625, -1.79052734375, -1.70404052734375, -1.6175537109375, -1.53106689453125, -1.444580078125, -1.35809326171875, -1.2716064453125, -1.18511962890625, -1.0986328125, -1.01214599609375, -0.9256591796875, -0.83917236328125, -0.752685546875, -0.66619873046875, -0.5797119140625, -0.49322509765625, -0.40673828125, -0.32025146484375, -0.2337646484375, -0.14727783203125, -0.060791015625, 0.02569580078125, 0.1121826171875, 0.19866943359375, 0.28515625, 0.37164306640625, 0.4581298828125, 0.54461669921875, 0.631103515625, 0.71759033203125, 0.8040771484375, 0.89056396484375, 0.97705078125, 1.06353759765625, 1.1500244140625, 1.23651123046875, 1.322998046875, 1.40948486328125, 1.4959716796875, 1.58245849609375, 1.6689453125, 1.75543212890625, 1.8419189453125, 1.92840576171875, 2.014892578125, 2.10137939453125, 2.1878662109375, 2.27435302734375, 2.36083984375, 2.44732666015625, 2.5338134765625, 2.62030029296875, 2.706787109375, 2.79327392578125, 2.8797607421875, 2.96624755859375, 3.052734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 8.0, 8.0, 11.0, 17.0, 23.0, 29.0, 34.0, 51.0, 89.0, 152.0, 246.0, 462.0, 834.0, 1577.0, 3145.0, 7091.0, 16332.0, 43095.0, 131616.0, 366315.0, 313236.0, 103785.0, 34976.0, 13719.0, 5848.0, 2753.0, 1348.0, 714.0, 392.0, 225.0, 130.0, 95.0, 61.0, 50.0, 28.0, 19.0, 11.0, 10.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.4921875, -6.3006591796875, -6.109130859375, -5.9176025390625, -5.72607421875, -5.5345458984375, -5.343017578125, -5.1514892578125, -4.9599609375, -4.7684326171875, -4.576904296875, -4.3853759765625, -4.19384765625, -4.0023193359375, -3.810791015625, -3.6192626953125, -3.427734375, -3.2362060546875, -3.044677734375, -2.8531494140625, -2.66162109375, -2.4700927734375, -2.278564453125, -2.0870361328125, -1.8955078125, -1.7039794921875, -1.512451171875, -1.3209228515625, -1.12939453125, -0.9378662109375, -0.746337890625, -0.5548095703125, -0.36328125, -0.1717529296875, 0.019775390625, 0.2113037109375, 0.40283203125, 0.5943603515625, 0.785888671875, 0.9774169921875, 1.1689453125, 1.3604736328125, 1.552001953125, 1.7435302734375, 1.93505859375, 2.1265869140625, 2.318115234375, 2.5096435546875, 2.701171875, 2.8927001953125, 3.084228515625, 3.2757568359375, 3.46728515625, 3.6588134765625, 3.850341796875, 4.0418701171875, 4.2333984375, 4.4249267578125, 4.616455078125, 4.8079833984375, 4.99951171875, 5.1910400390625, 5.382568359375, 5.5740966796875, 5.765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 6.0, 10.0, 15.0, 21.0, 32.0, 39.0, 48.0, 64.0, 94.0, 121.0, 117.0, 98.0, 79.0, 56.0, 53.0, 24.0, 35.0, 13.0, 12.0, 10.0, 9.0, 11.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00092315673828125, -0.0008969902992248535, -0.000870823860168457, -0.0008446574211120605, -0.0008184909820556641, -0.0007923245429992676, -0.0007661581039428711, -0.0007399916648864746, -0.0007138252258300781, -0.0006876587867736816, -0.0006614923477172852, -0.0006353259086608887, -0.0006091594696044922, -0.0005829930305480957, -0.0005568265914916992, -0.0005306601524353027, -0.0005044937133789062, -0.00047832727432250977, -0.0004521608352661133, -0.0004259943962097168, -0.0003998279571533203, -0.00037366151809692383, -0.00034749507904052734, -0.00032132863998413086, -0.0002951622009277344, -0.0002689957618713379, -0.0002428293228149414, -0.00021666288375854492, -0.00019049644470214844, -0.00016433000564575195, -0.00013816356658935547, -0.00011199712753295898, -8.58306884765625e-05, -5.9664249420166016e-05, -3.349781036376953e-05, -7.331371307373047e-06, 1.8835067749023438e-05, 4.500150680541992e-05, 7.11679458618164e-05, 9.733438491821289e-05, 0.00012350082397460938, 0.00014966726303100586, 0.00017583370208740234, 0.00020200014114379883, 0.0002281665802001953, 0.0002543330192565918, 0.0002804994583129883, 0.00030666589736938477, 0.00033283233642578125, 0.00035899877548217773, 0.0003851652145385742, 0.0004113316535949707, 0.0004374980926513672, 0.00046366453170776367, 0.0004898309707641602, 0.0005159974098205566, 0.0005421638488769531, 0.0005683302879333496, 0.0005944967269897461, 0.0006206631660461426, 0.0006468296051025391, 0.0006729960441589355, 0.000699162483215332, 0.0007253289222717285, 0.000751495361328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 5.0, 7.0, 10.0, 7.0, 23.0, 38.0, 46.0, 65.0, 96.0, 247.0, 492.0, 1276.0, 4828.0, 29458.0, 369102.0, 585773.0, 47513.0, 6703.0, 1637.0, 623.0, 249.0, 131.0, 68.0, 49.0, 38.0, 22.0, 14.0, 8.0, 2.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.015625, -14.575439453125, -14.13525390625, -13.695068359375, -13.2548828125, -12.814697265625, -12.37451171875, -11.934326171875, -11.494140625, -11.053955078125, -10.61376953125, -10.173583984375, -9.7333984375, -9.293212890625, -8.85302734375, -8.412841796875, -7.97265625, -7.532470703125, -7.09228515625, -6.652099609375, -6.2119140625, -5.771728515625, -5.33154296875, -4.891357421875, -4.451171875, -4.010986328125, -3.57080078125, -3.130615234375, -2.6904296875, -2.250244140625, -1.81005859375, -1.369873046875, -0.9296875, -0.489501953125, -0.04931640625, 0.390869140625, 0.8310546875, 1.271240234375, 1.71142578125, 2.151611328125, 2.591796875, 3.031982421875, 3.47216796875, 3.912353515625, 4.3525390625, 4.792724609375, 5.23291015625, 5.673095703125, 6.11328125, 6.553466796875, 6.99365234375, 7.433837890625, 7.8740234375, 8.314208984375, 8.75439453125, 9.194580078125, 9.634765625, 10.074951171875, 10.51513671875, 10.955322265625, 11.3955078125, 11.835693359375, 12.27587890625, 12.716064453125, 13.15625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 8.0, 5.0, 7.0, 7.0, 7.0, 8.0, 13.0, 14.0, 12.0, 13.0, 29.0, 24.0, 31.0, 44.0, 34.0, 55.0, 65.0, 74.0, 85.0, 52.0, 63.0, 52.0, 47.0, 37.0, 40.0, 33.0, 21.0, 20.0, 20.0, 14.0, 11.0, 11.0, 14.0, 7.0, 12.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.716796875, -2.628936767578125, -2.54107666015625, -2.453216552734375, -2.3653564453125, -2.277496337890625, -2.18963623046875, -2.101776123046875, -2.013916015625, -1.926055908203125, -1.83819580078125, -1.750335693359375, -1.6624755859375, -1.574615478515625, -1.48675537109375, -1.398895263671875, -1.31103515625, -1.223175048828125, -1.13531494140625, -1.047454833984375, -0.9595947265625, -0.871734619140625, -0.78387451171875, -0.696014404296875, -0.608154296875, -0.520294189453125, -0.43243408203125, -0.344573974609375, -0.2567138671875, -0.168853759765625, -0.08099365234375, 0.006866455078125, 0.0947265625, 0.182586669921875, 0.27044677734375, 0.358306884765625, 0.4461669921875, 0.534027099609375, 0.62188720703125, 0.709747314453125, 0.797607421875, 0.885467529296875, 0.97332763671875, 1.061187744140625, 1.1490478515625, 1.236907958984375, 1.32476806640625, 1.412628173828125, 1.50048828125, 1.588348388671875, 1.67620849609375, 1.764068603515625, 1.8519287109375, 1.939788818359375, 2.02764892578125, 2.115509033203125, 2.203369140625, 2.291229248046875, 2.37908935546875, 2.466949462890625, 2.5548095703125, 2.642669677734375, 2.73052978515625, 2.818389892578125, 2.90625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 20.0, 52.0, 165.0, 314.0, 269.0, 112.0, 42.0, 15.0, 8.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.85728454589844, -80.73849487304688, -77.61971282958984, -74.50092315673828, -71.38214111328125, -68.26335144042969, -65.14456939697266, -62.025779724121094, -58.90699768066406, -55.788211822509766, -52.66942596435547, -49.55064010620117, -46.431854248046875, -43.31306838989258, -40.19428253173828, -37.07549285888672, -33.95670700073242, -30.837921142578125, -27.719135284423828, -24.60034942626953, -21.481563568115234, -18.362777709960938, -15.243989944458008, -12.125204086303711, -9.006418228149414, -5.887632369995117, -2.768846035003662, 0.34994029998779297, 3.46872615814209, 6.587512016296387, 9.706298828125, 12.825084686279297, 15.943870544433594, 19.06265640258789, 22.181442260742188, 25.300228118896484, 28.41901397705078, 31.537799835205078, 34.656585693359375, 37.77537536621094, 40.89415740966797, 44.012943267822266, 47.13172912597656, 50.25051498413086, 53.369300842285156, 56.48808670043945, 59.60687255859375, 62.72566223144531, 65.84445190429688, 68.96324157714844, 72.08202362060547, 75.20081329345703, 78.31959533691406, 81.43838500976562, 84.55716705322266, 87.67595672607422, 90.79473876953125, 93.91352844238281, 97.03231048583984, 100.1511001586914, 103.26988220214844, 106.388671875, 109.50745391845703, 112.6262435913086, 115.74502563476562]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 9.0, 16.0, 4.0, 19.0, 24.0, 18.0, 28.0, 38.0, 38.0, 47.0, 39.0, 49.0, 57.0, 65.0, 48.0, 57.0, 55.0, 50.0, 50.0, 48.0, 43.0, 40.0, 34.0, 33.0, 16.0, 15.0, 14.0, 8.0, 9.0, 8.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-30.261804580688477, -29.429311752319336, -28.596818923950195, -27.764326095581055, -26.931833267211914, -26.09933853149414, -25.266845703125, -24.43435287475586, -23.60186004638672, -22.769367218017578, -21.936874389648438, -21.104381561279297, -20.271888732910156, -19.439395904541016, -18.606903076171875, -17.7744083404541, -16.941917419433594, -16.109424591064453, -15.276931762695312, -14.444438934326172, -13.611945152282715, -12.779452323913574, -11.946959495544434, -11.114465713500977, -10.281972885131836, -9.449480056762695, -8.616987228393555, -7.784493923187256, -6.952000617980957, -6.119507789611816, -5.287014961242676, -4.454521656036377, -3.622028350830078, -2.7895352840423584, -1.9570423364639282, -1.124549388885498, -0.2920563220977783, 0.5404367446899414, 1.372929573059082, 2.205422878265381, 3.0379157066345215, 3.870408773422241, 4.702901840209961, 5.535394668579102, 6.367887496948242, 7.200380802154541, 8.032873153686523, 8.86536693572998, 9.697859764099121, 10.530352592468262, 11.362845420837402, 12.19533920288086, 13.02783203125, 13.86032485961914, 14.692817687988281, 15.525310516357422, 16.357803344726562, 17.190296173095703, 18.022789001464844, 18.855281829833984, 19.687774658203125, 20.520267486572266, 21.352760314941406, 22.18525505065918, 23.01774787902832]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 4.0, 6.0, 12.0, 10.0, 13.0, 15.0, 29.0, 29.0, 55.0, 84.0, 177.0, 474.0, 1673.0, 9361.0, 83854.0, 3887680.0, 191318.0, 15855.0, 2554.0, 596.0, 191.0, 88.0, 52.0, 39.0, 28.0, 21.0, 14.0, 10.0, 6.0, 6.0, 11.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.75, -23.9677734375, -23.185546875, -22.4033203125, -21.62109375, -20.8388671875, -20.056640625, -19.2744140625, -18.4921875, -17.7099609375, -16.927734375, -16.1455078125, -15.36328125, -14.5810546875, -13.798828125, -13.0166015625, -12.234375, -11.4521484375, -10.669921875, -9.8876953125, -9.10546875, -8.3232421875, -7.541015625, -6.7587890625, -5.9765625, -5.1943359375, -4.412109375, -3.6298828125, -2.84765625, -2.0654296875, -1.283203125, -0.5009765625, 0.28125, 1.0634765625, 1.845703125, 2.6279296875, 3.41015625, 4.1923828125, 4.974609375, 5.7568359375, 6.5390625, 7.3212890625, 8.103515625, 8.8857421875, 9.66796875, 10.4501953125, 11.232421875, 12.0146484375, 12.796875, 13.5791015625, 14.361328125, 15.1435546875, 15.92578125, 16.7080078125, 17.490234375, 18.2724609375, 19.0546875, 19.8369140625, 20.619140625, 21.4013671875, 22.18359375, 22.9658203125, 23.748046875, 24.5302734375, 25.3125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 8.0, 4.0, 7.0, 11.0, 9.0, 20.0, 25.0, 22.0, 30.0, 34.0, 41.0, 47.0, 51.0, 51.0, 55.0, 53.0, 56.0, 65.0, 52.0, 51.0, 49.0, 55.0, 34.0, 44.0, 25.0, 21.0, 15.0, 12.0, 8.0, 6.0, 8.0, 7.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69873046875, -0.6770706176757812, -0.6554107666015625, -0.6337509155273438, -0.612091064453125, -0.5904312133789062, -0.5687713623046875, -0.5471115112304688, -0.52545166015625, -0.5037918090820312, -0.4821319580078125, -0.46047210693359375, -0.438812255859375, -0.41715240478515625, -0.3954925537109375, -0.37383270263671875, -0.3521728515625, -0.33051300048828125, -0.3088531494140625, -0.28719329833984375, -0.265533447265625, -0.24387359619140625, -0.2222137451171875, -0.20055389404296875, -0.17889404296875, -0.15723419189453125, -0.1355743408203125, -0.11391448974609375, -0.092254638671875, -0.07059478759765625, -0.0489349365234375, -0.02727508544921875, -0.005615234375, 0.01604461669921875, 0.0377044677734375, 0.05936431884765625, 0.081024169921875, 0.10268402099609375, 0.1243438720703125, 0.14600372314453125, 0.16766357421875, 0.18932342529296875, 0.2109832763671875, 0.23264312744140625, 0.254302978515625, 0.27596282958984375, 0.2976226806640625, 0.31928253173828125, 0.3409423828125, 0.36260223388671875, 0.3842620849609375, 0.40592193603515625, 0.427581787109375, 0.44924163818359375, 0.4709014892578125, 0.49256134033203125, 0.51422119140625, 0.5358810424804688, 0.5575408935546875, 0.5792007446289062, 0.600860595703125, 0.6225204467773438, 0.6441802978515625, 0.6658401489257812, 0.6875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 6.0, 2.0, 1.0, 7.0, 13.0, 19.0, 30.0, 52.0, 71.0, 103.0, 231.0, 414.0, 937.0, 2835.0, 10521.0, 53188.0, 454840.0, 3444234.0, 188032.0, 28805.0, 6365.0, 1926.0, 737.0, 388.0, 200.0, 119.0, 76.0, 54.0, 27.0, 23.0, 14.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.5, -15.955810546875, -15.41162109375, -14.867431640625, -14.3232421875, -13.779052734375, -13.23486328125, -12.690673828125, -12.146484375, -11.602294921875, -11.05810546875, -10.513916015625, -9.9697265625, -9.425537109375, -8.88134765625, -8.337158203125, -7.79296875, -7.248779296875, -6.70458984375, -6.160400390625, -5.6162109375, -5.072021484375, -4.52783203125, -3.983642578125, -3.439453125, -2.895263671875, -2.35107421875, -1.806884765625, -1.2626953125, -0.718505859375, -0.17431640625, 0.369873046875, 0.9140625, 1.458251953125, 2.00244140625, 2.546630859375, 3.0908203125, 3.635009765625, 4.17919921875, 4.723388671875, 5.267578125, 5.811767578125, 6.35595703125, 6.900146484375, 7.4443359375, 7.988525390625, 8.53271484375, 9.076904296875, 9.62109375, 10.165283203125, 10.70947265625, 11.253662109375, 11.7978515625, 12.342041015625, 12.88623046875, 13.430419921875, 13.974609375, 14.518798828125, 15.06298828125, 15.607177734375, 16.1513671875, 16.695556640625, 17.23974609375, 17.783935546875, 18.328125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 6.0, 6.0, 8.0, 5.0, 16.0, 17.0, 28.0, 21.0, 44.0, 58.0, 94.0, 139.0, 245.0, 443.0, 1516.0, 640.0, 246.0, 156.0, 113.0, 73.0, 56.0, 40.0, 27.0, 21.0, 25.0, 9.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.705078125, -1.62994384765625, -1.5548095703125, -1.47967529296875, -1.404541015625, -1.32940673828125, -1.2542724609375, -1.17913818359375, -1.10400390625, -1.02886962890625, -0.9537353515625, -0.87860107421875, -0.803466796875, -0.72833251953125, -0.6531982421875, -0.57806396484375, -0.5029296875, -0.42779541015625, -0.3526611328125, -0.27752685546875, -0.202392578125, -0.12725830078125, -0.0521240234375, 0.02301025390625, 0.09814453125, 0.17327880859375, 0.2484130859375, 0.32354736328125, 0.398681640625, 0.47381591796875, 0.5489501953125, 0.62408447265625, 0.69921875, 0.77435302734375, 0.8494873046875, 0.92462158203125, 0.999755859375, 1.07489013671875, 1.1500244140625, 1.22515869140625, 1.30029296875, 1.37542724609375, 1.4505615234375, 1.52569580078125, 1.600830078125, 1.67596435546875, 1.7510986328125, 1.82623291015625, 1.9013671875, 1.97650146484375, 2.0516357421875, 2.12677001953125, 2.201904296875, 2.27703857421875, 2.3521728515625, 2.42730712890625, 2.50244140625, 2.57757568359375, 2.6527099609375, 2.72784423828125, 2.802978515625, 2.87811279296875, 2.9532470703125, 3.02838134765625, 3.103515625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 22.0, 37.0, 59.0, 88.0, 115.0, 184.0, 157.0, 105.0, 78.0, 51.0, 25.0, 31.0, 15.0, 13.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-22.640647888183594, -22.01165771484375, -21.38266944885254, -20.753679275512695, -20.124691009521484, -19.49570083618164, -18.86671257019043, -18.237722396850586, -17.608734130859375, -16.97974395751953, -16.35075569152832, -15.721766471862793, -15.092777252197266, -14.463788032531738, -13.834798812866211, -13.205808639526367, -12.57681941986084, -11.947830200195312, -11.318840980529785, -10.689851760864258, -10.06086254119873, -9.431873321533203, -8.80288314819336, -8.173894882202148, -7.544905185699463, -6.9159159660339355, -6.286926746368408, -5.657937049865723, -5.028947830200195, -4.399958610534668, -3.7709693908691406, -3.1419801712036133, -2.512990951538086, -1.8840017318725586, -1.2550123929977417, -0.6260230541229248, 0.002966165542602539, 0.6319553852081299, 1.2609448432922363, 1.8899340629577637, 2.518923282623291, 3.1479125022888184, 3.7769017219543457, 4.405891418457031, 5.034880638122559, 5.663869857788086, 6.292859077453613, 6.921848297119141, 7.550837516784668, 8.179826736450195, 8.808815956115723, 9.43780517578125, 10.066794395446777, 10.695783615112305, 11.324773788452148, 11.95376205444336, 12.582752227783203, 13.21174144744873, 13.840730667114258, 14.469719886779785, 15.098709106445312, 15.72769832611084, 16.356687545776367, 16.98567771911621, 17.614665985107422]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 5.0, 7.0, 7.0, 8.0, 11.0, 19.0, 21.0, 19.0, 16.0, 26.0, 26.0, 26.0, 31.0, 45.0, 35.0, 39.0, 36.0, 37.0, 44.0, 38.0, 36.0, 44.0, 42.0, 35.0, 37.0, 33.0, 34.0, 34.0, 27.0, 17.0, 32.0, 23.0, 11.0, 14.0, 19.0, 11.0, 10.0, 5.0, 5.0, 10.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-7.466585159301758, -7.247486591339111, -7.028387546539307, -6.80928897857666, -6.5901899337768555, -6.371091365814209, -6.1519927978515625, -5.932893753051758, -5.713794708251953, -5.494696140289307, -5.275597095489502, -5.0564985275268555, -4.837399482727051, -4.618300914764404, -4.399202346801758, -4.180103302001953, -3.9610047340393066, -3.741905927658081, -3.5228071212768555, -3.303708553314209, -3.0846095085144043, -2.865510940551758, -2.6464121341705322, -2.4273133277893066, -2.208214521408081, -1.9891157150268555, -1.7700169086456299, -1.5509182214736938, -1.3318194150924683, -1.1127206087112427, -0.8936219215393066, -0.674523115158081, -0.45542430877685547, -0.23632553219795227, -0.017226755619049072, 0.20187199115753174, 0.4209707975387573, 0.6400696039199829, 0.859168291091919, 1.0782670974731445, 1.2973659038543701, 1.5164647102355957, 1.7355635166168213, 1.9546622037887573, 2.1737608909606934, 2.392859935760498, 2.6119585037231445, 2.83105731010437, 3.0501561164855957, 3.2692549228668213, 3.488353729248047, 3.7074522972106934, 3.926551342010498, 4.1456499099731445, 4.364748954772949, 4.583847522735596, 4.802946090698242, 5.022044658660889, 5.241143703460693, 5.46024227142334, 5.6793413162231445, 5.898439884185791, 6.1175384521484375, 6.336637496948242, 6.555736541748047]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 13.0, 12.0, 18.0, 32.0, 28.0, 49.0, 83.0, 118.0, 172.0, 246.0, 417.0, 729.0, 1177.0, 2121.0, 3817.0, 6980.0, 13839.0, 27172.0, 54818.0, 108792.0, 198948.0, 258512.0, 178245.0, 95197.0, 47088.0, 23755.0, 11877.0, 6192.0, 3409.0, 1832.0, 1073.0, 699.0, 401.0, 214.0, 157.0, 97.0, 62.0, 42.0, 40.0, 24.0, 15.0, 23.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.296875, -4.16424560546875, -4.0316162109375, -3.89898681640625, -3.766357421875, -3.63372802734375, -3.5010986328125, -3.36846923828125, -3.23583984375, -3.10321044921875, -2.9705810546875, -2.83795166015625, -2.705322265625, -2.57269287109375, -2.4400634765625, -2.30743408203125, -2.1748046875, -2.04217529296875, -1.9095458984375, -1.77691650390625, -1.644287109375, -1.51165771484375, -1.3790283203125, -1.24639892578125, -1.11376953125, -0.98114013671875, -0.8485107421875, -0.71588134765625, -0.583251953125, -0.45062255859375, -0.3179931640625, -0.18536376953125, -0.052734375, 0.07989501953125, 0.2125244140625, 0.34515380859375, 0.477783203125, 0.61041259765625, 0.7430419921875, 0.87567138671875, 1.00830078125, 1.14093017578125, 1.2735595703125, 1.40618896484375, 1.538818359375, 1.67144775390625, 1.8040771484375, 1.93670654296875, 2.0693359375, 2.20196533203125, 2.3345947265625, 2.46722412109375, 2.599853515625, 2.73248291015625, 2.8651123046875, 2.99774169921875, 3.13037109375, 3.26300048828125, 3.3956298828125, 3.52825927734375, 3.660888671875, 3.79351806640625, 3.9261474609375, 4.05877685546875, 4.19140625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 6.0, 11.0, 12.0, 14.0, 26.0, 25.0, 33.0, 29.0, 43.0, 50.0, 57.0, 44.0, 55.0, 63.0, 78.0, 69.0, 69.0, 53.0, 73.0, 27.0, 36.0, 22.0, 33.0, 21.0, 16.0, 13.0, 12.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8427734375, -0.8172683715820312, -0.7917633056640625, -0.7662582397460938, -0.740753173828125, -0.7152481079101562, -0.6897430419921875, -0.6642379760742188, -0.63873291015625, -0.6132278442382812, -0.5877227783203125, -0.5622177124023438, -0.536712646484375, -0.5112075805664062, -0.4857025146484375, -0.46019744873046875, -0.4346923828125, -0.40918731689453125, -0.3836822509765625, -0.35817718505859375, -0.332672119140625, -0.30716705322265625, -0.2816619873046875, -0.25615692138671875, -0.23065185546875, -0.20514678955078125, -0.1796417236328125, -0.15413665771484375, -0.128631591796875, -0.10312652587890625, -0.0776214599609375, -0.05211639404296875, -0.026611328125, -0.00110626220703125, 0.0243988037109375, 0.04990386962890625, 0.075408935546875, 0.10091400146484375, 0.1264190673828125, 0.15192413330078125, 0.17742919921875, 0.20293426513671875, 0.2284393310546875, 0.25394439697265625, 0.279449462890625, 0.30495452880859375, 0.3304595947265625, 0.35596466064453125, 0.3814697265625, 0.40697479248046875, 0.4324798583984375, 0.45798492431640625, 0.483489990234375, 0.5089950561523438, 0.5345001220703125, 0.5600051879882812, 0.58551025390625, 0.6110153198242188, 0.6365203857421875, 0.6620254516601562, 0.687530517578125, 0.7130355834960938, 0.7385406494140625, 0.7640457153320312, 0.78955078125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 8.0, 7.0, 13.0, 13.0, 25.0, 29.0, 48.0, 70.0, 96.0, 140.0, 244.0, 414.0, 649.0, 1466.0, 4964.0, 29355.0, 250802.0, 621370.0, 118394.0, 14671.0, 3057.0, 1168.0, 577.0, 342.0, 210.0, 116.0, 87.0, 64.0, 50.0, 22.0, 9.0, 21.0, 14.0, 10.0, 4.0, 5.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6328125, -11.236083984375, -10.83935546875, -10.442626953125, -10.0458984375, -9.649169921875, -9.25244140625, -8.855712890625, -8.458984375, -8.062255859375, -7.66552734375, -7.268798828125, -6.8720703125, -6.475341796875, -6.07861328125, -5.681884765625, -5.28515625, -4.888427734375, -4.49169921875, -4.094970703125, -3.6982421875, -3.301513671875, -2.90478515625, -2.508056640625, -2.111328125, -1.714599609375, -1.31787109375, -0.921142578125, -0.5244140625, -0.127685546875, 0.26904296875, 0.665771484375, 1.0625, 1.459228515625, 1.85595703125, 2.252685546875, 2.6494140625, 3.046142578125, 3.44287109375, 3.839599609375, 4.236328125, 4.633056640625, 5.02978515625, 5.426513671875, 5.8232421875, 6.219970703125, 6.61669921875, 7.013427734375, 7.41015625, 7.806884765625, 8.20361328125, 8.600341796875, 8.9970703125, 9.393798828125, 9.79052734375, 10.187255859375, 10.583984375, 10.980712890625, 11.37744140625, 11.774169921875, 12.1708984375, 12.567626953125, 12.96435546875, 13.361083984375, 13.7578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 2.0, 10.0, 4.0, 5.0, 12.0, 13.0, 20.0, 21.0, 11.0, 21.0, 17.0, 30.0, 32.0, 23.0, 37.0, 29.0, 40.0, 28.0, 32.0, 45.0, 34.0, 37.0, 42.0, 30.0, 23.0, 37.0, 35.0, 40.0, 30.0, 26.0, 23.0, 29.0, 17.0, 25.0, 18.0, 21.0, 19.0, 11.0, 9.0, 13.0, 2.0, 5.0, 11.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 7.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-2.6953125, -2.603851318359375, -2.51239013671875, -2.420928955078125, -2.3294677734375, -2.238006591796875, -2.14654541015625, -2.055084228515625, -1.963623046875, -1.872161865234375, -1.78070068359375, -1.689239501953125, -1.5977783203125, -1.506317138671875, -1.41485595703125, -1.323394775390625, -1.23193359375, -1.140472412109375, -1.04901123046875, -0.957550048828125, -0.8660888671875, -0.774627685546875, -0.68316650390625, -0.591705322265625, -0.500244140625, -0.408782958984375, -0.31732177734375, -0.225860595703125, -0.1343994140625, -0.042938232421875, 0.04852294921875, 0.139984130859375, 0.2314453125, 0.322906494140625, 0.41436767578125, 0.505828857421875, 0.5972900390625, 0.688751220703125, 0.78021240234375, 0.871673583984375, 0.963134765625, 1.054595947265625, 1.14605712890625, 1.237518310546875, 1.3289794921875, 1.420440673828125, 1.51190185546875, 1.603363037109375, 1.69482421875, 1.786285400390625, 1.87774658203125, 1.969207763671875, 2.0606689453125, 2.152130126953125, 2.24359130859375, 2.335052490234375, 2.426513671875, 2.517974853515625, 2.60943603515625, 2.700897216796875, 2.7923583984375, 2.883819580078125, 2.97528076171875, 3.066741943359375, 3.158203125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 9.0, 15.0, 18.0, 29.0, 38.0, 52.0, 82.0, 114.0, 178.0, 275.0, 566.0, 931.0, 1796.0, 3783.0, 8710.0, 22786.0, 69000.0, 206756.0, 379512.0, 231592.0, 78169.0, 25704.0, 9893.0, 4119.0, 1979.0, 969.0, 543.0, 351.0, 162.0, 137.0, 74.0, 67.0, 41.0, 29.0, 15.0, 7.0, 6.0, 11.0, 11.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.922576904296875, -3.79827880859375, -3.673980712890625, -3.5496826171875, -3.425384521484375, -3.30108642578125, -3.176788330078125, -3.052490234375, -2.928192138671875, -2.80389404296875, -2.679595947265625, -2.5552978515625, -2.430999755859375, -2.30670166015625, -2.182403564453125, -2.05810546875, -1.933807373046875, -1.80950927734375, -1.685211181640625, -1.5609130859375, -1.436614990234375, -1.31231689453125, -1.188018798828125, -1.063720703125, -0.939422607421875, -0.81512451171875, -0.690826416015625, -0.5665283203125, -0.442230224609375, -0.31793212890625, -0.193634033203125, -0.0693359375, 0.054962158203125, 0.17926025390625, 0.303558349609375, 0.4278564453125, 0.552154541015625, 0.67645263671875, 0.800750732421875, 0.925048828125, 1.049346923828125, 1.17364501953125, 1.297943115234375, 1.4222412109375, 1.546539306640625, 1.67083740234375, 1.795135498046875, 1.91943359375, 2.043731689453125, 2.16802978515625, 2.292327880859375, 2.4166259765625, 2.540924072265625, 2.66522216796875, 2.789520263671875, 2.913818359375, 3.038116455078125, 3.16241455078125, 3.286712646484375, 3.4110107421875, 3.535308837890625, 3.65960693359375, 3.783905029296875, 3.908203125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 8.0, 12.0, 11.0, 14.0, 20.0, 26.0, 40.0, 42.0, 74.0, 56.0, 79.0, 76.0, 91.0, 81.0, 68.0, 67.0, 53.0, 38.0, 24.0, 30.0, 24.0, 10.0, 9.0, 6.0, 5.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004622936248779297, -0.00044478848576545715, -0.0004272833466529846, -0.0004097782075405121, -0.00039227306842803955, -0.000374767929315567, -0.0003572627902030945, -0.00033975765109062195, -0.0003222525119781494, -0.0003047473728656769, -0.00028724223375320435, -0.0002697370946407318, -0.0002522319555282593, -0.00023472681641578674, -0.0002172216773033142, -0.00019971653819084167, -0.00018221139907836914, -0.0001647062599658966, -0.00014720112085342407, -0.00012969598174095154, -0.000112190842628479, -9.468570351600647e-05, -7.718056440353394e-05, -5.96754252910614e-05, -4.217028617858887e-05, -2.4665147066116333e-05, -7.160007953643799e-06, 1.0345131158828735e-05, 2.785027027130127e-05, 4.5355409383773804e-05, 6.286054849624634e-05, 8.036568760871887e-05, 9.78708267211914e-05, 0.00011537596583366394, 0.00013288110494613647, 0.000150386244058609, 0.00016789138317108154, 0.00018539652228355408, 0.0002029016613960266, 0.00022040680050849915, 0.00023791193962097168, 0.0002554170787334442, 0.00027292221784591675, 0.0002904273569583893, 0.0003079324960708618, 0.00032543763518333435, 0.0003429427742958069, 0.0003604479134082794, 0.00037795305252075195, 0.0003954581916332245, 0.000412963330745697, 0.00043046846985816956, 0.0004479736089706421, 0.0004654787480831146, 0.00048298388719558716, 0.0005004890263080597, 0.0005179941654205322, 0.0005354993045330048, 0.0005530044436454773, 0.0005705095827579498, 0.0005880147218704224, 0.0006055198609828949, 0.0006230250000953674, 0.00064053013920784, 0.0006580352783203125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 7.0, 11.0, 12.0, 29.0, 38.0, 39.0, 108.0, 199.0, 353.0, 745.0, 1853.0, 6155.0, 30780.0, 304006.0, 614038.0, 74280.0, 11080.0, 2818.0, 1040.0, 440.0, 212.0, 116.0, 60.0, 43.0, 25.0, 22.0, 11.0, 3.0, 10.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8359375, -8.533447265625, -8.23095703125, -7.928466796875, -7.6259765625, -7.323486328125, -7.02099609375, -6.718505859375, -6.416015625, -6.113525390625, -5.81103515625, -5.508544921875, -5.2060546875, -4.903564453125, -4.60107421875, -4.298583984375, -3.99609375, -3.693603515625, -3.39111328125, -3.088623046875, -2.7861328125, -2.483642578125, -2.18115234375, -1.878662109375, -1.576171875, -1.273681640625, -0.97119140625, -0.668701171875, -0.3662109375, -0.063720703125, 0.23876953125, 0.541259765625, 0.84375, 1.146240234375, 1.44873046875, 1.751220703125, 2.0537109375, 2.356201171875, 2.65869140625, 2.961181640625, 3.263671875, 3.566162109375, 3.86865234375, 4.171142578125, 4.4736328125, 4.776123046875, 5.07861328125, 5.381103515625, 5.68359375, 5.986083984375, 6.28857421875, 6.591064453125, 6.8935546875, 7.196044921875, 7.49853515625, 7.801025390625, 8.103515625, 8.406005859375, 8.70849609375, 9.010986328125, 9.3134765625, 9.615966796875, 9.91845703125, 10.220947265625, 10.5234375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 8.0, 3.0, 9.0, 19.0, 12.0, 20.0, 31.0, 30.0, 39.0, 50.0, 73.0, 76.0, 62.0, 92.0, 87.0, 72.0, 73.0, 54.0, 50.0, 29.0, 21.0, 21.0, 12.0, 16.0, 12.0, 9.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.22265625, -4.12652587890625, -4.0303955078125, -3.93426513671875, -3.838134765625, -3.74200439453125, -3.6458740234375, -3.54974365234375, -3.45361328125, -3.35748291015625, -3.2613525390625, -3.16522216796875, -3.069091796875, -2.97296142578125, -2.8768310546875, -2.78070068359375, -2.6845703125, -2.58843994140625, -2.4923095703125, -2.39617919921875, -2.300048828125, -2.20391845703125, -2.1077880859375, -2.01165771484375, -1.91552734375, -1.81939697265625, -1.7232666015625, -1.62713623046875, -1.531005859375, -1.43487548828125, -1.3387451171875, -1.24261474609375, -1.146484375, -1.05035400390625, -0.9542236328125, -0.85809326171875, -0.761962890625, -0.66583251953125, -0.5697021484375, -0.47357177734375, -0.37744140625, -0.28131103515625, -0.1851806640625, -0.08905029296875, 0.007080078125, 0.10321044921875, 0.1993408203125, 0.29547119140625, 0.3916015625, 0.48773193359375, 0.5838623046875, 0.67999267578125, 0.776123046875, 0.87225341796875, 0.9683837890625, 1.06451416015625, 1.16064453125, 1.25677490234375, 1.3529052734375, 1.44903564453125, 1.545166015625, 1.64129638671875, 1.7374267578125, 1.83355712890625, 1.9296875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 3.0, 6.0, 5.0, 10.0, 30.0, 46.0, 82.0, 108.0, 167.0, 181.0, 131.0, 102.0, 57.0, 32.0, 15.0, 13.0, 7.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-69.88543701171875, -68.19379425048828, -66.50214385986328, -64.81050109863281, -63.11885070800781, -61.427207946777344, -59.73556137084961, -58.043914794921875, -56.35226821899414, -54.660621643066406, -52.96897506713867, -51.27732849121094, -49.58568572998047, -47.89403533935547, -46.202392578125, -44.510746002197266, -42.81909942626953, -41.1274528503418, -39.43580627441406, -37.74415969848633, -36.052513122558594, -34.360870361328125, -32.66922378540039, -30.977577209472656, -29.285930633544922, -27.594284057617188, -25.902637481689453, -24.21099281311035, -22.519346237182617, -20.827699661254883, -19.13605499267578, -17.444408416748047, -15.752761840820312, -14.061115264892578, -12.36946964263916, -10.677824020385742, -8.986177444458008, -7.294530868530273, -5.6028852462768555, -3.9112396240234375, -2.219593048095703, -0.527946949005127, 1.1636991500854492, 2.8553452491760254, 4.546991348266602, 6.238637924194336, 7.930283546447754, 9.621929168701172, 11.313575744628906, 13.00522232055664, 14.696867942810059, 16.388513565063477, 18.08016014099121, 19.771806716918945, 21.463451385498047, 23.15509796142578, 24.846744537353516, 26.53839111328125, 28.230037689208984, 29.921682357788086, 31.61332893371582, 33.30497741699219, 34.996620178222656, 36.68826675415039, 38.379913330078125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 9.0, 11.0, 17.0, 13.0, 19.0, 40.0, 39.0, 40.0, 57.0, 46.0, 53.0, 69.0, 66.0, 65.0, 62.0, 56.0, 60.0, 45.0, 46.0, 43.0, 31.0, 27.0, 22.0, 19.0, 14.0, 8.0, 9.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.39739227294922, -23.33258056640625, -22.26776695251465, -21.20295524597168, -20.138141632080078, -19.07332992553711, -18.00851821899414, -16.943706512451172, -15.87889289855957, -14.814080238342285, -13.749267578125, -12.684455871582031, -11.619643211364746, -10.554830551147461, -9.490018844604492, -8.425206184387207, -7.360393524169922, -6.295580863952637, -5.23076868057251, -4.165956497192383, -3.1011438369750977, -2.0363311767578125, -0.9715189933776855, 0.0932931900024414, 1.1581058502197266, 2.2229182720184326, 3.2877306938171387, 4.352542877197266, 5.417355537414551, 6.482168197631836, 7.546980381011963, 8.61179256439209, 9.676605224609375, 10.74141788482666, 11.806230545043945, 12.871042251586914, 13.9358549118042, 15.000667572021484, 16.065479278564453, 17.130290985107422, 18.195104598999023, 19.259916305541992, 20.324729919433594, 21.389541625976562, 22.45435333251953, 23.519166946411133, 24.5839786529541, 25.648792266845703, 26.713603973388672, 27.77841567993164, 28.843229293823242, 29.90804100036621, 30.972854614257812, 32.03766632080078, 33.10247802734375, 34.16728973388672, 35.23210144042969, 36.296913146972656, 37.361724853515625, 38.42654037475586, 39.49135208129883, 40.5561637878418, 41.620975494384766, 42.685787200927734, 43.75060272216797]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 14.0, 13.0, 30.0, 28.0, 51.0, 60.0, 82.0, 104.0, 177.0, 242.0, 366.0, 684.0, 1153.0, 2417.0, 5130.0, 12425.0, 36777.0, 160907.0, 3352730.0, 511934.0, 73300.0, 21152.0, 7682.0, 3185.0, 1506.0, 774.0, 490.0, 286.0, 166.0, 137.0, 77.0, 56.0, 45.0, 23.0, 20.0, 11.0, 14.0, 5.0, 7.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.953125, -9.6396484375, -9.326171875, -9.0126953125, -8.69921875, -8.3857421875, -8.072265625, -7.7587890625, -7.4453125, -7.1318359375, -6.818359375, -6.5048828125, -6.19140625, -5.8779296875, -5.564453125, -5.2509765625, -4.9375, -4.6240234375, -4.310546875, -3.9970703125, -3.68359375, -3.3701171875, -3.056640625, -2.7431640625, -2.4296875, -2.1162109375, -1.802734375, -1.4892578125, -1.17578125, -0.8623046875, -0.548828125, -0.2353515625, 0.078125, 0.3916015625, 0.705078125, 1.0185546875, 1.33203125, 1.6455078125, 1.958984375, 2.2724609375, 2.5859375, 2.8994140625, 3.212890625, 3.5263671875, 3.83984375, 4.1533203125, 4.466796875, 4.7802734375, 5.09375, 5.4072265625, 5.720703125, 6.0341796875, 6.34765625, 6.6611328125, 6.974609375, 7.2880859375, 7.6015625, 7.9150390625, 8.228515625, 8.5419921875, 8.85546875, 9.1689453125, 9.482421875, 9.7958984375, 10.109375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 8.0, 6.0, 8.0, 12.0, 13.0, 8.0, 20.0, 14.0, 25.0, 15.0, 22.0, 23.0, 32.0, 30.0, 29.0, 38.0, 40.0, 44.0, 34.0, 53.0, 37.0, 50.0, 43.0, 44.0, 41.0, 44.0, 32.0, 32.0, 32.0, 27.0, 24.0, 23.0, 26.0, 18.0, 20.0, 10.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.623046875, -0.6031417846679688, -0.5832366943359375, -0.5633316040039062, -0.543426513671875, -0.5235214233398438, -0.5036163330078125, -0.48371124267578125, -0.46380615234375, -0.44390106201171875, -0.4239959716796875, -0.40409088134765625, -0.384185791015625, -0.36428070068359375, -0.3443756103515625, -0.32447052001953125, -0.3045654296875, -0.28466033935546875, -0.2647552490234375, -0.24485015869140625, -0.224945068359375, -0.20503997802734375, -0.1851348876953125, -0.16522979736328125, -0.14532470703125, -0.12541961669921875, -0.1055145263671875, -0.08560943603515625, -0.065704345703125, -0.04579925537109375, -0.0258941650390625, -0.00598907470703125, 0.013916015625, 0.03382110595703125, 0.0537261962890625, 0.07363128662109375, 0.093536376953125, 0.11344146728515625, 0.1333465576171875, 0.15325164794921875, 0.17315673828125, 0.19306182861328125, 0.2129669189453125, 0.23287200927734375, 0.252777099609375, 0.27268218994140625, 0.2925872802734375, 0.31249237060546875, 0.3323974609375, 0.35230255126953125, 0.3722076416015625, 0.39211273193359375, 0.412017822265625, 0.43192291259765625, 0.4518280029296875, 0.47173309326171875, 0.49163818359375, 0.5115432739257812, 0.5314483642578125, 0.5513534545898438, 0.571258544921875, 0.5911636352539062, 0.6110687255859375, 0.6309738159179688, 0.65087890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 9.0, 7.0, 14.0, 17.0, 29.0, 30.0, 47.0, 58.0, 79.0, 159.0, 397.0, 965.0, 3461.0, 15458.0, 100457.0, 3002505.0, 987510.0, 67277.0, 11552.0, 2654.0, 769.0, 335.0, 173.0, 83.0, 61.0, 40.0, 33.0, 21.0, 24.0, 18.0, 11.0, 11.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.140625, -14.680419921875, -14.22021484375, -13.760009765625, -13.2998046875, -12.839599609375, -12.37939453125, -11.919189453125, -11.458984375, -10.998779296875, -10.53857421875, -10.078369140625, -9.6181640625, -9.157958984375, -8.69775390625, -8.237548828125, -7.77734375, -7.317138671875, -6.85693359375, -6.396728515625, -5.9365234375, -5.476318359375, -5.01611328125, -4.555908203125, -4.095703125, -3.635498046875, -3.17529296875, -2.715087890625, -2.2548828125, -1.794677734375, -1.33447265625, -0.874267578125, -0.4140625, 0.046142578125, 0.50634765625, 0.966552734375, 1.4267578125, 1.886962890625, 2.34716796875, 2.807373046875, 3.267578125, 3.727783203125, 4.18798828125, 4.648193359375, 5.1083984375, 5.568603515625, 6.02880859375, 6.489013671875, 6.94921875, 7.409423828125, 7.86962890625, 8.329833984375, 8.7900390625, 9.250244140625, 9.71044921875, 10.170654296875, 10.630859375, 11.091064453125, 11.55126953125, 12.011474609375, 12.4716796875, 12.931884765625, 13.39208984375, 13.852294921875, 14.3125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 6.0, 7.0, 6.0, 8.0, 13.0, 10.0, 15.0, 14.0, 34.0, 32.0, 45.0, 64.0, 89.0, 97.0, 135.0, 241.0, 458.0, 1236.0, 567.0, 278.0, 191.0, 124.0, 95.0, 71.0, 50.0, 39.0, 39.0, 18.0, 18.0, 15.0, 9.0, 9.0, 10.0, 8.0, 7.0, 1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5693359375, -1.5146331787109375, -1.459930419921875, -1.4052276611328125, -1.35052490234375, -1.2958221435546875, -1.241119384765625, -1.1864166259765625, -1.1317138671875, -1.0770111083984375, -1.022308349609375, -0.9676055908203125, -0.91290283203125, -0.8582000732421875, -0.803497314453125, -0.7487945556640625, -0.694091796875, -0.6393890380859375, -0.584686279296875, -0.5299835205078125, -0.47528076171875, -0.4205780029296875, -0.365875244140625, -0.3111724853515625, -0.2564697265625, -0.2017669677734375, -0.147064208984375, -0.0923614501953125, -0.03765869140625, 0.0170440673828125, 0.071746826171875, 0.1264495849609375, 0.18115234375, 0.2358551025390625, 0.290557861328125, 0.3452606201171875, 0.39996337890625, 0.4546661376953125, 0.509368896484375, 0.5640716552734375, 0.6187744140625, 0.6734771728515625, 0.728179931640625, 0.7828826904296875, 0.83758544921875, 0.8922882080078125, 0.946990966796875, 1.0016937255859375, 1.056396484375, 1.1110992431640625, 1.165802001953125, 1.2205047607421875, 1.27520751953125, 1.3299102783203125, 1.384613037109375, 1.4393157958984375, 1.4940185546875, 1.5487213134765625, 1.603424072265625, 1.6581268310546875, 1.71282958984375, 1.7675323486328125, 1.822235107421875, 1.8769378662109375, 1.931640625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 10.0, 48.0, 103.0, 194.0, 243.0, 212.0, 106.0, 49.0, 22.0, 5.0, 4.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.544408798217773, -14.5470552444458, -13.549701690673828, -12.552349090576172, -11.5549955368042, -10.557641983032227, -9.56028938293457, -8.562935829162598, -7.565582275390625, -6.568228721618652, -5.570875644683838, -4.573522567749023, -3.576169013977051, -2.578815460205078, -1.5814623832702637, -0.5841093063354492, 0.41324424743652344, 1.410597562789917, 2.4079508781433105, 3.405304193496704, 4.402657508850098, 5.40001106262207, 6.397364139556885, 7.394717216491699, 8.392070770263672, 9.389424324035645, 10.386777877807617, 11.384130477905273, 12.381484031677246, 13.378837585449219, 14.376190185546875, 15.373543739318848, 16.370899200439453, 17.36825180053711, 18.3656063079834, 19.362958908081055, 20.360313415527344, 21.357666015625, 22.355018615722656, 23.352371215820312, 24.3497257232666, 25.347078323364258, 26.344432830810547, 27.341785430908203, 28.33913803100586, 29.33649253845215, 30.333845138549805, 31.331199645996094, 32.32855224609375, 33.325904846191406, 34.32325744628906, 35.320613861083984, 36.31796646118164, 37.3153190612793, 38.31267166137695, 39.31002426147461, 40.30738067626953, 41.30473327636719, 42.302085876464844, 43.299442291259766, 44.29679489135742, 45.29414749145508, 46.291500091552734, 47.28885269165039, 48.28620529174805]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 8.0, 8.0, 15.0, 12.0, 16.0, 14.0, 24.0, 30.0, 31.0, 33.0, 43.0, 33.0, 50.0, 48.0, 42.0, 57.0, 44.0, 42.0, 47.0, 50.0, 46.0, 41.0, 37.0, 41.0, 21.0, 19.0, 23.0, 30.0, 19.0, 19.0, 11.0, 13.0, 10.0, 9.0, 6.0, 8.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.305354595184326, -7.049162864685059, -6.792971134185791, -6.536779403686523, -6.280587196350098, -6.02439546585083, -5.7682037353515625, -5.512012004852295, -5.255820274353027, -4.99962854385376, -4.743436813354492, -4.487244606018066, -4.231052875518799, -3.9748611450195312, -3.7186694145202637, -3.462477684020996, -3.2062854766845703, -2.9500937461853027, -2.693901777267456, -2.4377100467681885, -2.181518077850342, -1.9253263473510742, -1.6691346168518066, -1.4129427671432495, -1.1567509174346924, -0.9005590677261353, -0.6443672776222229, -0.38817548751831055, -0.13198363780975342, 0.12420821189880371, 0.3803999423980713, 0.6365917921066284, 0.8927831649780273, 1.1489750146865845, 1.4051668643951416, 1.6613585948944092, 1.9175504446029663, 2.1737422943115234, 2.429934024810791, 2.6861257553100586, 2.9423177242279053, 3.198509454727173, 3.4547014236450195, 3.710893154144287, 3.9670848846435547, 4.2232770919799805, 4.47946834564209, 4.735660552978516, 4.991852283477783, 5.248044013977051, 5.504235744476318, 5.760427474975586, 6.016619682312012, 6.272811412811279, 6.529003143310547, 6.7851948738098145, 7.041386604309082, 7.29757833480835, 7.553770065307617, 7.809962272644043, 8.066153526306152, 8.322345733642578, 8.578536987304688, 8.834729194641113, 9.090921401977539]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 17.0, 14.0, 23.0, 45.0, 65.0, 85.0, 190.0, 298.0, 423.0, 743.0, 1192.0, 2097.0, 3695.0, 6571.0, 12119.0, 23180.0, 43364.0, 81095.0, 144999.0, 221055.0, 212815.0, 134346.0, 74296.0, 39144.0, 21088.0, 11302.0, 6120.0, 3322.0, 1892.0, 1139.0, 722.0, 425.0, 241.0, 139.0, 85.0, 69.0, 40.0, 30.0, 27.0, 7.0, 20.0, 10.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1640625, -3.0546875, -2.9453125, -2.8359375, -2.7265625, -2.6171875, -2.5078125, -2.3984375, -2.2890625, -2.1796875, -2.0703125, -1.9609375, -1.8515625, -1.7421875, -1.6328125, -1.5234375, -1.4140625, -1.3046875, -1.1953125, -1.0859375, -0.9765625, -0.8671875, -0.7578125, -0.6484375, -0.5390625, -0.4296875, -0.3203125, -0.2109375, -0.1015625, 0.0078125, 0.1171875, 0.2265625, 0.3359375, 0.4453125, 0.5546875, 0.6640625, 0.7734375, 0.8828125, 0.9921875, 1.1015625, 1.2109375, 1.3203125, 1.4296875, 1.5390625, 1.6484375, 1.7578125, 1.8671875, 1.9765625, 2.0859375, 2.1953125, 2.3046875, 2.4140625, 2.5234375, 2.6328125, 2.7421875, 2.8515625, 2.9609375, 3.0703125, 3.1796875, 3.2890625, 3.3984375, 3.5078125, 3.6171875, 3.7265625, 3.8359375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 13.0, 4.0, 6.0, 12.0, 9.0, 15.0, 19.0, 23.0, 17.0, 17.0, 28.0, 23.0, 32.0, 31.0, 37.0, 37.0, 37.0, 46.0, 38.0, 48.0, 50.0, 39.0, 43.0, 46.0, 36.0, 40.0, 33.0, 41.0, 29.0, 21.0, 26.0, 26.0, 21.0, 10.0, 9.0, 10.0, 7.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6796875, -0.6588134765625, -0.637939453125, -0.6170654296875, -0.59619140625, -0.5753173828125, -0.554443359375, -0.5335693359375, -0.5126953125, -0.4918212890625, -0.470947265625, -0.4500732421875, -0.42919921875, -0.4083251953125, -0.387451171875, -0.3665771484375, -0.345703125, -0.3248291015625, -0.303955078125, -0.2830810546875, -0.26220703125, -0.2413330078125, -0.220458984375, -0.1995849609375, -0.1787109375, -0.1578369140625, -0.136962890625, -0.1160888671875, -0.09521484375, -0.0743408203125, -0.053466796875, -0.0325927734375, -0.01171875, 0.0091552734375, 0.030029296875, 0.0509033203125, 0.07177734375, 0.0926513671875, 0.113525390625, 0.1343994140625, 0.1552734375, 0.1761474609375, 0.197021484375, 0.2178955078125, 0.23876953125, 0.2596435546875, 0.280517578125, 0.3013916015625, 0.322265625, 0.3431396484375, 0.364013671875, 0.3848876953125, 0.40576171875, 0.4266357421875, 0.447509765625, 0.4683837890625, 0.4892578125, 0.5101318359375, 0.531005859375, 0.5518798828125, 0.57275390625, 0.5936279296875, 0.614501953125, 0.6353759765625, 0.65625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 0.0, 0.0, 3.0, 4.0, 7.0, 5.0, 8.0, 14.0, 20.0, 27.0, 35.0, 44.0, 59.0, 67.0, 113.0, 116.0, 165.0, 290.0, 410.0, 692.0, 1312.0, 3302.0, 11184.0, 47428.0, 211681.0, 499957.0, 208033.0, 45962.0, 10883.0, 3277.0, 1374.0, 704.0, 409.0, 286.0, 192.0, 133.0, 85.0, 71.0, 53.0, 34.0, 36.0, 25.0, 9.0, 15.0, 9.0, 7.0, 7.0, 4.0, 4.0, 7.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.91796875, -7.68841552734375, -7.4588623046875, -7.22930908203125, -6.999755859375, -6.77020263671875, -6.5406494140625, -6.31109619140625, -6.08154296875, -5.85198974609375, -5.6224365234375, -5.39288330078125, -5.163330078125, -4.93377685546875, -4.7042236328125, -4.47467041015625, -4.2451171875, -4.01556396484375, -3.7860107421875, -3.55645751953125, -3.326904296875, -3.09735107421875, -2.8677978515625, -2.63824462890625, -2.40869140625, -2.17913818359375, -1.9495849609375, -1.72003173828125, -1.490478515625, -1.26092529296875, -1.0313720703125, -0.80181884765625, -0.572265625, -0.34271240234375, -0.1131591796875, 0.11639404296875, 0.345947265625, 0.57550048828125, 0.8050537109375, 1.03460693359375, 1.26416015625, 1.49371337890625, 1.7232666015625, 1.95281982421875, 2.182373046875, 2.41192626953125, 2.6414794921875, 2.87103271484375, 3.1005859375, 3.33013916015625, 3.5596923828125, 3.78924560546875, 4.018798828125, 4.24835205078125, 4.4779052734375, 4.70745849609375, 4.93701171875, 5.16656494140625, 5.3961181640625, 5.62567138671875, 5.855224609375, 6.08477783203125, 6.3143310546875, 6.54388427734375, 6.7734375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 6.0, 4.0, 15.0, 15.0, 10.0, 16.0, 18.0, 17.0, 22.0, 27.0, 32.0, 28.0, 38.0, 24.0, 21.0, 48.0, 34.0, 37.0, 57.0, 33.0, 38.0, 49.0, 31.0, 35.0, 32.0, 30.0, 32.0, 32.0, 35.0, 28.0, 21.0, 23.0, 14.0, 16.0, 15.0, 10.0, 10.0, 12.0, 8.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3671875, -3.261474609375, -3.15576171875, -3.050048828125, -2.9443359375, -2.838623046875, -2.73291015625, -2.627197265625, -2.521484375, -2.415771484375, -2.31005859375, -2.204345703125, -2.0986328125, -1.992919921875, -1.88720703125, -1.781494140625, -1.67578125, -1.570068359375, -1.46435546875, -1.358642578125, -1.2529296875, -1.147216796875, -1.04150390625, -0.935791015625, -0.830078125, -0.724365234375, -0.61865234375, -0.512939453125, -0.4072265625, -0.301513671875, -0.19580078125, -0.090087890625, 0.015625, 0.121337890625, 0.22705078125, 0.332763671875, 0.4384765625, 0.544189453125, 0.64990234375, 0.755615234375, 0.861328125, 0.967041015625, 1.07275390625, 1.178466796875, 1.2841796875, 1.389892578125, 1.49560546875, 1.601318359375, 1.70703125, 1.812744140625, 1.91845703125, 2.024169921875, 2.1298828125, 2.235595703125, 2.34130859375, 2.447021484375, 2.552734375, 2.658447265625, 2.76416015625, 2.869873046875, 2.9755859375, 3.081298828125, 3.18701171875, 3.292724609375, 3.3984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 8.0, 6.0, 6.0, 11.0, 24.0, 34.0, 43.0, 75.0, 114.0, 217.0, 343.0, 684.0, 1418.0, 3207.0, 8920.0, 38089.0, 339529.0, 568204.0, 66759.0, 12880.0, 4200.0, 1829.0, 915.0, 444.0, 257.0, 147.0, 69.0, 36.0, 31.0, 18.0, 9.0, 12.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1796875, -4.99566650390625, -4.8116455078125, -4.62762451171875, -4.443603515625, -4.25958251953125, -4.0755615234375, -3.89154052734375, -3.70751953125, -3.52349853515625, -3.3394775390625, -3.15545654296875, -2.971435546875, -2.78741455078125, -2.6033935546875, -2.41937255859375, -2.2353515625, -2.05133056640625, -1.8673095703125, -1.68328857421875, -1.499267578125, -1.31524658203125, -1.1312255859375, -0.94720458984375, -0.76318359375, -0.57916259765625, -0.3951416015625, -0.21112060546875, -0.027099609375, 0.15692138671875, 0.3409423828125, 0.52496337890625, 0.708984375, 0.89300537109375, 1.0770263671875, 1.26104736328125, 1.445068359375, 1.62908935546875, 1.8131103515625, 1.99713134765625, 2.18115234375, 2.36517333984375, 2.5491943359375, 2.73321533203125, 2.917236328125, 3.10125732421875, 3.2852783203125, 3.46929931640625, 3.6533203125, 3.83734130859375, 4.0213623046875, 4.20538330078125, 4.389404296875, 4.57342529296875, 4.7574462890625, 4.94146728515625, 5.12548828125, 5.30950927734375, 5.4935302734375, 5.67755126953125, 5.861572265625, 6.04559326171875, 6.2296142578125, 6.41363525390625, 6.59765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 11.0, 10.0, 23.0, 44.0, 61.0, 79.0, 150.0, 185.0, 158.0, 95.0, 63.0, 37.0, 29.0, 21.0, 7.0, 10.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009832382202148438, -0.0009556189179420471, -0.0009279996156692505, -0.0009003803133964539, -0.0008727610111236572, -0.0008451417088508606, -0.000817522406578064, -0.0007899031043052673, -0.0007622838020324707, -0.0007346644997596741, -0.0007070451974868774, -0.0006794258952140808, -0.0006518065929412842, -0.0006241872906684875, -0.0005965679883956909, -0.0005689486861228943, -0.0005413293838500977, -0.000513710081577301, -0.0004860907793045044, -0.00045847147703170776, -0.00043085217475891113, -0.0004032328724861145, -0.00037561357021331787, -0.00034799426794052124, -0.0003203749656677246, -0.000292755663394928, -0.00026513636112213135, -0.00023751705884933472, -0.00020989775657653809, -0.00018227845430374146, -0.00015465915203094482, -0.0001270398497581482, -9.942054748535156e-05, -7.180124521255493e-05, -4.41819429397583e-05, -1.656264066696167e-05, 1.1056661605834961e-05, 3.867596387863159e-05, 6.629526615142822e-05, 9.391456842422485e-05, 0.00012153387069702148, 0.00014915317296981812, 0.00017677247524261475, 0.00020439177751541138, 0.000232011079788208, 0.00025963038206100464, 0.00028724968433380127, 0.0003148689866065979, 0.00034248828887939453, 0.00037010759115219116, 0.0003977268934249878, 0.0004253461956977844, 0.00045296549797058105, 0.0004805848002433777, 0.0005082041025161743, 0.000535823404788971, 0.0005634427070617676, 0.0005910620093345642, 0.0006186813116073608, 0.0006463006138801575, 0.0006739199161529541, 0.0007015392184257507, 0.0007291585206985474, 0.000756777822971344, 0.0007843971252441406]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 10.0, 15.0, 12.0, 16.0, 36.0, 70.0, 102.0, 240.0, 688.0, 2873.0, 20824.0, 713154.0, 296685.0, 10997.0, 1928.0, 495.0, 196.0, 81.0, 53.0, 31.0, 18.0, 15.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.796875, -9.4453125, -9.09375, -8.7421875, -8.390625, -8.0390625, -7.6875, -7.3359375, -6.984375, -6.6328125, -6.28125, -5.9296875, -5.578125, -5.2265625, -4.875, -4.5234375, -4.171875, -3.8203125, -3.46875, -3.1171875, -2.765625, -2.4140625, -2.0625, -1.7109375, -1.359375, -1.0078125, -0.65625, -0.3046875, 0.046875, 0.3984375, 0.75, 1.1015625, 1.453125, 1.8046875, 2.15625, 2.5078125, 2.859375, 3.2109375, 3.5625, 3.9140625, 4.265625, 4.6171875, 4.96875, 5.3203125, 5.671875, 6.0234375, 6.375, 6.7265625, 7.078125, 7.4296875, 7.78125, 8.1328125, 8.484375, 8.8359375, 9.1875, 9.5390625, 9.890625, 10.2421875, 10.59375, 10.9453125, 11.296875, 11.6484375, 12.0, 12.3515625, 12.703125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 6.0, 3.0, 6.0, 10.0, 9.0, 19.0, 29.0, 32.0, 48.0, 74.0, 108.0, 116.0, 121.0, 110.0, 76.0, 56.0, 44.0, 27.0, 34.0, 19.0, 11.0, 8.0, 6.0, 9.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5390625, -2.438690185546875, -2.33831787109375, -2.237945556640625, -2.1375732421875, -2.037200927734375, -1.93682861328125, -1.836456298828125, -1.736083984375, -1.635711669921875, -1.53533935546875, -1.434967041015625, -1.3345947265625, -1.234222412109375, -1.13385009765625, -1.033477783203125, -0.93310546875, -0.832733154296875, -0.73236083984375, -0.631988525390625, -0.5316162109375, -0.431243896484375, -0.33087158203125, -0.230499267578125, -0.130126953125, -0.029754638671875, 0.07061767578125, 0.170989990234375, 0.2713623046875, 0.371734619140625, 0.47210693359375, 0.572479248046875, 0.6728515625, 0.773223876953125, 0.87359619140625, 0.973968505859375, 1.0743408203125, 1.174713134765625, 1.27508544921875, 1.375457763671875, 1.475830078125, 1.576202392578125, 1.67657470703125, 1.776947021484375, 1.8773193359375, 1.977691650390625, 2.07806396484375, 2.178436279296875, 2.27880859375, 2.379180908203125, 2.47955322265625, 2.579925537109375, 2.6802978515625, 2.780670166015625, 2.88104248046875, 2.981414794921875, 3.081787109375, 3.182159423828125, 3.28253173828125, 3.382904052734375, 3.4832763671875, 3.583648681640625, 3.68402099609375, 3.784393310546875, 3.884765625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 17.0, 22.0, 31.0, 70.0, 97.0, 123.0, 161.0, 140.0, 125.0, 74.0, 50.0, 21.0, 27.0, 8.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.855499267578125, -31.468908309936523, -30.082319259643555, -28.695728302001953, -27.309139251708984, -25.922548294067383, -24.53595733642578, -23.149368286132812, -21.76277732849121, -20.37618637084961, -18.98959732055664, -17.60300636291504, -16.216415405273438, -14.829826354980469, -13.443235397338867, -12.056645393371582, -10.670055389404297, -9.283465385437012, -7.896874904632568, -6.510284423828125, -5.12369441986084, -3.7371044158935547, -2.350513458251953, -0.963923454284668, 0.4226665496826172, 1.8092567920684814, 3.1958470344543457, 4.582437515258789, 5.969027519226074, 7.355617523193359, 8.742208480834961, 10.128798484802246, 11.515388488769531, 12.901978492736816, 14.288568496704102, 15.675159454345703, 17.061748504638672, 18.448339462280273, 19.834930419921875, 21.221519470214844, 22.608110427856445, 23.994701385498047, 25.381290435791016, 26.767881393432617, 28.15447235107422, 29.541061401367188, 30.92765235900879, 32.31424331665039, 33.70083236694336, 35.08742141723633, 36.47401428222656, 37.86060333251953, 39.2471923828125, 40.63378143310547, 42.0203742980957, 43.40696334838867, 44.793556213378906, 46.180145263671875, 47.56673812866211, 48.95332717895508, 50.33991622924805, 51.72650909423828, 53.11309814453125, 54.49968719482422, 55.88627624511719]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 8.0, 7.0, 11.0, 13.0, 10.0, 11.0, 12.0, 22.0, 20.0, 18.0, 21.0, 28.0, 30.0, 35.0, 47.0, 44.0, 38.0, 49.0, 39.0, 42.0, 32.0, 41.0, 51.0, 35.0, 48.0, 32.0, 29.0, 27.0, 22.0, 31.0, 20.0, 23.0, 19.0, 14.0, 11.0, 13.0, 10.0, 6.0, 6.0, 5.0, 2.0, 11.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0], "bins": [-23.02880096435547, -22.35460662841797, -21.6804141998291, -21.0062198638916, -20.332027435302734, -19.657833099365234, -18.983638763427734, -18.309446334838867, -17.635251998901367, -16.961057662963867, -16.286865234375, -15.6126708984375, -14.938477516174316, -14.264284133911133, -13.59009075164795, -12.915897369384766, -12.241703987121582, -11.567510604858398, -10.893317222595215, -10.219123840332031, -9.544929504394531, -8.870736122131348, -8.196542739868164, -7.522348880767822, -6.848155498504639, -6.173962116241455, -5.499768257141113, -4.82557487487793, -4.151381492614746, -3.4771876335144043, -2.8029942512512207, -2.128800392150879, -1.4546070098876953, -0.7804134488105774, -0.10621988773345947, 0.5679736137390137, 1.2421672344207764, 1.916360855102539, 2.5905542373657227, 3.2647480964660645, 3.938941478729248, 4.613134860992432, 5.287328720092773, 5.961522102355957, 6.635715484619141, 7.309909343719482, 7.984102725982666, 8.658296585083008, 9.332489967346191, 10.006683349609375, 10.680876731872559, 11.355070114135742, 12.029264450073242, 12.703457832336426, 13.37765121459961, 14.05184555053711, 14.726037979125977, 15.40023136138916, 16.074424743652344, 16.748619079589844, 17.42281150817871, 18.09700584411621, 18.771198272705078, 19.445392608642578, 20.119586944580078]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 5.0, 4.0, 6.0, 11.0, 14.0, 33.0, 39.0, 57.0, 78.0, 138.0, 174.0, 287.0, 501.0, 951.0, 1664.0, 3143.0, 6645.0, 15279.0, 41244.0, 153486.0, 3237716.0, 596100.0, 86653.0, 28208.0, 11372.0, 5077.0, 2440.0, 1253.0, 624.0, 403.0, 242.0, 163.0, 87.0, 65.0, 40.0, 27.0, 16.0, 12.0, 8.0, 10.0, 4.0, 0.0, 3.0], "bins": [-8.109375, -7.9154052734375, -7.721435546875, -7.5274658203125, -7.33349609375, -7.1395263671875, -6.945556640625, -6.7515869140625, -6.5576171875, -6.3636474609375, -6.169677734375, -5.9757080078125, -5.78173828125, -5.5877685546875, -5.393798828125, -5.1998291015625, -5.005859375, -4.8118896484375, -4.617919921875, -4.4239501953125, -4.22998046875, -4.0360107421875, -3.842041015625, -3.6480712890625, -3.4541015625, -3.2601318359375, -3.066162109375, -2.8721923828125, -2.67822265625, -2.4842529296875, -2.290283203125, -2.0963134765625, -1.90234375, -1.7083740234375, -1.514404296875, -1.3204345703125, -1.12646484375, -0.9324951171875, -0.738525390625, -0.5445556640625, -0.3505859375, -0.1566162109375, 0.037353515625, 0.2313232421875, 0.42529296875, 0.6192626953125, 0.813232421875, 1.0072021484375, 1.201171875, 1.3951416015625, 1.589111328125, 1.7830810546875, 1.97705078125, 2.1710205078125, 2.364990234375, 2.5589599609375, 2.7529296875, 2.9468994140625, 3.140869140625, 3.3348388671875, 3.52880859375, 3.7227783203125, 3.916748046875, 4.1107177734375, 4.3046875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 9.0, 7.0, 4.0, 18.0, 14.0, 15.0, 29.0, 32.0, 24.0, 34.0, 37.0, 50.0, 62.0, 63.0, 69.0, 61.0, 69.0, 57.0, 60.0, 63.0, 40.0, 38.0, 31.0, 27.0, 20.0, 22.0, 20.0, 8.0, 8.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.01953125, -0.9907302856445312, -0.9619293212890625, -0.9331283569335938, -0.904327392578125, -0.8755264282226562, -0.8467254638671875, -0.8179244995117188, -0.78912353515625, -0.7603225708007812, -0.7315216064453125, -0.7027206420898438, -0.673919677734375, -0.6451187133789062, -0.6163177490234375, -0.5875167846679688, -0.5587158203125, -0.5299148559570312, -0.5011138916015625, -0.47231292724609375, -0.443511962890625, -0.41471099853515625, -0.3859100341796875, -0.35710906982421875, -0.32830810546875, -0.29950714111328125, -0.2707061767578125, -0.24190521240234375, -0.213104248046875, -0.18430328369140625, -0.1555023193359375, -0.12670135498046875, -0.097900390625, -0.06909942626953125, -0.0402984619140625, -0.01149749755859375, 0.017303466796875, 0.04610443115234375, 0.0749053955078125, 0.10370635986328125, 0.13250732421875, 0.16130828857421875, 0.1901092529296875, 0.21891021728515625, 0.247711181640625, 0.27651214599609375, 0.3053131103515625, 0.33411407470703125, 0.3629150390625, 0.39171600341796875, 0.4205169677734375, 0.44931793212890625, 0.478118896484375, 0.5069198608398438, 0.5357208251953125, 0.5645217895507812, 0.59332275390625, 0.6221237182617188, 0.6509246826171875, 0.6797256469726562, 0.708526611328125, 0.7373275756835938, 0.7661285400390625, 0.7949295043945312, 0.82373046875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 5.0, 2.0, 10.0, 17.0, 19.0, 24.0, 22.0, 59.0, 80.0, 185.0, 324.0, 625.0, 1475.0, 3552.0, 8773.0, 25107.0, 83844.0, 431145.0, 3218446.0, 319852.0, 68435.0, 20301.0, 7123.0, 2725.0, 1107.0, 491.0, 250.0, 108.0, 67.0, 38.0, 27.0, 15.0, 14.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.60546875, -6.38836669921875, -6.1712646484375, -5.95416259765625, -5.737060546875, -5.51995849609375, -5.3028564453125, -5.08575439453125, -4.86865234375, -4.65155029296875, -4.4344482421875, -4.21734619140625, -4.000244140625, -3.78314208984375, -3.5660400390625, -3.34893798828125, -3.1318359375, -2.91473388671875, -2.6976318359375, -2.48052978515625, -2.263427734375, -2.04632568359375, -1.8292236328125, -1.61212158203125, -1.39501953125, -1.17791748046875, -0.9608154296875, -0.74371337890625, -0.526611328125, -0.30950927734375, -0.0924072265625, 0.12469482421875, 0.341796875, 0.55889892578125, 0.7760009765625, 0.99310302734375, 1.210205078125, 1.42730712890625, 1.6444091796875, 1.86151123046875, 2.07861328125, 2.29571533203125, 2.5128173828125, 2.72991943359375, 2.947021484375, 3.16412353515625, 3.3812255859375, 3.59832763671875, 3.8154296875, 4.03253173828125, 4.2496337890625, 4.46673583984375, 4.683837890625, 4.90093994140625, 5.1180419921875, 5.33514404296875, 5.55224609375, 5.76934814453125, 5.9864501953125, 6.20355224609375, 6.420654296875, 6.63775634765625, 6.8548583984375, 7.07196044921875, 7.2890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 5.0, 6.0, 8.0, 4.0, 3.0, 6.0, 15.0, 14.0, 23.0, 24.0, 21.0, 43.0, 35.0, 55.0, 52.0, 92.0, 103.0, 174.0, 285.0, 559.0, 1242.0, 439.0, 224.0, 167.0, 105.0, 95.0, 65.0, 55.0, 37.0, 27.0, 15.0, 13.0, 14.0, 12.0, 14.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4091796875, -1.3656158447265625, -1.322052001953125, -1.2784881591796875, -1.23492431640625, -1.1913604736328125, -1.147796630859375, -1.1042327880859375, -1.0606689453125, -1.0171051025390625, -0.973541259765625, -0.9299774169921875, -0.88641357421875, -0.8428497314453125, -0.799285888671875, -0.7557220458984375, -0.712158203125, -0.6685943603515625, -0.625030517578125, -0.5814666748046875, -0.53790283203125, -0.4943389892578125, -0.450775146484375, -0.4072113037109375, -0.3636474609375, -0.3200836181640625, -0.276519775390625, -0.2329559326171875, -0.18939208984375, -0.1458282470703125, -0.102264404296875, -0.0587005615234375, -0.01513671875, 0.0284271240234375, 0.071990966796875, 0.1155548095703125, 0.15911865234375, 0.2026824951171875, 0.246246337890625, 0.2898101806640625, 0.3333740234375, 0.3769378662109375, 0.420501708984375, 0.4640655517578125, 0.50762939453125, 0.5511932373046875, 0.594757080078125, 0.6383209228515625, 0.681884765625, 0.7254486083984375, 0.769012451171875, 0.8125762939453125, 0.85614013671875, 0.8997039794921875, 0.943267822265625, 0.9868316650390625, 1.0303955078125, 1.0739593505859375, 1.117523193359375, 1.1610870361328125, 1.20465087890625, 1.2482147216796875, 1.291778564453125, 1.3353424072265625, 1.37890625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 7.0, 15.0, 69.0, 215.0, 363.0, 239.0, 71.0, 17.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.0728759765625, -61.87200164794922, -60.67112731933594, -59.47025680541992, -58.26938247680664, -57.06850814819336, -55.86763381958008, -54.6667594909668, -53.46588897705078, -52.2650146484375, -51.06414031982422, -49.8632698059082, -48.66239547729492, -47.46152114868164, -46.26064682006836, -45.05977249145508, -43.8588981628418, -42.658023834228516, -41.457149505615234, -40.25627899169922, -39.05540466308594, -37.854530334472656, -36.653656005859375, -35.452781677246094, -34.25190734863281, -33.05103302001953, -31.850160598754883, -30.6492862701416, -29.448413848876953, -28.247539520263672, -27.04666519165039, -25.84579086303711, -24.644916534423828, -23.444042205810547, -22.2431697845459, -21.042295455932617, -19.84142303466797, -18.640548706054688, -17.439674377441406, -16.238800048828125, -15.037927627563477, -13.837054252624512, -12.636180877685547, -11.435306549072266, -10.2344331741333, -9.033559799194336, -7.832685947418213, -6.63181209564209, -5.430938720703125, -4.23006534576416, -3.029191493988037, -1.8283178806304932, -0.6274442672729492, 0.5734291076660156, 1.7743029594421387, 2.9751768112182617, 4.176050186157227, 5.376923561096191, 6.5777974128723145, 7.7786712646484375, 8.979544639587402, 10.180418014526367, 11.381292343139648, 12.582165718078613, 13.783039093017578]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 10.0, 18.0, 17.0, 18.0, 17.0, 20.0, 28.0, 35.0, 42.0, 37.0, 48.0, 48.0, 45.0, 54.0, 46.0, 57.0, 47.0, 56.0, 60.0, 39.0, 39.0, 28.0, 28.0, 24.0, 15.0, 18.0, 22.0, 13.0, 13.0, 9.0, 9.0, 9.0, 6.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.536355972290039, -5.313342094421387, -5.090328693389893, -4.86731481552124, -4.644301414489746, -4.421287536621094, -4.1982741355896, -3.9752602577209473, -3.752246856689453, -3.52923321723938, -3.3062195777893066, -3.0832059383392334, -2.86019229888916, -2.637178421020508, -2.4141650199890137, -2.1911511421203613, -1.968137502670288, -1.7451238632202148, -1.5221102237701416, -1.2990965843200684, -1.0760829448699951, -0.8530691862106323, -0.6300555467605591, -0.40704190731048584, -0.1840282678604126, 0.03898538649082184, 0.2619990408420563, 0.4850127100944519, 0.7080263495445251, 0.9310400485992432, 1.1540536880493164, 1.3770673274993896, 1.600080966949463, 1.8230946063995361, 2.0461082458496094, 2.2691218852996826, 2.492135524749756, 2.715149402618408, 2.9381628036499023, 3.1611766815185547, 3.384190082550049, 3.607203722000122, 3.8302173614501953, 4.053231239318848, 4.276244640350342, 4.499258518218994, 4.722271919250488, 4.945285797119141, 5.168299674987793, 5.391313552856445, 5.6143269538879395, 5.837340831756592, 6.060354232788086, 6.283368110656738, 6.506381511688232, 6.729395389556885, 6.952408790588379, 7.175422668457031, 7.398436069488525, 7.621449947357178, 7.844463348388672, 8.067477226257324, 8.290491104125977, 8.513504028320312, 8.736517906188965]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 8.0, 1.0, 8.0, 6.0, 11.0, 15.0, 10.0, 19.0, 19.0, 37.0, 42.0, 57.0, 81.0, 137.0, 171.0, 259.0, 356.0, 510.0, 783.0, 1186.0, 1915.0, 3201.0, 5588.0, 11076.0, 22741.0, 49097.0, 106615.0, 212611.0, 277742.0, 183645.0, 88725.0, 40343.0, 19248.0, 9479.0, 5011.0, 2780.0, 1705.0, 1006.0, 695.0, 499.0, 287.0, 255.0, 176.0, 104.0, 79.0, 65.0, 52.0, 22.0, 27.0, 13.0, 14.0, 10.0, 8.0, 4.0, 3.0, 4.0, 2.0, 5.0, 2.0], "bins": [-3.875, -3.7589111328125, -3.642822265625, -3.5267333984375, -3.41064453125, -3.2945556640625, -3.178466796875, -3.0623779296875, -2.9462890625, -2.8302001953125, -2.714111328125, -2.5980224609375, -2.48193359375, -2.3658447265625, -2.249755859375, -2.1336669921875, -2.017578125, -1.9014892578125, -1.785400390625, -1.6693115234375, -1.55322265625, -1.4371337890625, -1.321044921875, -1.2049560546875, -1.0888671875, -0.9727783203125, -0.856689453125, -0.7406005859375, -0.62451171875, -0.5084228515625, -0.392333984375, -0.2762451171875, -0.16015625, -0.0440673828125, 0.072021484375, 0.1881103515625, 0.30419921875, 0.4202880859375, 0.536376953125, 0.6524658203125, 0.7685546875, 0.8846435546875, 1.000732421875, 1.1168212890625, 1.23291015625, 1.3489990234375, 1.465087890625, 1.5811767578125, 1.697265625, 1.8133544921875, 1.929443359375, 2.0455322265625, 2.16162109375, 2.2777099609375, 2.393798828125, 2.5098876953125, 2.6259765625, 2.7420654296875, 2.858154296875, 2.9742431640625, 3.09033203125, 3.2064208984375, 3.322509765625, 3.4385986328125, 3.5546875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 3.0, 12.0, 8.0, 10.0, 19.0, 9.0, 14.0, 17.0, 25.0, 26.0, 26.0, 34.0, 36.0, 33.0, 42.0, 48.0, 45.0, 55.0, 76.0, 60.0, 51.0, 40.0, 34.0, 42.0, 31.0, 27.0, 40.0, 30.0, 22.0, 20.0, 20.0, 19.0, 6.0, 8.0, 3.0, 1.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.685546875, -0.661224365234375, -0.63690185546875, -0.612579345703125, -0.5882568359375, -0.563934326171875, -0.53961181640625, -0.515289306640625, -0.490966796875, -0.466644287109375, -0.44232177734375, -0.417999267578125, -0.3936767578125, -0.369354248046875, -0.34503173828125, -0.320709228515625, -0.29638671875, -0.272064208984375, -0.24774169921875, -0.223419189453125, -0.1990966796875, -0.174774169921875, -0.15045166015625, -0.126129150390625, -0.101806640625, -0.077484130859375, -0.05316162109375, -0.028839111328125, -0.0045166015625, 0.019805908203125, 0.04412841796875, 0.068450927734375, 0.0927734375, 0.117095947265625, 0.14141845703125, 0.165740966796875, 0.1900634765625, 0.214385986328125, 0.23870849609375, 0.263031005859375, 0.287353515625, 0.311676025390625, 0.33599853515625, 0.360321044921875, 0.3846435546875, 0.408966064453125, 0.43328857421875, 0.457611083984375, 0.48193359375, 0.506256103515625, 0.53057861328125, 0.554901123046875, 0.5792236328125, 0.603546142578125, 0.62786865234375, 0.652191162109375, 0.676513671875, 0.700836181640625, 0.72515869140625, 0.749481201171875, 0.7738037109375, 0.798126220703125, 0.82244873046875, 0.846771240234375, 0.87109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 9.0, 17.0, 10.0, 21.0, 16.0, 27.0, 44.0, 50.0, 58.0, 93.0, 147.0, 196.0, 245.0, 349.0, 483.0, 754.0, 1419.0, 3173.0, 8422.0, 27874.0, 102809.0, 327727.0, 382724.0, 136441.0, 36481.0, 10717.0, 3778.0, 1639.0, 940.0, 514.0, 365.0, 240.0, 204.0, 151.0, 109.0, 73.0, 61.0, 47.0, 32.0, 27.0, 24.0, 16.0, 9.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.24609375, -5.08270263671875, -4.9193115234375, -4.75592041015625, -4.592529296875, -4.42913818359375, -4.2657470703125, -4.10235595703125, -3.93896484375, -3.77557373046875, -3.6121826171875, -3.44879150390625, -3.285400390625, -3.12200927734375, -2.9586181640625, -2.79522705078125, -2.6318359375, -2.46844482421875, -2.3050537109375, -2.14166259765625, -1.978271484375, -1.81488037109375, -1.6514892578125, -1.48809814453125, -1.32470703125, -1.16131591796875, -0.9979248046875, -0.83453369140625, -0.671142578125, -0.50775146484375, -0.3443603515625, -0.18096923828125, -0.017578125, 0.14581298828125, 0.3092041015625, 0.47259521484375, 0.635986328125, 0.79937744140625, 0.9627685546875, 1.12615966796875, 1.28955078125, 1.45294189453125, 1.6163330078125, 1.77972412109375, 1.943115234375, 2.10650634765625, 2.2698974609375, 2.43328857421875, 2.5966796875, 2.76007080078125, 2.9234619140625, 3.08685302734375, 3.250244140625, 3.41363525390625, 3.5770263671875, 3.74041748046875, 3.90380859375, 4.06719970703125, 4.2305908203125, 4.39398193359375, 4.557373046875, 4.72076416015625, 4.8841552734375, 5.04754638671875, 5.2109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 0.0, 2.0, 5.0, 12.0, 7.0, 12.0, 14.0, 13.0, 13.0, 19.0, 19.0, 35.0, 26.0, 27.0, 35.0, 25.0, 38.0, 44.0, 57.0, 38.0, 41.0, 51.0, 31.0, 38.0, 46.0, 38.0, 38.0, 39.0, 34.0, 35.0, 30.0, 21.0, 36.0, 15.0, 12.0, 19.0, 6.0, 7.0, 4.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.498046875, -3.394775390625, -3.29150390625, -3.188232421875, -3.0849609375, -2.981689453125, -2.87841796875, -2.775146484375, -2.671875, -2.568603515625, -2.46533203125, -2.362060546875, -2.2587890625, -2.155517578125, -2.05224609375, -1.948974609375, -1.845703125, -1.742431640625, -1.63916015625, -1.535888671875, -1.4326171875, -1.329345703125, -1.22607421875, -1.122802734375, -1.01953125, -0.916259765625, -0.81298828125, -0.709716796875, -0.6064453125, -0.503173828125, -0.39990234375, -0.296630859375, -0.193359375, -0.090087890625, 0.01318359375, 0.116455078125, 0.2197265625, 0.322998046875, 0.42626953125, 0.529541015625, 0.6328125, 0.736083984375, 0.83935546875, 0.942626953125, 1.0458984375, 1.149169921875, 1.25244140625, 1.355712890625, 1.458984375, 1.562255859375, 1.66552734375, 1.768798828125, 1.8720703125, 1.975341796875, 2.07861328125, 2.181884765625, 2.28515625, 2.388427734375, 2.49169921875, 2.594970703125, 2.6982421875, 2.801513671875, 2.90478515625, 3.008056640625, 3.111328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 9.0, 9.0, 14.0, 24.0, 44.0, 57.0, 119.0, 188.0, 358.0, 782.0, 1981.0, 5878.0, 24234.0, 145849.0, 587807.0, 231853.0, 36666.0, 8161.0, 2513.0, 1024.0, 436.0, 232.0, 118.0, 65.0, 46.0, 15.0, 22.0, 8.0, 14.0, 6.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.759765625, -3.640869140625, -3.52197265625, -3.403076171875, -3.2841796875, -3.165283203125, -3.04638671875, -2.927490234375, -2.80859375, -2.689697265625, -2.57080078125, -2.451904296875, -2.3330078125, -2.214111328125, -2.09521484375, -1.976318359375, -1.857421875, -1.738525390625, -1.61962890625, -1.500732421875, -1.3818359375, -1.262939453125, -1.14404296875, -1.025146484375, -0.90625, -0.787353515625, -0.66845703125, -0.549560546875, -0.4306640625, -0.311767578125, -0.19287109375, -0.073974609375, 0.044921875, 0.163818359375, 0.28271484375, 0.401611328125, 0.5205078125, 0.639404296875, 0.75830078125, 0.877197265625, 0.99609375, 1.114990234375, 1.23388671875, 1.352783203125, 1.4716796875, 1.590576171875, 1.70947265625, 1.828369140625, 1.947265625, 2.066162109375, 2.18505859375, 2.303955078125, 2.4228515625, 2.541748046875, 2.66064453125, 2.779541015625, 2.8984375, 3.017333984375, 3.13623046875, 3.255126953125, 3.3740234375, 3.492919921875, 3.61181640625, 3.730712890625, 3.849609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 3.0, 10.0, 3.0, 6.0, 7.0, 13.0, 11.0, 20.0, 22.0, 34.0, 26.0, 39.0, 42.0, 58.0, 85.0, 80.0, 87.0, 89.0, 70.0, 62.0, 39.0, 36.0, 26.0, 22.0, 18.0, 10.0, 9.0, 9.0, 12.0, 7.0, 7.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003113746643066406, -0.00030067190527915955, -0.00028996914625167847, -0.0002792663872241974, -0.0002685636281967163, -0.00025786086916923523, -0.00024715811014175415, -0.00023645535111427307, -0.000225752592086792, -0.0002150498330593109, -0.00020434707403182983, -0.00019364431500434875, -0.00018294155597686768, -0.0001722387969493866, -0.00016153603792190552, -0.00015083327889442444, -0.00014013051986694336, -0.00012942776083946228, -0.0001187250018119812, -0.00010802224278450012, -9.731948375701904e-05, -8.661672472953796e-05, -7.591396570205688e-05, -6.52112066745758e-05, -5.4508447647094727e-05, -4.380568861961365e-05, -3.310292959213257e-05, -2.240017056465149e-05, -1.169741153717041e-05, -9.94652509689331e-07, 9.708106517791748e-06, 2.0410865545272827e-05, 3.1113624572753906e-05, 4.1816383600234985e-05, 5.2519142627716064e-05, 6.322190165519714e-05, 7.392466068267822e-05, 8.46274197101593e-05, 9.533017873764038e-05, 0.00010603293776512146, 0.00011673569679260254, 0.00012743845582008362, 0.0001381412148475647, 0.00014884397387504578, 0.00015954673290252686, 0.00017024949193000793, 0.00018095225095748901, 0.0001916550099849701, 0.00020235776901245117, 0.00021306052803993225, 0.00022376328706741333, 0.0002344660460948944, 0.0002451688051223755, 0.00025587156414985657, 0.00026657432317733765, 0.0002772770822048187, 0.0002879798412322998, 0.0002986826002597809, 0.00030938535928726196, 0.00032008811831474304, 0.0003307908773422241, 0.0003414936363697052, 0.0003521963953971863, 0.00036289915442466736, 0.00037360191345214844]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 5.0, 6.0, 12.0, 10.0, 22.0, 36.0, 42.0, 66.0, 120.0, 205.0, 388.0, 605.0, 1296.0, 3058.0, 9377.0, 42068.0, 273489.0, 571352.0, 116205.0, 20554.0, 5396.0, 2045.0, 960.0, 485.0, 290.0, 182.0, 85.0, 69.0, 29.0, 22.0, 22.0, 15.0, 12.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.59375, -3.47100830078125, -3.3482666015625, -3.22552490234375, -3.102783203125, -2.98004150390625, -2.8572998046875, -2.73455810546875, -2.61181640625, -2.48907470703125, -2.3663330078125, -2.24359130859375, -2.120849609375, -1.99810791015625, -1.8753662109375, -1.75262451171875, -1.6298828125, -1.50714111328125, -1.3843994140625, -1.26165771484375, -1.138916015625, -1.01617431640625, -0.8934326171875, -0.77069091796875, -0.64794921875, -0.52520751953125, -0.4024658203125, -0.27972412109375, -0.156982421875, -0.03424072265625, 0.0885009765625, 0.21124267578125, 0.333984375, 0.45672607421875, 0.5794677734375, 0.70220947265625, 0.824951171875, 0.94769287109375, 1.0704345703125, 1.19317626953125, 1.31591796875, 1.43865966796875, 1.5614013671875, 1.68414306640625, 1.806884765625, 1.92962646484375, 2.0523681640625, 2.17510986328125, 2.2978515625, 2.42059326171875, 2.5433349609375, 2.66607666015625, 2.788818359375, 2.91156005859375, 3.0343017578125, 3.15704345703125, 3.27978515625, 3.40252685546875, 3.5252685546875, 3.64801025390625, 3.770751953125, 3.89349365234375, 4.0162353515625, 4.13897705078125, 4.26171875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 14.0, 5.0, 18.0, 18.0, 26.0, 30.0, 27.0, 30.0, 70.0, 69.0, 79.0, 70.0, 95.0, 95.0, 81.0, 69.0, 58.0, 40.0, 30.0, 19.0, 18.0, 8.0, 8.0, 5.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.681640625, -1.608673095703125, -1.53570556640625, -1.462738037109375, -1.3897705078125, -1.316802978515625, -1.24383544921875, -1.170867919921875, -1.097900390625, -1.024932861328125, -0.95196533203125, -0.878997802734375, -0.8060302734375, -0.733062744140625, -0.66009521484375, -0.587127685546875, -0.51416015625, -0.441192626953125, -0.36822509765625, -0.295257568359375, -0.2222900390625, -0.149322509765625, -0.07635498046875, -0.003387451171875, 0.069580078125, 0.142547607421875, 0.21551513671875, 0.288482666015625, 0.3614501953125, 0.434417724609375, 0.50738525390625, 0.580352783203125, 0.6533203125, 0.726287841796875, 0.79925537109375, 0.872222900390625, 0.9451904296875, 1.018157958984375, 1.09112548828125, 1.164093017578125, 1.237060546875, 1.310028076171875, 1.38299560546875, 1.455963134765625, 1.5289306640625, 1.601898193359375, 1.67486572265625, 1.747833251953125, 1.82080078125, 1.893768310546875, 1.96673583984375, 2.039703369140625, 2.1126708984375, 2.185638427734375, 2.25860595703125, 2.331573486328125, 2.404541015625, 2.477508544921875, 2.55047607421875, 2.623443603515625, 2.6964111328125, 2.769378662109375, 2.84234619140625, 2.915313720703125, 2.98828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 10.0, 24.0, 48.0, 89.0, 161.0, 203.0, 210.0, 126.0, 59.0, 36.0, 16.0, 9.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.85749816894531, -59.107975006103516, -57.35844802856445, -55.608924865722656, -53.859397888183594, -52.1098747253418, -50.3603515625, -48.61082458496094, -46.86130142211914, -45.111778259277344, -43.36225128173828, -41.612728118896484, -39.86320114135742, -38.113677978515625, -36.36415100097656, -34.614627838134766, -32.86510467529297, -31.11557960510254, -29.36605453491211, -27.616531372070312, -25.867006301879883, -24.117481231689453, -22.367956161499023, -20.618431091308594, -18.86890411376953, -17.1193790435791, -15.369854927062988, -13.620329856872559, -11.870805740356445, -10.121280670166016, -8.371755599975586, -6.622231483459473, -4.872707366943359, -3.123182773590088, -1.3736579418182373, 0.3758668899536133, 2.1253914833068848, 3.8749160766601562, 5.624441146850586, 7.373965263366699, 9.123490333557129, 10.873015403747559, 12.622539520263672, 14.372064590454102, 16.12158966064453, 17.871112823486328, 19.62063980102539, 21.370162963867188, 23.119688034057617, 24.869213104248047, 26.618738174438477, 28.368263244628906, 30.117786407470703, 31.867311477661133, 33.61683654785156, 35.36635971069336, 37.11588668823242, 38.86540985107422, 40.61493682861328, 42.36445999145508, 44.11398696899414, 45.86351013183594, 47.613037109375, 49.3625602722168, 51.112083435058594]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 7.0, 11.0, 16.0, 16.0, 18.0, 27.0, 22.0, 30.0, 23.0, 42.0, 56.0, 55.0, 57.0, 49.0, 66.0, 60.0, 64.0, 53.0, 41.0, 34.0, 48.0, 25.0, 40.0, 25.0, 22.0, 12.0, 16.0, 13.0, 11.0, 9.0, 6.0, 5.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-25.422504425048828, -24.69485855102539, -23.967212677001953, -23.239564895629883, -22.511919021606445, -21.784273147583008, -21.05662727355957, -20.3289794921875, -19.601333618164062, -18.873687744140625, -18.146041870117188, -17.418394088745117, -16.69074821472168, -15.963102340698242, -15.235456466674805, -14.50780963897705, -13.780163764953613, -13.052517890930176, -12.324871063232422, -11.597225189208984, -10.86957836151123, -10.141932487487793, -9.414285659790039, -8.686639785766602, -7.958993434906006, -7.23134708404541, -6.5037007331848145, -5.776054382324219, -5.048408508300781, -4.320761680603027, -3.59311580657959, -2.865469455718994, -2.1378231048583984, -1.4101767539978027, -0.6825305223464966, 0.04511570930480957, 0.7727620601654053, 1.500408411026001, 2.2280545234680176, 2.9557008743286133, 3.683347225189209, 4.410993576049805, 5.1386399269104, 5.866286277770996, 6.593932151794434, 7.3215789794921875, 8.049224853515625, 8.776870727539062, 9.504517555236816, 10.232163429260254, 10.959810256958008, 11.687456130981445, 12.4151029586792, 13.142748832702637, 13.87039566040039, 14.598041534423828, 15.325687408447266, 16.053333282470703, 16.78097915649414, 17.50862693786621, 18.23627281188965, 18.963918685913086, 19.691564559936523, 20.419212341308594, 21.14685821533203]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 6.0, 10.0, 14.0, 27.0, 35.0, 34.0, 64.0, 87.0, 121.0, 204.0, 288.0, 412.0, 637.0, 1063.0, 1704.0, 2785.0, 4774.0, 8729.0, 16250.0, 33438.0, 75294.0, 209098.0, 1350362.0, 2105453.0, 226856.0, 81283.0, 35584.0, 17593.0, 9263.0, 5105.0, 3067.0, 1708.0, 1049.0, 665.0, 417.0, 274.0, 174.0, 106.0, 92.0, 42.0, 32.0, 16.0, 17.0, 18.0, 10.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4375, -3.32305908203125, -3.2086181640625, -3.09417724609375, -2.979736328125, -2.86529541015625, -2.7508544921875, -2.63641357421875, -2.52197265625, -2.40753173828125, -2.2930908203125, -2.17864990234375, -2.064208984375, -1.94976806640625, -1.8353271484375, -1.72088623046875, -1.6064453125, -1.49200439453125, -1.3775634765625, -1.26312255859375, -1.148681640625, -1.03424072265625, -0.9197998046875, -0.80535888671875, -0.69091796875, -0.57647705078125, -0.4620361328125, -0.34759521484375, -0.233154296875, -0.11871337890625, -0.0042724609375, 0.11016845703125, 0.224609375, 0.33905029296875, 0.4534912109375, 0.56793212890625, 0.682373046875, 0.79681396484375, 0.9112548828125, 1.02569580078125, 1.14013671875, 1.25457763671875, 1.3690185546875, 1.48345947265625, 1.597900390625, 1.71234130859375, 1.8267822265625, 1.94122314453125, 2.0556640625, 2.17010498046875, 2.2845458984375, 2.39898681640625, 2.513427734375, 2.62786865234375, 2.7423095703125, 2.85675048828125, 2.97119140625, 3.08563232421875, 3.2000732421875, 3.31451416015625, 3.428955078125, 3.54339599609375, 3.6578369140625, 3.77227783203125, 3.88671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 9.0, 6.0, 8.0, 12.0, 10.0, 18.0, 12.0, 19.0, 17.0, 31.0, 19.0, 27.0, 31.0, 34.0, 43.0, 43.0, 47.0, 43.0, 47.0, 44.0, 57.0, 36.0, 54.0, 46.0, 31.0, 25.0, 32.0, 39.0, 32.0, 26.0, 19.0, 11.0, 16.0, 11.0, 10.0, 7.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.705078125, -0.6837310791015625, -0.662384033203125, -0.6410369873046875, -0.61968994140625, -0.5983428955078125, -0.576995849609375, -0.5556488037109375, -0.5343017578125, -0.5129547119140625, -0.491607666015625, -0.4702606201171875, -0.44891357421875, -0.4275665283203125, -0.406219482421875, -0.3848724365234375, -0.363525390625, -0.3421783447265625, -0.320831298828125, -0.2994842529296875, -0.27813720703125, -0.2567901611328125, -0.235443115234375, -0.2140960693359375, -0.1927490234375, -0.1714019775390625, -0.150054931640625, -0.1287078857421875, -0.10736083984375, -0.0860137939453125, -0.064666748046875, -0.0433197021484375, -0.02197265625, -0.0006256103515625, 0.020721435546875, 0.0420684814453125, 0.06341552734375, 0.0847625732421875, 0.106109619140625, 0.1274566650390625, 0.1488037109375, 0.1701507568359375, 0.191497802734375, 0.2128448486328125, 0.23419189453125, 0.2555389404296875, 0.276885986328125, 0.2982330322265625, 0.319580078125, 0.3409271240234375, 0.362274169921875, 0.3836212158203125, 0.40496826171875, 0.4263153076171875, 0.447662353515625, 0.4690093994140625, 0.4903564453125, 0.5117034912109375, 0.533050537109375, 0.5543975830078125, 0.57574462890625, 0.5970916748046875, 0.618438720703125, 0.6397857666015625, 0.6611328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 4.0, 5.0, 8.0, 12.0, 17.0, 24.0, 26.0, 50.0, 73.0, 101.0, 182.0, 284.0, 563.0, 1133.0, 2827.0, 7949.0, 27065.0, 118538.0, 949563.0, 2811153.0, 212407.0, 43364.0, 11885.0, 3983.0, 1527.0, 704.0, 309.0, 189.0, 107.0, 83.0, 34.0, 30.0, 27.0, 7.0, 15.0, 7.0, 9.0, 3.0, 4.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.4609375, -7.254638671875, -7.04833984375, -6.842041015625, -6.6357421875, -6.429443359375, -6.22314453125, -6.016845703125, -5.810546875, -5.604248046875, -5.39794921875, -5.191650390625, -4.9853515625, -4.779052734375, -4.57275390625, -4.366455078125, -4.16015625, -3.953857421875, -3.74755859375, -3.541259765625, -3.3349609375, -3.128662109375, -2.92236328125, -2.716064453125, -2.509765625, -2.303466796875, -2.09716796875, -1.890869140625, -1.6845703125, -1.478271484375, -1.27197265625, -1.065673828125, -0.859375, -0.653076171875, -0.44677734375, -0.240478515625, -0.0341796875, 0.172119140625, 0.37841796875, 0.584716796875, 0.791015625, 0.997314453125, 1.20361328125, 1.409912109375, 1.6162109375, 1.822509765625, 2.02880859375, 2.235107421875, 2.44140625, 2.647705078125, 2.85400390625, 3.060302734375, 3.2666015625, 3.472900390625, 3.67919921875, 3.885498046875, 4.091796875, 4.298095703125, 4.50439453125, 4.710693359375, 4.9169921875, 5.123291015625, 5.32958984375, 5.535888671875, 5.7421875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 7.0, 15.0, 12.0, 17.0, 21.0, 28.0, 48.0, 61.0, 94.0, 128.0, 204.0, 267.0, 616.0, 1210.0, 465.0, 283.0, 168.0, 123.0, 74.0, 65.0, 50.0, 28.0, 21.0, 18.0, 14.0, 9.0, 7.0, 7.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.4273681640625, -2.356689453125, -2.2860107421875, -2.21533203125, -2.1446533203125, -2.073974609375, -2.0032958984375, -1.9326171875, -1.8619384765625, -1.791259765625, -1.7205810546875, -1.64990234375, -1.5792236328125, -1.508544921875, -1.4378662109375, -1.3671875, -1.2965087890625, -1.225830078125, -1.1551513671875, -1.08447265625, -1.0137939453125, -0.943115234375, -0.8724365234375, -0.8017578125, -0.7310791015625, -0.660400390625, -0.5897216796875, -0.51904296875, -0.4483642578125, -0.377685546875, -0.3070068359375, -0.236328125, -0.1656494140625, -0.094970703125, -0.0242919921875, 0.04638671875, 0.1170654296875, 0.187744140625, 0.2584228515625, 0.3291015625, 0.3997802734375, 0.470458984375, 0.5411376953125, 0.61181640625, 0.6824951171875, 0.753173828125, 0.8238525390625, 0.89453125, 0.9652099609375, 1.035888671875, 1.1065673828125, 1.17724609375, 1.2479248046875, 1.318603515625, 1.3892822265625, 1.4599609375, 1.5306396484375, 1.601318359375, 1.6719970703125, 1.74267578125, 1.8133544921875, 1.884033203125, 1.9547119140625, 2.025390625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 9.0, 20.0, 26.0, 71.0, 139.0, 178.0, 193.0, 157.0, 105.0, 51.0, 26.0, 18.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.428184509277344, -19.50799560546875, -18.587806701660156, -17.667617797851562, -16.747426986694336, -15.827238082885742, -14.907049179077148, -13.986860275268555, -13.066671371459961, -12.146482467651367, -11.226292610168457, -10.306103706359863, -9.38591480255127, -8.46572494506836, -7.545536041259766, -6.625347137451172, -5.705157279968262, -4.78496789932251, -3.864778995513916, -2.944589614868164, -2.024400472640991, -1.1042113304138184, -0.1840219497680664, 0.7361669540405273, 1.6563563346862793, 2.576545476913452, 3.496734619140625, 4.416923999786377, 5.337113380432129, 6.257302284240723, 7.177491664886475, 8.097681045532227, 9.01786994934082, 9.938058853149414, 10.858248710632324, 11.778437614440918, 12.698626518249512, 13.618816375732422, 14.539005279541016, 15.45919418334961, 16.379383087158203, 17.299571990966797, 18.21976089477539, 19.139949798583984, 20.06014060974121, 20.980329513549805, 21.9005184173584, 22.820707321166992, 23.74089813232422, 24.661087036132812, 25.581275939941406, 26.50146484375, 27.421655654907227, 28.34184455871582, 29.262033462524414, 30.182222366333008, 31.1024112701416, 32.02260208129883, 32.94279098510742, 33.862979888916016, 34.78316879272461, 35.7033576965332, 36.6235466003418, 37.54373550415039, 38.463924407958984]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 12.0, 7.0, 4.0, 12.0, 9.0, 16.0, 16.0, 19.0, 20.0, 26.0, 30.0, 31.0, 45.0, 29.0, 40.0, 36.0, 39.0, 35.0, 35.0, 39.0, 50.0, 38.0, 46.0, 36.0, 44.0, 37.0, 35.0, 29.0, 22.0, 24.0, 19.0, 22.0, 15.0, 13.0, 14.0, 11.0, 9.0, 9.0, 6.0, 1.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-7.7333598136901855, -7.492978096008301, -7.252595901489258, -7.012214183807373, -6.771832466125488, -6.531450271606445, -6.2910685539245605, -6.050686836242676, -5.810304641723633, -5.569922924041748, -5.329540729522705, -5.08915901184082, -4.848776817321777, -4.608395099639893, -4.368013381958008, -4.127631187438965, -3.88724946975708, -3.646867513656616, -3.4064855575561523, -3.1661038398742676, -2.9257218837738037, -2.68533992767334, -2.444958209991455, -2.204576253890991, -1.9641942977905273, -1.7238123416900635, -1.4834305047988892, -1.2430486679077148, -1.002666711807251, -0.7622847557067871, -0.5219029188156128, -0.2815210819244385, -0.041138648986816406, 0.19924324750900269, 0.4396251440048218, 0.6800070405006409, 0.92038893699646, 1.1607708930969238, 1.4011527299880981, 1.6415345668792725, 1.8819165229797363, 2.1222984790802, 2.362680435180664, 2.603062152862549, 2.8434441089630127, 3.0838260650634766, 3.3242077827453613, 3.564589738845825, 3.804971694946289, 4.045353412628174, 4.285735607147217, 4.526117324829102, 4.7664995193481445, 5.006881237030029, 5.247262954711914, 5.487645149230957, 5.728026866912842, 5.968408584594727, 6.2087907791137695, 6.449172496795654, 6.689554214477539, 6.929936408996582, 7.170318126678467, 7.410699844360352, 7.6510820388793945]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 2.0, 5.0, 2.0, 8.0, 11.0, 14.0, 22.0, 34.0, 54.0, 78.0, 98.0, 165.0, 280.0, 456.0, 724.0, 1348.0, 2500.0, 4895.0, 10118.0, 22152.0, 49362.0, 110492.0, 242045.0, 312929.0, 158749.0, 71635.0, 31879.0, 14215.0, 6704.0, 3324.0, 1692.0, 999.0, 603.0, 341.0, 226.0, 147.0, 95.0, 53.0, 24.0, 20.0, 16.0, 14.0, 8.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.89080810546875, -3.7620849609375, -3.63336181640625, -3.504638671875, -3.37591552734375, -3.2471923828125, -3.11846923828125, -2.98974609375, -2.86102294921875, -2.7322998046875, -2.60357666015625, -2.474853515625, -2.34613037109375, -2.2174072265625, -2.08868408203125, -1.9599609375, -1.83123779296875, -1.7025146484375, -1.57379150390625, -1.445068359375, -1.31634521484375, -1.1876220703125, -1.05889892578125, -0.93017578125, -0.80145263671875, -0.6727294921875, -0.54400634765625, -0.415283203125, -0.28656005859375, -0.1578369140625, -0.02911376953125, 0.099609375, 0.22833251953125, 0.3570556640625, 0.48577880859375, 0.614501953125, 0.74322509765625, 0.8719482421875, 1.00067138671875, 1.12939453125, 1.25811767578125, 1.3868408203125, 1.51556396484375, 1.644287109375, 1.77301025390625, 1.9017333984375, 2.03045654296875, 2.1591796875, 2.28790283203125, 2.4166259765625, 2.54534912109375, 2.674072265625, 2.80279541015625, 2.9315185546875, 3.06024169921875, 3.18896484375, 3.31768798828125, 3.4464111328125, 3.57513427734375, 3.703857421875, 3.83258056640625, 3.9613037109375, 4.09002685546875, 4.21875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 9.0, 8.0, 11.0, 9.0, 13.0, 14.0, 17.0, 20.0, 22.0, 25.0, 21.0, 40.0, 40.0, 33.0, 51.0, 38.0, 52.0, 53.0, 52.0, 48.0, 51.0, 47.0, 47.0, 32.0, 32.0, 24.0, 35.0, 26.0, 23.0, 27.0, 20.0, 15.0, 5.0, 8.0, 5.0, 4.0, 1.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7138671875, -0.6916122436523438, -0.6693572998046875, -0.6471023559570312, -0.624847412109375, -0.6025924682617188, -0.5803375244140625, -0.5580825805664062, -0.53582763671875, -0.5135726928710938, -0.4913177490234375, -0.46906280517578125, -0.446807861328125, -0.42455291748046875, -0.4022979736328125, -0.38004302978515625, -0.3577880859375, -0.33553314208984375, -0.3132781982421875, -0.29102325439453125, -0.268768310546875, -0.24651336669921875, -0.2242584228515625, -0.20200347900390625, -0.17974853515625, -0.15749359130859375, -0.1352386474609375, -0.11298370361328125, -0.090728759765625, -0.06847381591796875, -0.0462188720703125, -0.02396392822265625, -0.001708984375, 0.02054595947265625, 0.0428009033203125, 0.06505584716796875, 0.087310791015625, 0.10956573486328125, 0.1318206787109375, 0.15407562255859375, 0.17633056640625, 0.19858551025390625, 0.2208404541015625, 0.24309539794921875, 0.265350341796875, 0.28760528564453125, 0.3098602294921875, 0.33211517333984375, 0.3543701171875, 0.37662506103515625, 0.3988800048828125, 0.42113494873046875, 0.443389892578125, 0.46564483642578125, 0.4878997802734375, 0.5101547241210938, 0.53240966796875, 0.5546646118164062, 0.5769195556640625, 0.5991744995117188, 0.621429443359375, 0.6436843872070312, 0.6659393310546875, 0.6881942749023438, 0.71044921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 12.0, 17.0, 11.0, 20.0, 29.0, 35.0, 64.0, 64.0, 82.0, 140.0, 185.0, 286.0, 359.0, 602.0, 956.0, 1832.0, 3978.0, 9071.0, 22401.0, 57299.0, 144686.0, 325712.0, 282937.0, 117576.0, 46562.0, 18496.0, 7493.0, 3364.0, 1674.0, 862.0, 541.0, 338.0, 232.0, 205.0, 120.0, 77.0, 62.0, 54.0, 33.0, 25.0, 20.0, 13.0, 8.0, 2.0, 8.0, 3.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.482421875, -3.36590576171875, -3.2493896484375, -3.13287353515625, -3.016357421875, -2.89984130859375, -2.7833251953125, -2.66680908203125, -2.55029296875, -2.43377685546875, -2.3172607421875, -2.20074462890625, -2.084228515625, -1.96771240234375, -1.8511962890625, -1.73468017578125, -1.6181640625, -1.50164794921875, -1.3851318359375, -1.26861572265625, -1.152099609375, -1.03558349609375, -0.9190673828125, -0.80255126953125, -0.68603515625, -0.56951904296875, -0.4530029296875, -0.33648681640625, -0.219970703125, -0.10345458984375, 0.0130615234375, 0.12957763671875, 0.24609375, 0.36260986328125, 0.4791259765625, 0.59564208984375, 0.712158203125, 0.82867431640625, 0.9451904296875, 1.06170654296875, 1.17822265625, 1.29473876953125, 1.4112548828125, 1.52777099609375, 1.644287109375, 1.76080322265625, 1.8773193359375, 1.99383544921875, 2.1103515625, 2.22686767578125, 2.3433837890625, 2.45989990234375, 2.576416015625, 2.69293212890625, 2.8094482421875, 2.92596435546875, 3.04248046875, 3.15899658203125, 3.2755126953125, 3.39202880859375, 3.508544921875, 3.62506103515625, 3.7415771484375, 3.85809326171875, 3.974609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 9.0, 5.0, 12.0, 11.0, 10.0, 19.0, 19.0, 15.0, 17.0, 33.0, 31.0, 38.0, 23.0, 29.0, 30.0, 38.0, 45.0, 30.0, 42.0, 47.0, 42.0, 37.0, 42.0, 42.0, 43.0, 36.0, 27.0, 30.0, 32.0, 23.0, 27.0, 17.0, 19.0, 16.0, 15.0, 13.0, 6.0, 7.0, 6.0, 2.0, 2.0, 3.0, 7.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.091796875, -3.000823974609375, -2.90985107421875, -2.818878173828125, -2.7279052734375, -2.636932373046875, -2.54595947265625, -2.454986572265625, -2.364013671875, -2.273040771484375, -2.18206787109375, -2.091094970703125, -2.0001220703125, -1.909149169921875, -1.81817626953125, -1.727203369140625, -1.63623046875, -1.545257568359375, -1.45428466796875, -1.363311767578125, -1.2723388671875, -1.181365966796875, -1.09039306640625, -0.999420166015625, -0.908447265625, -0.817474365234375, -0.72650146484375, -0.635528564453125, -0.5445556640625, -0.453582763671875, -0.36260986328125, -0.271636962890625, -0.1806640625, -0.089691162109375, 0.00128173828125, 0.092254638671875, 0.1832275390625, 0.274200439453125, 0.36517333984375, 0.456146240234375, 0.547119140625, 0.638092041015625, 0.72906494140625, 0.820037841796875, 0.9110107421875, 1.001983642578125, 1.09295654296875, 1.183929443359375, 1.27490234375, 1.365875244140625, 1.45684814453125, 1.547821044921875, 1.6387939453125, 1.729766845703125, 1.82073974609375, 1.911712646484375, 2.002685546875, 2.093658447265625, 2.18463134765625, 2.275604248046875, 2.3665771484375, 2.457550048828125, 2.54852294921875, 2.639495849609375, 2.73046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 9.0, 2.0, 2.0, 8.0, 10.0, 12.0, 19.0, 13.0, 26.0, 39.0, 64.0, 91.0, 126.0, 203.0, 348.0, 527.0, 999.0, 1930.0, 4522.0, 13534.0, 55554.0, 291554.0, 515514.0, 124073.0, 25645.0, 7455.0, 2897.0, 1389.0, 739.0, 442.0, 289.0, 170.0, 120.0, 67.0, 53.0, 30.0, 24.0, 20.0, 8.0, 8.0, 4.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.20703125, -3.107574462890625, -3.00811767578125, -2.908660888671875, -2.8092041015625, -2.709747314453125, -2.61029052734375, -2.510833740234375, -2.411376953125, -2.311920166015625, -2.21246337890625, -2.113006591796875, -2.0135498046875, -1.914093017578125, -1.81463623046875, -1.715179443359375, -1.61572265625, -1.516265869140625, -1.41680908203125, -1.317352294921875, -1.2178955078125, -1.118438720703125, -1.01898193359375, -0.919525146484375, -0.820068359375, -0.720611572265625, -0.62115478515625, -0.521697998046875, -0.4222412109375, -0.322784423828125, -0.22332763671875, -0.123870849609375, -0.0244140625, 0.075042724609375, 0.17449951171875, 0.273956298828125, 0.3734130859375, 0.472869873046875, 0.57232666015625, 0.671783447265625, 0.771240234375, 0.870697021484375, 0.97015380859375, 1.069610595703125, 1.1690673828125, 1.268524169921875, 1.36798095703125, 1.467437744140625, 1.56689453125, 1.666351318359375, 1.76580810546875, 1.865264892578125, 1.9647216796875, 2.064178466796875, 2.16363525390625, 2.263092041015625, 2.362548828125, 2.462005615234375, 2.56146240234375, 2.660919189453125, 2.7603759765625, 2.859832763671875, 2.95928955078125, 3.058746337890625, 3.158203125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 3.0, 7.0, 5.0, 13.0, 9.0, 18.0, 12.0, 24.0, 17.0, 19.0, 26.0, 39.0, 50.0, 82.0, 109.0, 107.0, 108.0, 72.0, 54.0, 47.0, 32.0, 26.0, 22.0, 20.0, 13.0, 12.0, 13.0, 3.0, 5.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003070831298828125, -0.0002958737313747406, -0.0002846643328666687, -0.0002734549343585968, -0.0002622455358505249, -0.000251036137342453, -0.0002398267388343811, -0.0002286173403263092, -0.0002174079418182373, -0.0002061985433101654, -0.0001949891448020935, -0.0001837797462940216, -0.0001725703477859497, -0.0001613609492778778, -0.0001501515507698059, -0.000138942152261734, -0.0001277327537536621, -0.00011652335524559021, -0.00010531395673751831, -9.410455822944641e-05, -8.289515972137451e-05, -7.168576121330261e-05, -6.047636270523071e-05, -4.9266964197158813e-05, -3.8057565689086914e-05, -2.6848167181015015e-05, -1.5638768672943115e-05, -4.429370164871216e-06, 6.780028343200684e-06, 1.7989426851272583e-05, 2.9198825359344482e-05, 4.040822386741638e-05, 5.161762237548828e-05, 6.282702088356018e-05, 7.403641939163208e-05, 8.524581789970398e-05, 9.645521640777588e-05, 0.00010766461491584778, 0.00011887401342391968, 0.00013008341193199158, 0.00014129281044006348, 0.00015250220894813538, 0.00016371160745620728, 0.00017492100596427917, 0.00018613040447235107, 0.00019733980298042297, 0.00020854920148849487, 0.00021975859999656677, 0.00023096799850463867, 0.00024217739701271057, 0.00025338679552078247, 0.00026459619402885437, 0.00027580559253692627, 0.00028701499104499817, 0.00029822438955307007, 0.00030943378806114197, 0.00032064318656921387, 0.00033185258507728577, 0.00034306198358535767, 0.00035427138209342957, 0.00036548078060150146, 0.00037669017910957336, 0.00038789957761764526, 0.00039910897612571716, 0.00041031837463378906]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 18.0, 16.0, 20.0, 29.0, 46.0, 86.0, 120.0, 250.0, 460.0, 938.0, 2035.0, 5956.0, 26203.0, 304515.0, 633941.0, 58612.0, 9648.0, 3086.0, 1294.0, 584.0, 274.0, 146.0, 81.0, 49.0, 47.0, 20.0, 16.0, 14.0, 9.0, 8.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.06640625, -4.90899658203125, -4.7515869140625, -4.59417724609375, -4.436767578125, -4.27935791015625, -4.1219482421875, -3.96453857421875, -3.80712890625, -3.64971923828125, -3.4923095703125, -3.33489990234375, -3.177490234375, -3.02008056640625, -2.8626708984375, -2.70526123046875, -2.5478515625, -2.39044189453125, -2.2330322265625, -2.07562255859375, -1.918212890625, -1.76080322265625, -1.6033935546875, -1.44598388671875, -1.28857421875, -1.13116455078125, -0.9737548828125, -0.81634521484375, -0.658935546875, -0.50152587890625, -0.3441162109375, -0.18670654296875, -0.029296875, 0.12811279296875, 0.2855224609375, 0.44293212890625, 0.600341796875, 0.75775146484375, 0.9151611328125, 1.07257080078125, 1.22998046875, 1.38739013671875, 1.5447998046875, 1.70220947265625, 1.859619140625, 2.01702880859375, 2.1744384765625, 2.33184814453125, 2.4892578125, 2.64666748046875, 2.8040771484375, 2.96148681640625, 3.118896484375, 3.27630615234375, 3.4337158203125, 3.59112548828125, 3.74853515625, 3.90594482421875, 4.0633544921875, 4.22076416015625, 4.378173828125, 4.53558349609375, 4.6929931640625, 4.85040283203125, 5.0078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 5.0, 2.0, 4.0, 7.0, 9.0, 19.0, 22.0, 67.0, 124.0, 175.0, 217.0, 157.0, 102.0, 44.0, 20.0, 8.0, 9.0, 7.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2421875, -4.1024169921875, -3.962646484375, -3.8228759765625, -3.68310546875, -3.5433349609375, -3.403564453125, -3.2637939453125, -3.1240234375, -2.9842529296875, -2.844482421875, -2.7047119140625, -2.56494140625, -2.4251708984375, -2.285400390625, -2.1456298828125, -2.005859375, -1.8660888671875, -1.726318359375, -1.5865478515625, -1.44677734375, -1.3070068359375, -1.167236328125, -1.0274658203125, -0.8876953125, -0.7479248046875, -0.608154296875, -0.4683837890625, -0.32861328125, -0.1888427734375, -0.049072265625, 0.0906982421875, 0.23046875, 0.3702392578125, 0.510009765625, 0.6497802734375, 0.78955078125, 0.9293212890625, 1.069091796875, 1.2088623046875, 1.3486328125, 1.4884033203125, 1.628173828125, 1.7679443359375, 1.90771484375, 2.0474853515625, 2.187255859375, 2.3270263671875, 2.466796875, 2.6065673828125, 2.746337890625, 2.8861083984375, 3.02587890625, 3.1656494140625, 3.305419921875, 3.4451904296875, 3.5849609375, 3.7247314453125, 3.864501953125, 4.0042724609375, 4.14404296875, 4.2838134765625, 4.423583984375, 4.5633544921875, 4.703125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 17.0, 27.0, 82.0, 141.0, 198.0, 226.0, 146.0, 99.0, 31.0, 18.0, 8.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.5025405883789, -64.65855407714844, -62.8145637512207, -60.970577239990234, -59.1265869140625, -57.28260040283203, -55.43861389160156, -53.594627380371094, -51.75063705444336, -49.90665054321289, -48.062660217285156, -46.21867370605469, -44.37468719482422, -42.530696868896484, -40.686710357666016, -38.84272003173828, -36.99873352050781, -35.154747009277344, -33.31075668334961, -31.46677017211914, -29.62278175354004, -27.778793334960938, -25.93480682373047, -24.090818405151367, -22.246829986572266, -20.402841567993164, -18.558853149414062, -16.714866638183594, -14.870878219604492, -13.02688980102539, -11.182902336120605, -9.33891487121582, -7.494926452636719, -5.650938510894775, -3.806950569152832, -1.9629626274108887, -0.11897468566894531, 1.7250137329101562, 3.5690011978149414, 5.412988662719727, 7.256977081298828, 9.10096549987793, 10.944952964782715, 12.7889404296875, 14.632928848266602, 16.476917266845703, 18.320903778076172, 20.164892196655273, 22.008880615234375, 23.852869033813477, 25.696857452392578, 27.540843963623047, 29.38483238220215, 31.22882080078125, 33.07280731201172, 34.91679382324219, 36.76078414916992, 38.60477066040039, 40.448760986328125, 42.292747497558594, 44.13673400878906, 45.9807243347168, 47.824710845947266, 49.668701171875, 51.51268768310547]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 1.0, 6.0, 7.0, 10.0, 10.0, 13.0, 14.0, 15.0, 18.0, 24.0, 27.0, 30.0, 32.0, 32.0, 34.0, 38.0, 30.0, 46.0, 51.0, 40.0, 45.0, 51.0, 46.0, 34.0, 40.0, 40.0, 32.0, 25.0, 20.0, 28.0, 28.0, 20.0, 17.0, 23.0, 10.0, 9.0, 9.0, 5.0, 9.0, 8.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.858320236206055, -15.334580421447754, -14.810840606689453, -14.287100791931152, -13.763360977172852, -13.239620208740234, -12.715880393981934, -12.192140579223633, -11.668400764465332, -11.144660949707031, -10.62092113494873, -10.09718132019043, -9.573440551757812, -9.049701690673828, -8.525960922241211, -8.00222110748291, -7.478481292724609, -6.954741477966309, -6.431001663208008, -5.907261371612549, -5.383521556854248, -4.859781742095947, -4.336041450500488, -3.8123016357421875, -3.2885618209838867, -2.764822006225586, -2.241081953048706, -1.7173420190811157, -1.1936020851135254, -0.6698622703552246, -0.14612221717834473, 0.37761783599853516, 0.9013557434082031, 1.4250956773757935, 1.9488356113433838, 2.4725756645202637, 2.9963154792785645, 3.5200552940368652, 4.043795585632324, 4.567535400390625, 5.091275215148926, 5.615015029907227, 6.138754844665527, 6.662495136260986, 7.186234951019287, 7.709974765777588, 8.233715057373047, 8.757454872131348, 9.281194686889648, 9.80493450164795, 10.32867431640625, 10.85241413116455, 11.376153945922852, 11.899894714355469, 12.42363452911377, 12.94737434387207, 13.471114158630371, 13.994853973388672, 14.518593788146973, 15.042333602905273, 15.56607437133789, 16.089813232421875, 16.613554000854492, 17.13729476928711, 17.661033630371094]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 8.0, 13.0, 3.0, 9.0, 20.0, 16.0, 29.0, 36.0, 68.0, 92.0, 123.0, 210.0, 304.0, 465.0, 746.0, 1273.0, 2217.0, 4083.0, 8022.0, 17157.0, 41839.0, 141427.0, 2967215.0, 839675.0, 104441.0, 34454.0, 14598.0, 7024.0, 3662.0, 1989.0, 1136.0, 671.0, 427.0, 277.0, 189.0, 115.0, 83.0, 60.0, 39.0, 22.0, 11.0, 10.0, 9.0, 6.0, 7.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-4.8046875, -4.6669921875, -4.529296875, -4.3916015625, -4.25390625, -4.1162109375, -3.978515625, -3.8408203125, -3.703125, -3.5654296875, -3.427734375, -3.2900390625, -3.15234375, -3.0146484375, -2.876953125, -2.7392578125, -2.6015625, -2.4638671875, -2.326171875, -2.1884765625, -2.05078125, -1.9130859375, -1.775390625, -1.6376953125, -1.5, -1.3623046875, -1.224609375, -1.0869140625, -0.94921875, -0.8115234375, -0.673828125, -0.5361328125, -0.3984375, -0.2607421875, -0.123046875, 0.0146484375, 0.15234375, 0.2900390625, 0.427734375, 0.5654296875, 0.703125, 0.8408203125, 0.978515625, 1.1162109375, 1.25390625, 1.3916015625, 1.529296875, 1.6669921875, 1.8046875, 1.9423828125, 2.080078125, 2.2177734375, 2.35546875, 2.4931640625, 2.630859375, 2.7685546875, 2.90625, 3.0439453125, 3.181640625, 3.3193359375, 3.45703125, 3.5947265625, 3.732421875, 3.8701171875, 4.0078125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 8.0, 10.0, 6.0, 11.0, 9.0, 7.0, 24.0, 17.0, 26.0, 23.0, 31.0, 34.0, 37.0, 36.0, 38.0, 58.0, 54.0, 51.0, 50.0, 45.0, 50.0, 47.0, 42.0, 58.0, 34.0, 31.0, 21.0, 28.0, 22.0, 22.0, 16.0, 10.0, 11.0, 7.0, 7.0, 3.0, 3.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.759765625, -0.7361907958984375, -0.712615966796875, -0.6890411376953125, -0.66546630859375, -0.6418914794921875, -0.618316650390625, -0.5947418212890625, -0.5711669921875, -0.5475921630859375, -0.524017333984375, -0.5004425048828125, -0.47686767578125, -0.4532928466796875, -0.429718017578125, -0.4061431884765625, -0.382568359375, -0.3589935302734375, -0.335418701171875, -0.3118438720703125, -0.28826904296875, -0.2646942138671875, -0.241119384765625, -0.2175445556640625, -0.1939697265625, -0.1703948974609375, -0.146820068359375, -0.1232452392578125, -0.09967041015625, -0.0760955810546875, -0.052520751953125, -0.0289459228515625, -0.00537109375, 0.0182037353515625, 0.041778564453125, 0.0653533935546875, 0.08892822265625, 0.1125030517578125, 0.136077880859375, 0.1596527099609375, 0.1832275390625, 0.2068023681640625, 0.230377197265625, 0.2539520263671875, 0.27752685546875, 0.3011016845703125, 0.324676513671875, 0.3482513427734375, 0.371826171875, 0.3954010009765625, 0.418975830078125, 0.4425506591796875, 0.46612548828125, 0.4897003173828125, 0.513275146484375, 0.5368499755859375, 0.5604248046875, 0.5839996337890625, 0.607574462890625, 0.6311492919921875, 0.65472412109375, 0.6782989501953125, 0.701873779296875, 0.7254486083984375, 0.7490234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 7.0, 5.0, 12.0, 17.0, 16.0, 20.0, 35.0, 46.0, 65.0, 102.0, 156.0, 246.0, 433.0, 744.0, 1602.0, 3446.0, 8866.0, 24660.0, 83513.0, 460749.0, 3223504.0, 290833.0, 62527.0, 19492.0, 7057.0, 2978.0, 1344.0, 668.0, 383.0, 215.0, 153.0, 114.0, 67.0, 44.0, 36.0, 33.0, 26.0, 16.0, 5.0, 12.0, 7.0, 5.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-4.72265625, -4.5672607421875, -4.411865234375, -4.2564697265625, -4.10107421875, -3.9456787109375, -3.790283203125, -3.6348876953125, -3.4794921875, -3.3240966796875, -3.168701171875, -3.0133056640625, -2.85791015625, -2.7025146484375, -2.547119140625, -2.3917236328125, -2.236328125, -2.0809326171875, -1.925537109375, -1.7701416015625, -1.61474609375, -1.4593505859375, -1.303955078125, -1.1485595703125, -0.9931640625, -0.8377685546875, -0.682373046875, -0.5269775390625, -0.37158203125, -0.2161865234375, -0.060791015625, 0.0946044921875, 0.25, 0.4053955078125, 0.560791015625, 0.7161865234375, 0.87158203125, 1.0269775390625, 1.182373046875, 1.3377685546875, 1.4931640625, 1.6485595703125, 1.803955078125, 1.9593505859375, 2.11474609375, 2.2701416015625, 2.425537109375, 2.5809326171875, 2.736328125, 2.8917236328125, 3.047119140625, 3.2025146484375, 3.35791015625, 3.5133056640625, 3.668701171875, 3.8240966796875, 3.9794921875, 4.1348876953125, 4.290283203125, 4.4456787109375, 4.60107421875, 4.7564697265625, 4.911865234375, 5.0672607421875, 5.22265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 5.0, 9.0, 13.0, 10.0, 22.0, 21.0, 38.0, 45.0, 80.0, 154.0, 228.0, 515.0, 1620.0, 635.0, 249.0, 147.0, 88.0, 62.0, 34.0, 31.0, 23.0, 14.0, 7.0, 7.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3203125, -1.2562255859375, -1.192138671875, -1.1280517578125, -1.06396484375, -0.9998779296875, -0.935791015625, -0.8717041015625, -0.8076171875, -0.7435302734375, -0.679443359375, -0.6153564453125, -0.55126953125, -0.4871826171875, -0.423095703125, -0.3590087890625, -0.294921875, -0.2308349609375, -0.166748046875, -0.1026611328125, -0.03857421875, 0.0255126953125, 0.089599609375, 0.1536865234375, 0.2177734375, 0.2818603515625, 0.345947265625, 0.4100341796875, 0.47412109375, 0.5382080078125, 0.602294921875, 0.6663818359375, 0.73046875, 0.7945556640625, 0.858642578125, 0.9227294921875, 0.98681640625, 1.0509033203125, 1.114990234375, 1.1790771484375, 1.2431640625, 1.3072509765625, 1.371337890625, 1.4354248046875, 1.49951171875, 1.5635986328125, 1.627685546875, 1.6917724609375, 1.755859375, 1.8199462890625, 1.884033203125, 1.9481201171875, 2.01220703125, 2.0762939453125, 2.140380859375, 2.2044677734375, 2.2685546875, 2.3326416015625, 2.396728515625, 2.4608154296875, 2.52490234375, 2.5889892578125, 2.653076171875, 2.7171630859375, 2.78125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 11.0, 14.0, 51.0, 77.0, 97.0, 131.0, 184.0, 143.0, 126.0, 59.0, 41.0, 31.0, 15.0, 10.0, 8.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.526201248168945, -20.995834350585938, -20.46546745300293, -19.935100555419922, -19.40473175048828, -18.874364852905273, -18.343997955322266, -17.813631057739258, -17.28326416015625, -16.752897262573242, -16.222530364990234, -15.69216251373291, -15.161795616149902, -14.631427764892578, -14.10106086730957, -13.570693969726562, -13.040326118469238, -12.50995922088623, -11.979591369628906, -11.449224472045898, -10.91885757446289, -10.388490676879883, -9.858122825622559, -9.32775592803955, -8.797388076782227, -8.267021179199219, -7.736653804779053, -7.206286430358887, -6.675919532775879, -6.145552158355713, -5.615184783935547, -5.084817886352539, -4.554450988769531, -4.024083614349365, -3.4937167167663574, -2.9633493423461914, -2.4329822063446045, -1.9026150703430176, -1.3722476959228516, -0.8418805599212646, -0.31151342391967773, 0.21885377168655396, 0.7492209672927856, 1.279588222503662, 1.809955358505249, 2.340322494506836, 2.870689868927002, 3.401057004928589, 3.931424140930176, 4.461791515350342, 4.99215841293335, 5.522525787353516, 6.052892684936523, 6.5832600593566895, 7.1136274337768555, 7.643994331359863, 8.174362182617188, 8.704729080200195, 9.23509693145752, 9.765463829040527, 10.295830726623535, 10.82619857788086, 11.356565475463867, 11.886932373046875, 12.417299270629883]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 9.0, 4.0, 13.0, 8.0, 12.0, 6.0, 8.0, 20.0, 21.0, 25.0, 27.0, 31.0, 23.0, 37.0, 42.0, 37.0, 42.0, 42.0, 49.0, 37.0, 40.0, 43.0, 31.0, 34.0, 34.0, 43.0, 32.0, 20.0, 19.0, 32.0, 32.0, 28.0, 19.0, 25.0, 16.0, 14.0, 13.0, 11.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.710840702056885, -5.529642581939697, -5.348443984985352, -5.167245864868164, -4.986047744750977, -4.804849147796631, -4.623651027679443, -4.442452430725098, -4.26125431060791, -4.080056190490723, -3.898857593536377, -3.7176594734191895, -3.536461114883423, -3.3552627563476562, -3.1740646362304688, -2.992866277694702, -2.8116679191589355, -2.630469560623169, -2.4492712020874023, -2.268073081970215, -2.0868747234344482, -1.9056763648986816, -1.7244781255722046, -1.5432798862457275, -1.362081527709961, -1.1808831691741943, -0.9996849298477173, -0.8184866309165955, -0.6372883319854736, -0.4560900330543518, -0.27489173412323, -0.09369349479675293, 0.08750438690185547, 0.2687026858329773, 0.4499009847640991, 0.631099283695221, 0.8122975826263428, 0.9934958815574646, 1.1746941804885864, 1.3558924198150635, 1.53709077835083, 1.7182891368865967, 1.8994873762130737, 2.080685615539551, 2.2618839740753174, 2.443082332611084, 2.6242804527282715, 2.805478811264038, 2.9866771697998047, 3.1678755283355713, 3.349073886871338, 3.5302720069885254, 3.711470365524292, 3.8926687240600586, 4.073866844177246, 4.255064964294434, 4.436263561248779, 4.617461681365967, 4.7986602783203125, 4.9798583984375, 5.1610565185546875, 5.342255115509033, 5.523453235626221, 5.704651832580566, 5.885849952697754]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 8.0, 6.0, 10.0, 14.0, 20.0, 33.0, 58.0, 107.0, 197.0, 394.0, 953.0, 2603.0, 8447.0, 30250.0, 128867.0, 490151.0, 295628.0, 66154.0, 16643.0, 4992.0, 1708.0, 650.0, 288.0, 154.0, 81.0, 51.0, 31.0, 20.0, 8.0, 6.0, 9.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.8316650390625, -7.585205078125, -7.3387451171875, -7.09228515625, -6.8458251953125, -6.599365234375, -6.3529052734375, -6.1064453125, -5.8599853515625, -5.613525390625, -5.3670654296875, -5.12060546875, -4.8741455078125, -4.627685546875, -4.3812255859375, -4.134765625, -3.8883056640625, -3.641845703125, -3.3953857421875, -3.14892578125, -2.9024658203125, -2.656005859375, -2.4095458984375, -2.1630859375, -1.9166259765625, -1.670166015625, -1.4237060546875, -1.17724609375, -0.9307861328125, -0.684326171875, -0.4378662109375, -0.19140625, 0.0550537109375, 0.301513671875, 0.5479736328125, 0.79443359375, 1.0408935546875, 1.287353515625, 1.5338134765625, 1.7802734375, 2.0267333984375, 2.273193359375, 2.5196533203125, 2.76611328125, 3.0125732421875, 3.259033203125, 3.5054931640625, 3.751953125, 3.9984130859375, 4.244873046875, 4.4913330078125, 4.73779296875, 4.9842529296875, 5.230712890625, 5.4771728515625, 5.7236328125, 5.9700927734375, 6.216552734375, 6.4630126953125, 6.70947265625, 6.9559326171875, 7.202392578125, 7.4488525390625, 7.6953125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 9.0, 12.0, 8.0, 7.0, 10.0, 12.0, 14.0, 22.0, 28.0, 27.0, 31.0, 47.0, 40.0, 44.0, 47.0, 51.0, 53.0, 51.0, 64.0, 48.0, 39.0, 53.0, 48.0, 33.0, 42.0, 32.0, 26.0, 21.0, 11.0, 15.0, 15.0, 10.0, 5.0, 6.0, 6.0, 2.0, 4.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78662109375, -0.7624053955078125, -0.738189697265625, -0.7139739990234375, -0.68975830078125, -0.6655426025390625, -0.641326904296875, -0.6171112060546875, -0.5928955078125, -0.5686798095703125, -0.544464111328125, -0.5202484130859375, -0.49603271484375, -0.4718170166015625, -0.447601318359375, -0.4233856201171875, -0.399169921875, -0.3749542236328125, -0.350738525390625, -0.3265228271484375, -0.30230712890625, -0.2780914306640625, -0.253875732421875, -0.2296600341796875, -0.2054443359375, -0.1812286376953125, -0.157012939453125, -0.1327972412109375, -0.10858154296875, -0.0843658447265625, -0.060150146484375, -0.0359344482421875, -0.01171875, 0.0124969482421875, 0.036712646484375, 0.0609283447265625, 0.08514404296875, 0.1093597412109375, 0.133575439453125, 0.1577911376953125, 0.1820068359375, 0.2062225341796875, 0.230438232421875, 0.2546539306640625, 0.27886962890625, 0.3030853271484375, 0.327301025390625, 0.3515167236328125, 0.375732421875, 0.3999481201171875, 0.424163818359375, 0.4483795166015625, 0.47259521484375, 0.4968109130859375, 0.521026611328125, 0.5452423095703125, 0.5694580078125, 0.5936737060546875, 0.617889404296875, 0.6421051025390625, 0.66632080078125, 0.6905364990234375, 0.714752197265625, 0.7389678955078125, 0.76318359375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 5.0, 10.0, 16.0, 8.0, 26.0, 25.0, 41.0, 50.0, 63.0, 77.0, 120.0, 152.0, 192.0, 267.0, 342.0, 476.0, 825.0, 1395.0, 2939.0, 7207.0, 19718.0, 56381.0, 161973.0, 369005.0, 271292.0, 99716.0, 33840.0, 12226.0, 4751.0, 2082.0, 1066.0, 646.0, 429.0, 305.0, 221.0, 168.0, 120.0, 83.0, 70.0, 62.0, 46.0, 41.0, 19.0, 13.0, 11.0, 6.0, 7.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-4.05078125, -3.930816650390625, -3.81085205078125, -3.690887451171875, -3.5709228515625, -3.450958251953125, -3.33099365234375, -3.211029052734375, -3.091064453125, -2.971099853515625, -2.85113525390625, -2.731170654296875, -2.6112060546875, -2.491241455078125, -2.37127685546875, -2.251312255859375, -2.13134765625, -2.011383056640625, -1.89141845703125, -1.771453857421875, -1.6514892578125, -1.531524658203125, -1.41156005859375, -1.291595458984375, -1.171630859375, -1.051666259765625, -0.93170166015625, -0.811737060546875, -0.6917724609375, -0.571807861328125, -0.45184326171875, -0.331878662109375, -0.2119140625, -0.091949462890625, 0.02801513671875, 0.147979736328125, 0.2679443359375, 0.387908935546875, 0.50787353515625, 0.627838134765625, 0.747802734375, 0.867767333984375, 0.98773193359375, 1.107696533203125, 1.2276611328125, 1.347625732421875, 1.46759033203125, 1.587554931640625, 1.70751953125, 1.827484130859375, 1.94744873046875, 2.067413330078125, 2.1873779296875, 2.307342529296875, 2.42730712890625, 2.547271728515625, 2.667236328125, 2.787200927734375, 2.90716552734375, 3.027130126953125, 3.1470947265625, 3.267059326171875, 3.38702392578125, 3.506988525390625, 3.626953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 1.0, 4.0, 7.0, 6.0, 2.0, 4.0, 17.0, 17.0, 12.0, 21.0, 24.0, 25.0, 29.0, 36.0, 32.0, 35.0, 37.0, 36.0, 40.0, 44.0, 38.0, 44.0, 42.0, 49.0, 37.0, 31.0, 35.0, 37.0, 34.0, 37.0, 24.0, 23.0, 20.0, 29.0, 17.0, 15.0, 10.0, 8.0, 6.0, 7.0, 7.0, 9.0, 9.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4296875, -2.34344482421875, -2.2572021484375, -2.17095947265625, -2.084716796875, -1.99847412109375, -1.9122314453125, -1.82598876953125, -1.73974609375, -1.65350341796875, -1.5672607421875, -1.48101806640625, -1.394775390625, -1.30853271484375, -1.2222900390625, -1.13604736328125, -1.0498046875, -0.96356201171875, -0.8773193359375, -0.79107666015625, -0.704833984375, -0.61859130859375, -0.5323486328125, -0.44610595703125, -0.35986328125, -0.27362060546875, -0.1873779296875, -0.10113525390625, -0.014892578125, 0.07135009765625, 0.1575927734375, 0.24383544921875, 0.330078125, 0.41632080078125, 0.5025634765625, 0.58880615234375, 0.675048828125, 0.76129150390625, 0.8475341796875, 0.93377685546875, 1.02001953125, 1.10626220703125, 1.1925048828125, 1.27874755859375, 1.364990234375, 1.45123291015625, 1.5374755859375, 1.62371826171875, 1.7099609375, 1.79620361328125, 1.8824462890625, 1.96868896484375, 2.054931640625, 2.14117431640625, 2.2274169921875, 2.31365966796875, 2.39990234375, 2.48614501953125, 2.5723876953125, 2.65863037109375, 2.744873046875, 2.83111572265625, 2.9173583984375, 3.00360107421875, 3.08984375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 8.0, 1.0, 4.0, 2.0, 4.0, 9.0, 10.0, 13.0, 13.0, 25.0, 42.0, 52.0, 98.0, 154.0, 301.0, 589.0, 1445.0, 3952.0, 13150.0, 70002.0, 495892.0, 393319.0, 52995.0, 10736.0, 3257.0, 1262.0, 548.0, 280.0, 151.0, 82.0, 55.0, 49.0, 14.0, 13.0, 12.0, 4.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.509765625, -3.392486572265625, -3.27520751953125, -3.157928466796875, -3.0406494140625, -2.923370361328125, -2.80609130859375, -2.688812255859375, -2.571533203125, -2.454254150390625, -2.33697509765625, -2.219696044921875, -2.1024169921875, -1.985137939453125, -1.86785888671875, -1.750579833984375, -1.63330078125, -1.516021728515625, -1.39874267578125, -1.281463623046875, -1.1641845703125, -1.046905517578125, -0.92962646484375, -0.812347412109375, -0.695068359375, -0.577789306640625, -0.46051025390625, -0.343231201171875, -0.2259521484375, -0.108673095703125, 0.00860595703125, 0.125885009765625, 0.2431640625, 0.360443115234375, 0.47772216796875, 0.595001220703125, 0.7122802734375, 0.829559326171875, 0.94683837890625, 1.064117431640625, 1.181396484375, 1.298675537109375, 1.41595458984375, 1.533233642578125, 1.6505126953125, 1.767791748046875, 1.88507080078125, 2.002349853515625, 2.11962890625, 2.236907958984375, 2.35418701171875, 2.471466064453125, 2.5887451171875, 2.706024169921875, 2.82330322265625, 2.940582275390625, 3.057861328125, 3.175140380859375, 3.29241943359375, 3.409698486328125, 3.5269775390625, 3.644256591796875, 3.76153564453125, 3.878814697265625, 3.99609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 5.0, 5.0, 6.0, 14.0, 7.0, 16.0, 9.0, 25.0, 19.0, 23.0, 25.0, 39.0, 46.0, 71.0, 85.0, 122.0, 92.0, 83.0, 54.0, 41.0, 39.0, 30.0, 30.0, 22.0, 19.0, 20.0, 4.0, 11.0, 5.0, 3.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.0004062652587890625, -0.00039550289511680603, -0.00038474053144454956, -0.0003739781677722931, -0.0003632158041000366, -0.00035245344042778015, -0.0003416910767555237, -0.0003309287130832672, -0.00032016634941101074, -0.00030940398573875427, -0.0002986416220664978, -0.00028787925839424133, -0.00027711689472198486, -0.0002663545310497284, -0.0002555921673774719, -0.00024482980370521545, -0.00023406744003295898, -0.00022330507636070251, -0.00021254271268844604, -0.00020178034901618958, -0.0001910179853439331, -0.00018025562167167664, -0.00016949325799942017, -0.0001587308943271637, -0.00014796853065490723, -0.00013720616698265076, -0.0001264438033103943, -0.00011568143963813782, -0.00010491907596588135, -9.415671229362488e-05, -8.339434862136841e-05, -7.263198494911194e-05, -6.186962127685547e-05, -5.1107257604599e-05, -4.034489393234253e-05, -2.958253026008606e-05, -1.882016658782959e-05, -8.05780291557312e-06, 2.7045607566833496e-06, 1.346692442893982e-05, 2.422928810119629e-05, 3.499165177345276e-05, 4.575401544570923e-05, 5.65163791179657e-05, 6.727874279022217e-05, 7.804110646247864e-05, 8.880347013473511e-05, 9.956583380699158e-05, 0.00011032819747924805, 0.00012109056115150452, 0.00013185292482376099, 0.00014261528849601746, 0.00015337765216827393, 0.0001641400158405304, 0.00017490237951278687, 0.00018566474318504333, 0.0001964271068572998, 0.00020718947052955627, 0.00021795183420181274, 0.00022871419787406921, 0.00023947656154632568, 0.00025023892521858215, 0.0002610012888908386, 0.0002717636525630951, 0.00028252601623535156]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 10.0, 7.0, 5.0, 12.0, 24.0, 15.0, 38.0, 35.0, 79.0, 98.0, 159.0, 283.0, 519.0, 1001.0, 2154.0, 5212.0, 18268.0, 106296.0, 625479.0, 241904.0, 33015.0, 7891.0, 2993.0, 1343.0, 635.0, 412.0, 234.0, 135.0, 99.0, 60.0, 32.0, 23.0, 17.0, 14.0, 8.0, 11.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.33984375, -3.21923828125, -3.0986328125, -2.97802734375, -2.857421875, -2.73681640625, -2.6162109375, -2.49560546875, -2.375, -2.25439453125, -2.1337890625, -2.01318359375, -1.892578125, -1.77197265625, -1.6513671875, -1.53076171875, -1.41015625, -1.28955078125, -1.1689453125, -1.04833984375, -0.927734375, -0.80712890625, -0.6865234375, -0.56591796875, -0.4453125, -0.32470703125, -0.2041015625, -0.08349609375, 0.037109375, 0.15771484375, 0.2783203125, 0.39892578125, 0.51953125, 0.64013671875, 0.7607421875, 0.88134765625, 1.001953125, 1.12255859375, 1.2431640625, 1.36376953125, 1.484375, 1.60498046875, 1.7255859375, 1.84619140625, 1.966796875, 2.08740234375, 2.2080078125, 2.32861328125, 2.44921875, 2.56982421875, 2.6904296875, 2.81103515625, 2.931640625, 3.05224609375, 3.1728515625, 3.29345703125, 3.4140625, 3.53466796875, 3.6552734375, 3.77587890625, 3.896484375, 4.01708984375, 4.1376953125, 4.25830078125, 4.37890625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 8.0, 2.0, 11.0, 14.0, 12.0, 13.0, 25.0, 39.0, 37.0, 43.0, 76.0, 58.0, 105.0, 98.0, 97.0, 86.0, 56.0, 57.0, 44.0, 28.0, 18.0, 22.0, 8.0, 3.0, 7.0, 2.0, 9.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.033203125, -1.966064453125, -1.89892578125, -1.831787109375, -1.7646484375, -1.697509765625, -1.63037109375, -1.563232421875, -1.49609375, -1.428955078125, -1.36181640625, -1.294677734375, -1.2275390625, -1.160400390625, -1.09326171875, -1.026123046875, -0.958984375, -0.891845703125, -0.82470703125, -0.757568359375, -0.6904296875, -0.623291015625, -0.55615234375, -0.489013671875, -0.421875, -0.354736328125, -0.28759765625, -0.220458984375, -0.1533203125, -0.086181640625, -0.01904296875, 0.048095703125, 0.115234375, 0.182373046875, 0.24951171875, 0.316650390625, 0.3837890625, 0.450927734375, 0.51806640625, 0.585205078125, 0.65234375, 0.719482421875, 0.78662109375, 0.853759765625, 0.9208984375, 0.988037109375, 1.05517578125, 1.122314453125, 1.189453125, 1.256591796875, 1.32373046875, 1.390869140625, 1.4580078125, 1.525146484375, 1.59228515625, 1.659423828125, 1.7265625, 1.793701171875, 1.86083984375, 1.927978515625, 1.9951171875, 2.062255859375, 2.12939453125, 2.196533203125, 2.263671875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 9.0, 20.0, 39.0, 67.0, 99.0, 160.0, 176.0, 152.0, 109.0, 72.0, 47.0, 29.0, 11.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.64947509765625, -35.317970275878906, -33.98646545410156, -32.65495681762695, -31.32345199584961, -29.991947174072266, -28.66044044494629, -27.328933715820312, -25.99742889404297, -24.665924072265625, -23.33441734313965, -22.002910614013672, -20.671405792236328, -19.339900970458984, -18.008394241333008, -16.67688751220703, -15.345382690429688, -14.013876914978027, -12.682371139526367, -11.350865364074707, -10.019359588623047, -8.687853813171387, -7.356348037719727, -6.024842262268066, -4.693336486816406, -3.361830711364746, -2.030324935913086, -0.6988191604614258, 0.6326866149902344, 1.9641923904418945, 3.2956981658935547, 4.627203941345215, 5.958713531494141, 7.290219306945801, 8.621725082397461, 9.953230857849121, 11.284736633300781, 12.616242408752441, 13.947748184204102, 15.279253959655762, 16.610759735107422, 17.942264556884766, 19.273771286010742, 20.60527801513672, 21.936782836914062, 23.268287658691406, 24.599794387817383, 25.93130111694336, 27.262805938720703, 28.594310760498047, 29.925817489624023, 31.25732421875, 32.588829040527344, 33.92033386230469, 35.25183868408203, 36.58334732055664, 37.914852142333984, 39.24635696411133, 40.57786560058594, 41.90937042236328, 43.240875244140625, 44.57238006591797, 45.90388488769531, 47.23539352416992, 48.566898345947266]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 8.0, 7.0, 6.0, 9.0, 9.0, 13.0, 9.0, 14.0, 15.0, 21.0, 27.0, 17.0, 36.0, 36.0, 28.0, 43.0, 35.0, 36.0, 46.0, 41.0, 46.0, 44.0, 40.0, 46.0, 51.0, 36.0, 41.0, 22.0, 31.0, 24.0, 29.0, 29.0, 20.0, 13.0, 12.0, 16.0, 12.0, 3.0, 11.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.586642265319824, -14.08240032196045, -13.578158378601074, -13.0739164352417, -12.569674491882324, -12.06543254852295, -11.561189651489258, -11.056947708129883, -10.552705764770508, -10.048463821411133, -9.544221878051758, -9.039979934692383, -8.535737991333008, -8.031496047973633, -7.5272536277771, -7.023011684417725, -6.518770217895508, -6.014528274536133, -5.510286331176758, -5.006044387817383, -4.501802444458008, -3.9975602626800537, -3.4933180809020996, -2.9890761375427246, -2.4848341941833496, -1.9805922508239746, -1.47635018825531, -0.9721081256866455, -0.4678661823272705, 0.03637576103210449, 0.5406179428100586, 1.0448598861694336, 1.5491008758544922, 2.053342819213867, 2.557584762573242, 3.0618269443511963, 3.5660688877105713, 4.070310592651367, 4.5745530128479, 5.078794956207275, 5.58303689956665, 6.087278842926025, 6.5915207862854, 7.095763206481934, 7.600005149841309, 8.104247093200684, 8.608489036560059, 9.112730979919434, 9.616972923278809, 10.121214866638184, 10.625456809997559, 11.129698753356934, 11.633940696716309, 12.138182640075684, 12.642425537109375, 13.14666748046875, 13.650909423828125, 14.1551513671875, 14.659393310546875, 15.16363525390625, 15.667877197265625, 16.172119140625, 16.676361083984375, 17.18060302734375, 17.684844970703125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 3.0, 4.0, 8.0, 11.0, 22.0, 16.0, 32.0, 48.0, 53.0, 68.0, 120.0, 187.0, 296.0, 421.0, 704.0, 1111.0, 1871.0, 3349.0, 6151.0, 12927.0, 28387.0, 76750.0, 304462.0, 3208946.0, 395204.0, 90039.0, 32800.0, 14285.0, 7078.0, 3662.0, 2083.0, 1147.0, 726.0, 468.0, 273.0, 182.0, 103.0, 86.0, 57.0, 41.0, 41.0, 16.0, 14.0, 9.0, 5.0, 4.0, 0.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.40625, -4.274993896484375, -4.14373779296875, -4.012481689453125, -3.8812255859375, -3.749969482421875, -3.61871337890625, -3.487457275390625, -3.356201171875, -3.224945068359375, -3.09368896484375, -2.962432861328125, -2.8311767578125, -2.699920654296875, -2.56866455078125, -2.437408447265625, -2.30615234375, -2.174896240234375, -2.04364013671875, -1.912384033203125, -1.7811279296875, -1.649871826171875, -1.51861572265625, -1.387359619140625, -1.256103515625, -1.124847412109375, -0.99359130859375, -0.862335205078125, -0.7310791015625, -0.599822998046875, -0.46856689453125, -0.337310791015625, -0.2060546875, -0.074798583984375, 0.05645751953125, 0.187713623046875, 0.3189697265625, 0.450225830078125, 0.58148193359375, 0.712738037109375, 0.843994140625, 0.975250244140625, 1.10650634765625, 1.237762451171875, 1.3690185546875, 1.500274658203125, 1.63153076171875, 1.762786865234375, 1.89404296875, 2.025299072265625, 2.15655517578125, 2.287811279296875, 2.4190673828125, 2.550323486328125, 2.68157958984375, 2.812835693359375, 2.944091796875, 3.075347900390625, 3.20660400390625, 3.337860107421875, 3.4691162109375, 3.600372314453125, 3.73162841796875, 3.862884521484375, 3.994140625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 10.0, 11.0, 8.0, 6.0, 15.0, 18.0, 11.0, 14.0, 22.0, 31.0, 28.0, 46.0, 44.0, 42.0, 51.0, 43.0, 61.0, 45.0, 57.0, 52.0, 53.0, 40.0, 53.0, 34.0, 34.0, 30.0, 33.0, 25.0, 21.0, 18.0, 11.0, 9.0, 11.0, 7.0, 4.0, 1.0, 7.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87841796875, -0.8538131713867188, -0.8292083740234375, -0.8046035766601562, -0.779998779296875, -0.7553939819335938, -0.7307891845703125, -0.7061843872070312, -0.68157958984375, -0.6569747924804688, -0.6323699951171875, -0.6077651977539062, -0.583160400390625, -0.5585556030273438, -0.5339508056640625, -0.5093460083007812, -0.4847412109375, -0.46013641357421875, -0.4355316162109375, -0.41092681884765625, -0.386322021484375, -0.36171722412109375, -0.3371124267578125, -0.31250762939453125, -0.28790283203125, -0.26329803466796875, -0.2386932373046875, -0.21408843994140625, -0.189483642578125, -0.16487884521484375, -0.1402740478515625, -0.11566925048828125, -0.091064453125, -0.06645965576171875, -0.0418548583984375, -0.01725006103515625, 0.007354736328125, 0.03195953369140625, 0.0565643310546875, 0.08116912841796875, 0.10577392578125, 0.13037872314453125, 0.1549835205078125, 0.17958831787109375, 0.204193115234375, 0.22879791259765625, 0.2534027099609375, 0.27800750732421875, 0.3026123046875, 0.32721710205078125, 0.3518218994140625, 0.37642669677734375, 0.401031494140625, 0.42563629150390625, 0.4502410888671875, 0.47484588623046875, 0.49945068359375, 0.5240554809570312, 0.5486602783203125, 0.5732650756835938, 0.597869873046875, 0.6224746704101562, 0.6470794677734375, 0.6716842651367188, 0.6962890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 7.0, 13.0, 22.0, 20.0, 34.0, 38.0, 54.0, 104.0, 139.0, 207.0, 330.0, 624.0, 1070.0, 1910.0, 3631.0, 7336.0, 14789.0, 33052.0, 81296.0, 247420.0, 1968428.0, 1470468.0, 226670.0, 76238.0, 31741.0, 14174.0, 6593.0, 3389.0, 1834.0, 1035.0, 596.0, 340.0, 236.0, 147.0, 96.0, 57.0, 38.0, 35.0, 23.0, 14.0, 9.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.810546875, -2.710052490234375, -2.60955810546875, -2.509063720703125, -2.4085693359375, -2.308074951171875, -2.20758056640625, -2.107086181640625, -2.006591796875, -1.906097412109375, -1.80560302734375, -1.705108642578125, -1.6046142578125, -1.504119873046875, -1.40362548828125, -1.303131103515625, -1.20263671875, -1.102142333984375, -1.00164794921875, -0.901153564453125, -0.8006591796875, -0.700164794921875, -0.59967041015625, -0.499176025390625, -0.398681640625, -0.298187255859375, -0.19769287109375, -0.097198486328125, 0.0032958984375, 0.103790283203125, 0.20428466796875, 0.304779052734375, 0.4052734375, 0.505767822265625, 0.60626220703125, 0.706756591796875, 0.8072509765625, 0.907745361328125, 1.00823974609375, 1.108734130859375, 1.209228515625, 1.309722900390625, 1.41021728515625, 1.510711669921875, 1.6112060546875, 1.711700439453125, 1.81219482421875, 1.912689208984375, 2.01318359375, 2.113677978515625, 2.21417236328125, 2.314666748046875, 2.4151611328125, 2.515655517578125, 2.61614990234375, 2.716644287109375, 2.817138671875, 2.917633056640625, 3.01812744140625, 3.118621826171875, 3.2191162109375, 3.319610595703125, 3.42010498046875, 3.520599365234375, 3.62109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 7.0, 9.0, 16.0, 26.0, 19.0, 42.0, 34.0, 44.0, 65.0, 116.0, 161.0, 248.0, 494.0, 1203.0, 650.0, 305.0, 186.0, 93.0, 83.0, 64.0, 53.0, 35.0, 32.0, 20.0, 12.0, 13.0, 6.0, 7.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4814453125, -1.4259490966796875, -1.370452880859375, -1.3149566650390625, -1.25946044921875, -1.2039642333984375, -1.148468017578125, -1.0929718017578125, -1.0374755859375, -0.9819793701171875, -0.926483154296875, -0.8709869384765625, -0.81549072265625, -0.7599945068359375, -0.704498291015625, -0.6490020751953125, -0.593505859375, -0.5380096435546875, -0.482513427734375, -0.4270172119140625, -0.37152099609375, -0.3160247802734375, -0.260528564453125, -0.2050323486328125, -0.1495361328125, -0.0940399169921875, -0.038543701171875, 0.0169525146484375, 0.07244873046875, 0.1279449462890625, 0.183441162109375, 0.2389373779296875, 0.29443359375, 0.3499298095703125, 0.405426025390625, 0.4609222412109375, 0.51641845703125, 0.5719146728515625, 0.627410888671875, 0.6829071044921875, 0.7384033203125, 0.7938995361328125, 0.849395751953125, 0.9048919677734375, 0.96038818359375, 1.0158843994140625, 1.071380615234375, 1.1268768310546875, 1.182373046875, 1.2378692626953125, 1.293365478515625, 1.3488616943359375, 1.40435791015625, 1.4598541259765625, 1.515350341796875, 1.5708465576171875, 1.6263427734375, 1.6818389892578125, 1.737335205078125, 1.7928314208984375, 1.84832763671875, 1.9038238525390625, 1.959320068359375, 2.0148162841796875, 2.0703125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 14.0, 10.0, 32.0, 47.0, 105.0, 163.0, 181.0, 165.0, 113.0, 95.0, 40.0, 18.0, 13.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.20398712158203, -18.53911590576172, -17.874244689941406, -17.209373474121094, -16.54450225830078, -15.879631042480469, -15.214759826660156, -14.549888610839844, -13.885017395019531, -13.220146179199219, -12.555274963378906, -11.890403747558594, -11.225532531738281, -10.560661315917969, -9.895790100097656, -9.230918884277344, -8.566047668457031, -7.901176452636719, -7.236305236816406, -6.571434020996094, -5.906562805175781, -5.241691589355469, -4.576820373535156, -3.9119491577148438, -3.2470779418945312, -2.5822067260742188, -1.9173355102539062, -1.2524642944335938, -0.5875930786132812, 0.07727813720703125, 0.7421493530273438, 1.4070205688476562, 2.0718917846679688, 2.7367630004882812, 3.4016342163085938, 4.066505432128906, 4.731376647949219, 5.396247863769531, 6.061119079589844, 6.725990295410156, 7.390861511230469, 8.055732727050781, 8.720603942871094, 9.385475158691406, 10.050346374511719, 10.715217590332031, 11.380088806152344, 12.044960021972656, 12.709831237792969, 13.374702453613281, 14.039573669433594, 14.704444885253906, 15.369316101074219, 16.03418731689453, 16.699058532714844, 17.363929748535156, 18.02880096435547, 18.69367218017578, 19.358543395996094, 20.023414611816406, 20.68828582763672, 21.35315704345703, 22.018028259277344, 22.682899475097656, 23.34777069091797]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 1.0, 1.0, 1.0, 6.0, 6.0, 4.0, 11.0, 12.0, 6.0, 10.0, 14.0, 16.0, 24.0, 22.0, 28.0, 30.0, 28.0, 24.0, 45.0, 35.0, 37.0, 41.0, 37.0, 56.0, 43.0, 51.0, 39.0, 38.0, 49.0, 48.0, 26.0, 34.0, 28.0, 21.0, 32.0, 15.0, 18.0, 13.0, 13.0, 11.0, 6.0, 11.0, 2.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.75253963470459, -7.532620906829834, -7.312702178955078, -7.0927839279174805, -6.872865200042725, -6.652946472167969, -6.433027744293213, -6.213109016418457, -5.993190288543701, -5.773271560668945, -5.5533528327941895, -5.333434104919434, -5.113515853881836, -4.89359712600708, -4.673678398132324, -4.453759670257568, -4.2338409423828125, -4.013922214508057, -3.79400372505188, -3.574084997177124, -3.354166269302368, -3.1342477798461914, -2.9143290519714355, -2.6944103240966797, -2.474492073059082, -2.254573345184326, -2.0346548557281494, -1.8147361278533936, -1.5948173999786377, -1.3748987913131714, -1.154980182647705, -0.9350614547729492, -0.7151427268981934, -0.4952240586280823, -0.2753054201602936, -0.05538678169250488, 0.1645318865776062, 0.3844505548477173, 0.6043691635131836, 0.8242878913879395, 1.0442065000534058, 1.264125108718872, 1.484043836593628, 1.7039624452590942, 1.9238810539245605, 2.1437997817993164, 2.3637185096740723, 2.583637237548828, 2.803555727005005, 3.0234744548797607, 3.2433929443359375, 3.4633116722106934, 3.683230400085449, 3.903149127960205, 4.123067855834961, 4.342986106872559, 4.5629048347473145, 4.78282356262207, 5.002742290496826, 5.222661018371582, 5.44257926940918, 5.6624979972839355, 5.882416725158691, 6.102335453033447, 6.322254180908203]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 6.0, 6.0, 9.0, 9.0, 14.0, 24.0, 32.0, 49.0, 81.0, 115.0, 179.0, 253.0, 435.0, 826.0, 1587.0, 3271.0, 7338.0, 17054.0, 42284.0, 116329.0, 429672.0, 288192.0, 84065.0, 32294.0, 13072.0, 5713.0, 2576.0, 1289.0, 711.0, 415.0, 227.0, 146.0, 86.0, 74.0, 36.0, 17.0, 16.0, 12.0, 12.0, 7.0, 5.0, 4.0, 7.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91015625, -4.76068115234375, -4.6112060546875, -4.46173095703125, -4.312255859375, -4.16278076171875, -4.0133056640625, -3.86383056640625, -3.71435546875, -3.56488037109375, -3.4154052734375, -3.26593017578125, -3.116455078125, -2.96697998046875, -2.8175048828125, -2.66802978515625, -2.5185546875, -2.36907958984375, -2.2196044921875, -2.07012939453125, -1.920654296875, -1.77117919921875, -1.6217041015625, -1.47222900390625, -1.32275390625, -1.17327880859375, -1.0238037109375, -0.87432861328125, -0.724853515625, -0.57537841796875, -0.4259033203125, -0.27642822265625, -0.126953125, 0.02252197265625, 0.1719970703125, 0.32147216796875, 0.470947265625, 0.62042236328125, 0.7698974609375, 0.91937255859375, 1.06884765625, 1.21832275390625, 1.3677978515625, 1.51727294921875, 1.666748046875, 1.81622314453125, 1.9656982421875, 2.11517333984375, 2.2646484375, 2.41412353515625, 2.5635986328125, 2.71307373046875, 2.862548828125, 3.01202392578125, 3.1614990234375, 3.31097412109375, 3.46044921875, 3.60992431640625, 3.7593994140625, 3.90887451171875, 4.058349609375, 4.20782470703125, 4.3572998046875, 4.50677490234375, 4.65625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 10.0, 7.0, 7.0, 11.0, 15.0, 18.0, 19.0, 25.0, 28.0, 36.0, 45.0, 43.0, 46.0, 43.0, 42.0, 54.0, 61.0, 59.0, 55.0, 62.0, 38.0, 31.0, 39.0, 30.0, 36.0, 33.0, 23.0, 18.0, 15.0, 15.0, 10.0, 8.0, 6.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.955078125, -0.9302139282226562, -0.9053497314453125, -0.8804855346679688, -0.855621337890625, -0.8307571411132812, -0.8058929443359375, -0.7810287475585938, -0.75616455078125, -0.7313003540039062, -0.7064361572265625, -0.6815719604492188, -0.656707763671875, -0.6318435668945312, -0.6069793701171875, -0.5821151733398438, -0.5572509765625, -0.5323867797851562, -0.5075225830078125, -0.48265838623046875, -0.457794189453125, -0.43292999267578125, -0.4080657958984375, -0.38320159912109375, -0.35833740234375, -0.33347320556640625, -0.3086090087890625, -0.28374481201171875, -0.258880615234375, -0.23401641845703125, -0.2091522216796875, -0.18428802490234375, -0.159423828125, -0.13455963134765625, -0.1096954345703125, -0.08483123779296875, -0.059967041015625, -0.03510284423828125, -0.0102386474609375, 0.01462554931640625, 0.03948974609375, 0.06435394287109375, 0.0892181396484375, 0.11408233642578125, 0.138946533203125, 0.16381072998046875, 0.1886749267578125, 0.21353912353515625, 0.2384033203125, 0.26326751708984375, 0.2881317138671875, 0.31299591064453125, 0.337860107421875, 0.36272430419921875, 0.3875885009765625, 0.41245269775390625, 0.43731689453125, 0.46218109130859375, 0.4870452880859375, 0.5119094848632812, 0.536773681640625, 0.5616378784179688, 0.5865020751953125, 0.6113662719726562, 0.63623046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 6.0, 7.0, 8.0, 11.0, 9.0, 13.0, 13.0, 25.0, 40.0, 49.0, 68.0, 81.0, 114.0, 172.0, 238.0, 348.0, 565.0, 1096.0, 2460.0, 7032.0, 21928.0, 75023.0, 289630.0, 476598.0, 121252.0, 34142.0, 10503.0, 3596.0, 1471.0, 698.0, 408.0, 279.0, 173.0, 130.0, 94.0, 68.0, 47.0, 48.0, 31.0, 28.0, 21.0, 16.0, 10.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.443359375, -3.311859130859375, -3.18035888671875, -3.048858642578125, -2.9173583984375, -2.785858154296875, -2.65435791015625, -2.522857666015625, -2.391357421875, -2.259857177734375, -2.12835693359375, -1.996856689453125, -1.8653564453125, -1.733856201171875, -1.60235595703125, -1.470855712890625, -1.33935546875, -1.207855224609375, -1.07635498046875, -0.944854736328125, -0.8133544921875, -0.681854248046875, -0.55035400390625, -0.418853759765625, -0.287353515625, -0.155853271484375, -0.02435302734375, 0.107147216796875, 0.2386474609375, 0.370147705078125, 0.50164794921875, 0.633148193359375, 0.7646484375, 0.896148681640625, 1.02764892578125, 1.159149169921875, 1.2906494140625, 1.422149658203125, 1.55364990234375, 1.685150146484375, 1.816650390625, 1.948150634765625, 2.07965087890625, 2.211151123046875, 2.3426513671875, 2.474151611328125, 2.60565185546875, 2.737152099609375, 2.86865234375, 3.000152587890625, 3.13165283203125, 3.263153076171875, 3.3946533203125, 3.526153564453125, 3.65765380859375, 3.789154052734375, 3.920654296875, 4.052154541015625, 4.18365478515625, 4.315155029296875, 4.4466552734375, 4.578155517578125, 4.70965576171875, 4.841156005859375, 4.97265625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 6.0, 7.0, 4.0, 5.0, 14.0, 10.0, 17.0, 17.0, 20.0, 26.0, 18.0, 26.0, 28.0, 32.0, 39.0, 29.0, 35.0, 29.0, 34.0, 46.0, 37.0, 40.0, 42.0, 45.0, 35.0, 44.0, 27.0, 42.0, 30.0, 29.0, 43.0, 19.0, 27.0, 15.0, 18.0, 7.0, 14.0, 6.0, 10.0, 10.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.30859375, -2.227935791015625, -2.14727783203125, -2.066619873046875, -1.9859619140625, -1.905303955078125, -1.82464599609375, -1.743988037109375, -1.663330078125, -1.582672119140625, -1.50201416015625, -1.421356201171875, -1.3406982421875, -1.260040283203125, -1.17938232421875, -1.098724365234375, -1.01806640625, -0.937408447265625, -0.85675048828125, -0.776092529296875, -0.6954345703125, -0.614776611328125, -0.53411865234375, -0.453460693359375, -0.372802734375, -0.292144775390625, -0.21148681640625, -0.130828857421875, -0.0501708984375, 0.030487060546875, 0.11114501953125, 0.191802978515625, 0.2724609375, 0.353118896484375, 0.43377685546875, 0.514434814453125, 0.5950927734375, 0.675750732421875, 0.75640869140625, 0.837066650390625, 0.917724609375, 0.998382568359375, 1.07904052734375, 1.159698486328125, 1.2403564453125, 1.321014404296875, 1.40167236328125, 1.482330322265625, 1.56298828125, 1.643646240234375, 1.72430419921875, 1.804962158203125, 1.8856201171875, 1.966278076171875, 2.04693603515625, 2.127593994140625, 2.208251953125, 2.288909912109375, 2.36956787109375, 2.450225830078125, 2.5308837890625, 2.611541748046875, 2.69219970703125, 2.772857666015625, 2.853515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 2.0, 9.0, 8.0, 10.0, 11.0, 31.0, 19.0, 33.0, 43.0, 56.0, 89.0, 113.0, 173.0, 270.0, 394.0, 686.0, 1222.0, 2349.0, 5340.0, 14366.0, 45327.0, 165083.0, 528799.0, 201674.0, 53898.0, 16646.0, 6065.0, 2463.0, 1285.0, 693.0, 418.0, 310.0, 213.0, 137.0, 90.0, 56.0, 44.0, 30.0, 24.0, 18.0, 10.0, 11.0, 8.0, 7.0, 2.0, 7.0, 5.0, 5.0, 0.0, 1.0, 1.0, 4.0], "bins": [-2.1953125, -2.131805419921875, -2.06829833984375, -2.004791259765625, -1.9412841796875, -1.877777099609375, -1.81427001953125, -1.750762939453125, -1.687255859375, -1.623748779296875, -1.56024169921875, -1.496734619140625, -1.4332275390625, -1.369720458984375, -1.30621337890625, -1.242706298828125, -1.17919921875, -1.115692138671875, -1.05218505859375, -0.988677978515625, -0.9251708984375, -0.861663818359375, -0.79815673828125, -0.734649658203125, -0.671142578125, -0.607635498046875, -0.54412841796875, -0.480621337890625, -0.4171142578125, -0.353607177734375, -0.29010009765625, -0.226593017578125, -0.1630859375, -0.099578857421875, -0.03607177734375, 0.027435302734375, 0.0909423828125, 0.154449462890625, 0.21795654296875, 0.281463623046875, 0.344970703125, 0.408477783203125, 0.47198486328125, 0.535491943359375, 0.5989990234375, 0.662506103515625, 0.72601318359375, 0.789520263671875, 0.85302734375, 0.916534423828125, 0.98004150390625, 1.043548583984375, 1.1070556640625, 1.170562744140625, 1.23406982421875, 1.297576904296875, 1.361083984375, 1.424591064453125, 1.48809814453125, 1.551605224609375, 1.6151123046875, 1.678619384765625, 1.74212646484375, 1.805633544921875, 1.869140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 7.0, 4.0, 6.0, 9.0, 17.0, 17.0, 20.0, 35.0, 48.0, 77.0, 177.0, 215.0, 119.0, 59.0, 39.0, 33.0, 33.0, 22.0, 12.0, 12.0, 6.0, 8.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0005965232849121094, -0.0005809217691421509, -0.0005653202533721924, -0.0005497187376022339, -0.0005341172218322754, -0.0005185157060623169, -0.0005029141902923584, -0.0004873126745223999, -0.0004717111587524414, -0.0004561096429824829, -0.0004405081272125244, -0.0004249066114425659, -0.0004093050956726074, -0.0003937035799026489, -0.00037810206413269043, -0.00036250054836273193, -0.00034689903259277344, -0.00033129751682281494, -0.00031569600105285645, -0.00030009448528289795, -0.00028449296951293945, -0.00026889145374298096, -0.00025328993797302246, -0.00023768842220306396, -0.00022208690643310547, -0.00020648539066314697, -0.00019088387489318848, -0.00017528235912322998, -0.00015968084335327148, -0.000144079327583313, -0.0001284778118133545, -0.000112876296043396, -9.72747802734375e-05, -8.1673264503479e-05, -6.607174873352051e-05, -5.047023296356201e-05, -3.4868717193603516e-05, -1.926720142364502e-05, -3.6656856536865234e-06, 1.1935830116271973e-05, 2.753734588623047e-05, 4.3138861656188965e-05, 5.874037742614746e-05, 7.434189319610596e-05, 8.994340896606445e-05, 0.00010554492473602295, 0.00012114644050598145, 0.00013674795627593994, 0.00015234947204589844, 0.00016795098781585693, 0.00018355250358581543, 0.00019915401935577393, 0.00021475553512573242, 0.00023035705089569092, 0.0002459585666656494, 0.0002615600824356079, 0.0002771615982055664, 0.0002927631139755249, 0.0003083646297454834, 0.0003239661455154419, 0.0003395676612854004, 0.0003551691770553589, 0.0003707706928253174, 0.0003863722085952759, 0.0004019737243652344]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 4.0, 7.0, 9.0, 26.0, 29.0, 51.0, 64.0, 116.0, 174.0, 352.0, 515.0, 1152.0, 2830.0, 10514.0, 58951.0, 552304.0, 366933.0, 42021.0, 7875.0, 2458.0, 968.0, 491.0, 252.0, 165.0, 98.0, 71.0, 47.0, 21.0, 17.0, 8.0, 12.0, 2.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.134765625, -3.018280029296875, -2.90179443359375, -2.785308837890625, -2.6688232421875, -2.552337646484375, -2.43585205078125, -2.319366455078125, -2.202880859375, -2.086395263671875, -1.96990966796875, -1.853424072265625, -1.7369384765625, -1.620452880859375, -1.50396728515625, -1.387481689453125, -1.27099609375, -1.154510498046875, -1.03802490234375, -0.921539306640625, -0.8050537109375, -0.688568115234375, -0.57208251953125, -0.455596923828125, -0.339111328125, -0.222625732421875, -0.10614013671875, 0.010345458984375, 0.1268310546875, 0.243316650390625, 0.35980224609375, 0.476287841796875, 0.5927734375, 0.709259033203125, 0.82574462890625, 0.942230224609375, 1.0587158203125, 1.175201416015625, 1.29168701171875, 1.408172607421875, 1.524658203125, 1.641143798828125, 1.75762939453125, 1.874114990234375, 1.9906005859375, 2.107086181640625, 2.22357177734375, 2.340057373046875, 2.45654296875, 2.573028564453125, 2.68951416015625, 2.805999755859375, 2.9224853515625, 3.038970947265625, 3.15545654296875, 3.271942138671875, 3.388427734375, 3.504913330078125, 3.62139892578125, 3.737884521484375, 3.8543701171875, 3.970855712890625, 4.08734130859375, 4.203826904296875, 4.3203125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 9.0, 3.0, 5.0, 11.0, 11.0, 8.0, 20.0, 11.0, 27.0, 21.0, 22.0, 35.0, 57.0, 64.0, 82.0, 99.0, 91.0, 95.0, 64.0, 47.0, 40.0, 33.0, 22.0, 31.0, 19.0, 17.0, 10.0, 6.0, 8.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.591796875, -1.5433197021484375, -1.494842529296875, -1.4463653564453125, -1.39788818359375, -1.3494110107421875, -1.300933837890625, -1.2524566650390625, -1.2039794921875, -1.1555023193359375, -1.107025146484375, -1.0585479736328125, -1.01007080078125, -0.9615936279296875, -0.913116455078125, -0.8646392822265625, -0.816162109375, -0.7676849365234375, -0.719207763671875, -0.6707305908203125, -0.62225341796875, -0.5737762451171875, -0.525299072265625, -0.4768218994140625, -0.4283447265625, -0.3798675537109375, -0.331390380859375, -0.2829132080078125, -0.23443603515625, -0.1859588623046875, -0.137481689453125, -0.0890045166015625, -0.04052734375, 0.0079498291015625, 0.056427001953125, 0.1049041748046875, 0.15338134765625, 0.2018585205078125, 0.250335693359375, 0.2988128662109375, 0.3472900390625, 0.3957672119140625, 0.444244384765625, 0.4927215576171875, 0.54119873046875, 0.5896759033203125, 0.638153076171875, 0.6866302490234375, 0.735107421875, 0.7835845947265625, 0.832061767578125, 0.8805389404296875, 0.92901611328125, 0.9774932861328125, 1.025970458984375, 1.0744476318359375, 1.1229248046875, 1.1714019775390625, 1.219879150390625, 1.2683563232421875, 1.31683349609375, 1.3653106689453125, 1.413787841796875, 1.4622650146484375, 1.5107421875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 8.0, 5.0, 18.0, 22.0, 29.0, 39.0, 61.0, 73.0, 92.0, 123.0, 118.0, 104.0, 96.0, 76.0, 55.0, 25.0, 27.0, 12.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.383358001708984, -27.580856323242188, -26.778356552124023, -25.97585678100586, -25.173355102539062, -24.370853424072266, -23.5683536529541, -22.765853881835938, -21.96335220336914, -21.160850524902344, -20.35835075378418, -19.555850982666016, -18.75334930419922, -17.950847625732422, -17.148347854614258, -16.345848083496094, -15.543346405029297, -14.740845680236816, -13.938344955444336, -13.135844230651855, -12.333343505859375, -11.530842781066895, -10.728342056274414, -9.925841331481934, -9.123340606689453, -8.320839881896973, -7.518339157104492, -6.715838432312012, -5.913337707519531, -5.110836982727051, -4.30833625793457, -3.50583553314209, -2.7033329010009766, -1.900832176208496, -1.0983314514160156, -0.29583072662353516, 0.5066699981689453, 1.3091707229614258, 2.1116714477539062, 2.9141721725463867, 3.716672897338867, 4.519173622131348, 5.321674346923828, 6.124175071716309, 6.926675796508789, 7.7291765213012695, 8.53167724609375, 9.33417797088623, 10.136678695678711, 10.939179420471191, 11.741680145263672, 12.544180870056152, 13.346681594848633, 14.149182319641113, 14.951683044433594, 15.754183769226074, 16.556684494018555, 17.35918426513672, 18.161685943603516, 18.964187622070312, 19.766687393188477, 20.56918716430664, 21.371688842773438, 22.174190521240234, 22.9766902923584]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 9.0, 5.0, 9.0, 10.0, 14.0, 17.0, 32.0, 28.0, 25.0, 29.0, 38.0, 23.0, 37.0, 40.0, 38.0, 38.0, 34.0, 32.0, 40.0, 46.0, 44.0, 36.0, 34.0, 41.0, 34.0, 30.0, 25.0, 33.0, 28.0, 21.0, 21.0, 22.0, 20.0, 11.0, 10.0, 9.0, 9.0, 5.0, 11.0, 4.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.834770202636719, -12.40081787109375, -11.966865539550781, -11.532912254333496, -11.098959922790527, -10.665007591247559, -10.23105525970459, -9.797101974487305, -9.363149642944336, -8.929197311401367, -8.495244979858398, -8.061291694641113, -7.6273393630981445, -7.193387031555176, -6.759434700012207, -6.32548189163208, -5.891529560089111, -5.457577228546143, -5.023624420166016, -4.589672088623047, -4.15571928024292, -3.721766948699951, -3.2878143787384033, -2.8538618087768555, -2.4199092388153076, -1.9859566688537598, -1.552004098892212, -1.1180516481399536, -0.6840990781784058, -0.25014662742614746, 0.1838059425354004, 0.6177585124969482, 1.051711082458496, 1.485663652420044, 1.9196162223815918, 2.3535685539245605, 2.7875213623046875, 3.2214736938476562, 3.655426263809204, 4.089378833770752, 4.523331642150879, 4.957283973693848, 5.391236782073975, 5.825189113616943, 6.25914192199707, 6.693094253540039, 7.127046585083008, 7.560999393463135, 7.9949517250061035, 8.42890453338623, 8.8628568649292, 9.296809196472168, 9.730761528015137, 10.164714813232422, 10.59866714477539, 11.03261947631836, 11.466571807861328, 11.900524139404297, 12.334476470947266, 12.76842975616455, 13.20238208770752, 13.636334419250488, 14.070286750793457, 14.504240036010742, 14.938192367553711]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 4.0, 7.0, 15.0, 13.0, 15.0, 20.0, 28.0, 35.0, 52.0, 102.0, 178.0, 372.0, 1047.0, 2986.0, 10929.0, 56191.0, 1604114.0, 2443819.0, 58097.0, 11534.0, 3001.0, 965.0, 346.0, 137.0, 74.0, 46.0, 34.0, 26.0, 20.0, 15.0, 12.0, 7.0, 7.0, 1.0, 10.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.6402587890625, -10.327392578125, -10.0145263671875, -9.70166015625, -9.3887939453125, -9.075927734375, -8.7630615234375, -8.4501953125, -8.1373291015625, -7.824462890625, -7.5115966796875, -7.19873046875, -6.8858642578125, -6.572998046875, -6.2601318359375, -5.947265625, -5.6343994140625, -5.321533203125, -5.0086669921875, -4.69580078125, -4.3829345703125, -4.070068359375, -3.7572021484375, -3.4443359375, -3.1314697265625, -2.818603515625, -2.5057373046875, -2.19287109375, -1.8800048828125, -1.567138671875, -1.2542724609375, -0.94140625, -0.6285400390625, -0.315673828125, -0.0028076171875, 0.31005859375, 0.6229248046875, 0.935791015625, 1.2486572265625, 1.5615234375, 1.8743896484375, 2.187255859375, 2.5001220703125, 2.81298828125, 3.1258544921875, 3.438720703125, 3.7515869140625, 4.064453125, 4.3773193359375, 4.690185546875, 5.0030517578125, 5.31591796875, 5.6287841796875, 5.941650390625, 6.2545166015625, 6.5673828125, 6.8802490234375, 7.193115234375, 7.5059814453125, 7.81884765625, 8.1317138671875, 8.444580078125, 8.7574462890625, 9.0703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 11.0, 3.0, 8.0, 11.0, 17.0, 17.0, 15.0, 29.0, 33.0, 39.0, 44.0, 45.0, 39.0, 40.0, 48.0, 41.0, 53.0, 43.0, 43.0, 48.0, 56.0, 37.0, 40.0, 40.0, 29.0, 37.0, 27.0, 18.0, 10.0, 15.0, 14.0, 12.0, 13.0, 6.0, 5.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.92041015625, -0.896636962890625, -0.87286376953125, -0.849090576171875, -0.8253173828125, -0.801544189453125, -0.77777099609375, -0.753997802734375, -0.730224609375, -0.706451416015625, -0.68267822265625, -0.658905029296875, -0.6351318359375, -0.611358642578125, -0.58758544921875, -0.563812255859375, -0.5400390625, -0.516265869140625, -0.49249267578125, -0.468719482421875, -0.4449462890625, -0.421173095703125, -0.39739990234375, -0.373626708984375, -0.349853515625, -0.326080322265625, -0.30230712890625, -0.278533935546875, -0.2547607421875, -0.230987548828125, -0.20721435546875, -0.183441162109375, -0.15966796875, -0.135894775390625, -0.11212158203125, -0.088348388671875, -0.0645751953125, -0.040802001953125, -0.01702880859375, 0.006744384765625, 0.030517578125, 0.054290771484375, 0.07806396484375, 0.101837158203125, 0.1256103515625, 0.149383544921875, 0.17315673828125, 0.196929931640625, 0.220703125, 0.244476318359375, 0.26824951171875, 0.292022705078125, 0.3157958984375, 0.339569091796875, 0.36334228515625, 0.387115478515625, 0.410888671875, 0.434661865234375, 0.45843505859375, 0.482208251953125, 0.5059814453125, 0.529754638671875, 0.55352783203125, 0.577301025390625, 0.60107421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 2.0, 6.0, 5.0, 6.0, 7.0, 11.0, 16.0, 17.0, 24.0, 28.0, 64.0, 87.0, 105.0, 174.0, 294.0, 442.0, 784.0, 1504.0, 3116.0, 7099.0, 18831.0, 60121.0, 281249.0, 3189849.0, 501232.0, 86737.0, 25432.0, 9154.0, 3792.0, 1784.0, 933.0, 497.0, 288.0, 171.0, 128.0, 79.0, 66.0, 39.0, 29.0, 25.0, 18.0, 5.0, 11.0, 5.0, 2.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.13671875, -4.9884033203125, -4.840087890625, -4.6917724609375, -4.54345703125, -4.3951416015625, -4.246826171875, -4.0985107421875, -3.9501953125, -3.8018798828125, -3.653564453125, -3.5052490234375, -3.35693359375, -3.2086181640625, -3.060302734375, -2.9119873046875, -2.763671875, -2.6153564453125, -2.467041015625, -2.3187255859375, -2.17041015625, -2.0220947265625, -1.873779296875, -1.7254638671875, -1.5771484375, -1.4288330078125, -1.280517578125, -1.1322021484375, -0.98388671875, -0.8355712890625, -0.687255859375, -0.5389404296875, -0.390625, -0.2423095703125, -0.093994140625, 0.0543212890625, 0.20263671875, 0.3509521484375, 0.499267578125, 0.6475830078125, 0.7958984375, 0.9442138671875, 1.092529296875, 1.2408447265625, 1.38916015625, 1.5374755859375, 1.685791015625, 1.8341064453125, 1.982421875, 2.1307373046875, 2.279052734375, 2.4273681640625, 2.57568359375, 2.7239990234375, 2.872314453125, 3.0206298828125, 3.1689453125, 3.3172607421875, 3.465576171875, 3.6138916015625, 3.76220703125, 3.9105224609375, 4.058837890625, 4.2071533203125, 4.35546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 6.0, 11.0, 8.0, 10.0, 15.0, 27.0, 29.0, 34.0, 46.0, 70.0, 152.0, 240.0, 517.0, 1509.0, 619.0, 287.0, 160.0, 113.0, 63.0, 44.0, 35.0, 27.0, 15.0, 11.0, 11.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.92578125, -1.8667144775390625, -1.807647705078125, -1.7485809326171875, -1.68951416015625, -1.6304473876953125, -1.571380615234375, -1.5123138427734375, -1.4532470703125, -1.3941802978515625, -1.335113525390625, -1.2760467529296875, -1.21697998046875, -1.1579132080078125, -1.098846435546875, -1.0397796630859375, -0.980712890625, -0.9216461181640625, -0.862579345703125, -0.8035125732421875, -0.74444580078125, -0.6853790283203125, -0.626312255859375, -0.5672454833984375, -0.5081787109375, -0.4491119384765625, -0.390045166015625, -0.3309783935546875, -0.27191162109375, -0.2128448486328125, -0.153778076171875, -0.0947113037109375, -0.03564453125, 0.0234222412109375, 0.082489013671875, 0.1415557861328125, 0.20062255859375, 0.2596893310546875, 0.318756103515625, 0.3778228759765625, 0.4368896484375, 0.4959564208984375, 0.555023193359375, 0.6140899658203125, 0.67315673828125, 0.7322235107421875, 0.791290283203125, 0.8503570556640625, 0.909423828125, 0.9684906005859375, 1.027557373046875, 1.0866241455078125, 1.14569091796875, 1.2047576904296875, 1.263824462890625, 1.3228912353515625, 1.3819580078125, 1.4410247802734375, 1.500091552734375, 1.5591583251953125, 1.61822509765625, 1.6772918701171875, 1.736358642578125, 1.7954254150390625, 1.8544921875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 12.0, 11.0, 22.0, 27.0, 54.0, 71.0, 97.0, 106.0, 108.0, 102.0, 93.0, 90.0, 76.0, 37.0, 39.0, 17.0, 14.0, 8.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.358756065368652, -12.982189178466797, -12.605622291564941, -12.229055404663086, -11.852487564086914, -11.475920677185059, -11.099353790283203, -10.722786903381348, -10.346220016479492, -9.969653129577637, -9.593086242675781, -9.21651840209961, -8.839951515197754, -8.463384628295898, -8.086817741394043, -7.7102508544921875, -7.333683013916016, -6.95711612701416, -6.5805487632751465, -6.203981876373291, -5.827414512634277, -5.450847625732422, -5.074280738830566, -4.697713851928711, -4.321146488189697, -3.9445793628692627, -3.568012237548828, -3.1914453506469727, -2.814878225326538, -2.4383111000061035, -2.061744213104248, -1.6851770877838135, -1.3086109161376953, -0.9320438504219055, -0.5554767847061157, -0.1789097785949707, 0.19765734672546387, 0.5742244720458984, 0.9507913589477539, 1.3273584842681885, 1.703925609588623, 2.0804927349090576, 2.457059860229492, 2.8336267471313477, 3.2101938724517822, 3.586760997772217, 3.9633278846740723, 4.339895248413086, 4.716462135314941, 5.093029022216797, 5.4695963859558105, 5.846163272857666, 6.22273063659668, 6.599297523498535, 6.975864410400391, 7.352431297302246, 7.72899866104126, 8.105566024780273, 8.482132911682129, 8.858699798583984, 9.23526668548584, 9.611833572387695, 9.988401412963867, 10.364968299865723, 10.741535186767578]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 4.0, 9.0, 13.0, 12.0, 17.0, 24.0, 11.0, 12.0, 24.0, 27.0, 19.0, 35.0, 37.0, 44.0, 38.0, 25.0, 40.0, 37.0, 44.0, 46.0, 35.0, 34.0, 46.0, 42.0, 38.0, 35.0, 24.0, 19.0, 23.0, 14.0, 28.0, 14.0, 17.0, 16.0, 9.0, 11.0, 11.0, 5.0, 10.0, 9.0, 8.0, 4.0, 8.0, 3.0, 0.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.032009124755859, -4.871853351593018, -4.711697578430176, -4.551541805267334, -4.391386032104492, -4.23123025894165, -4.071074485778809, -3.910918951034546, -3.750763177871704, -3.5906074047088623, -3.4304516315460205, -3.2702958583831787, -3.110140323638916, -2.949984550476074, -2.7898287773132324, -2.6296730041503906, -2.469517230987549, -2.309361457824707, -2.1492056846618652, -1.989050030708313, -1.8288942575454712, -1.6687384843826294, -1.5085828304290771, -1.3484270572662354, -1.1882712841033936, -1.0281155109405518, -0.8679597973823547, -0.7078040838241577, -0.5476483106613159, -0.3874925374984741, -0.2273368239402771, -0.06718111038208008, 0.09297418594360352, 0.2531299293041229, 0.41328567266464233, 0.5734413862228394, 0.7335971593856812, 0.893752932548523, 1.0539085865020752, 1.214064359664917, 1.3742201328277588, 1.5343759059906006, 1.6945316791534424, 1.8546873331069946, 2.014842987060547, 2.1749987602233887, 2.3351545333862305, 2.4953103065490723, 2.655466079711914, 2.815621852874756, 2.9757776260375977, 3.1359333992004395, 3.2960891723632812, 3.456244945526123, 3.6164004802703857, 3.7765562534332275, 3.9367120265960693, 4.096867561340332, 4.257023334503174, 4.417179107666016, 4.577334880828857, 4.737490653991699, 4.897646427154541, 5.057802200317383, 5.217957973480225]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 5.0, 20.0, 23.0, 41.0, 50.0, 96.0, 132.0, 217.0, 359.0, 626.0, 1131.0, 2165.0, 4524.0, 10060.0, 22579.0, 53820.0, 144422.0, 483586.0, 204193.0, 68064.0, 28656.0, 12441.0, 5544.0, 2630.0, 1352.0, 735.0, 397.0, 236.0, 140.0, 98.0, 63.0, 40.0, 32.0, 26.0, 13.0, 10.0, 6.0, 7.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.94140625, -4.8065185546875, -4.671630859375, -4.5367431640625, -4.40185546875, -4.2669677734375, -4.132080078125, -3.9971923828125, -3.8623046875, -3.7274169921875, -3.592529296875, -3.4576416015625, -3.32275390625, -3.1878662109375, -3.052978515625, -2.9180908203125, -2.783203125, -2.6483154296875, -2.513427734375, -2.3785400390625, -2.24365234375, -2.1087646484375, -1.973876953125, -1.8389892578125, -1.7041015625, -1.5692138671875, -1.434326171875, -1.2994384765625, -1.16455078125, -1.0296630859375, -0.894775390625, -0.7598876953125, -0.625, -0.4901123046875, -0.355224609375, -0.2203369140625, -0.08544921875, 0.0494384765625, 0.184326171875, 0.3192138671875, 0.4541015625, 0.5889892578125, 0.723876953125, 0.8587646484375, 0.99365234375, 1.1285400390625, 1.263427734375, 1.3983154296875, 1.533203125, 1.6680908203125, 1.802978515625, 1.9378662109375, 2.07275390625, 2.2076416015625, 2.342529296875, 2.4774169921875, 2.6123046875, 2.7471923828125, 2.882080078125, 3.0169677734375, 3.15185546875, 3.2867431640625, 3.421630859375, 3.5565185546875, 3.69140625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 7.0, 6.0, 8.0, 5.0, 14.0, 14.0, 18.0, 15.0, 25.0, 34.0, 30.0, 44.0, 40.0, 49.0, 44.0, 35.0, 52.0, 52.0, 49.0, 53.0, 46.0, 53.0, 38.0, 47.0, 35.0, 29.0, 21.0, 24.0, 28.0, 24.0, 15.0, 9.0, 11.0, 7.0, 7.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.91748046875, -0.8926315307617188, -0.8677825927734375, -0.8429336547851562, -0.818084716796875, -0.7932357788085938, -0.7683868408203125, -0.7435379028320312, -0.71868896484375, -0.6938400268554688, -0.6689910888671875, -0.6441421508789062, -0.619293212890625, -0.5944442749023438, -0.5695953369140625, -0.5447463989257812, -0.5198974609375, -0.49504852294921875, -0.4701995849609375, -0.44535064697265625, -0.420501708984375, -0.39565277099609375, -0.3708038330078125, -0.34595489501953125, -0.32110595703125, -0.29625701904296875, -0.2714080810546875, -0.24655914306640625, -0.221710205078125, -0.19686126708984375, -0.1720123291015625, -0.14716339111328125, -0.122314453125, -0.09746551513671875, -0.0726165771484375, -0.04776763916015625, -0.022918701171875, 0.00193023681640625, 0.0267791748046875, 0.05162811279296875, 0.07647705078125, 0.10132598876953125, 0.1261749267578125, 0.15102386474609375, 0.175872802734375, 0.20072174072265625, 0.2255706787109375, 0.25041961669921875, 0.2752685546875, 0.30011749267578125, 0.3249664306640625, 0.34981536865234375, 0.374664306640625, 0.39951324462890625, 0.4243621826171875, 0.44921112060546875, 0.47406005859375, 0.49890899658203125, 0.5237579345703125, 0.5486068725585938, 0.573455810546875, 0.5983047485351562, 0.6231536865234375, 0.6480026245117188, 0.6728515625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 7.0, 4.0, 8.0, 10.0, 19.0, 24.0, 31.0, 40.0, 71.0, 71.0, 132.0, 217.0, 348.0, 627.0, 1316.0, 2737.0, 5690.0, 12325.0, 29132.0, 71253.0, 209367.0, 460719.0, 154270.0, 56817.0, 23625.0, 10245.0, 4682.0, 2229.0, 1061.0, 543.0, 337.0, 196.0, 132.0, 60.0, 49.0, 32.0, 31.0, 29.0, 19.0, 12.0, 6.0, 6.0, 7.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.267578125, -3.169677734375, -3.07177734375, -2.973876953125, -2.8759765625, -2.778076171875, -2.68017578125, -2.582275390625, -2.484375, -2.386474609375, -2.28857421875, -2.190673828125, -2.0927734375, -1.994873046875, -1.89697265625, -1.799072265625, -1.701171875, -1.603271484375, -1.50537109375, -1.407470703125, -1.3095703125, -1.211669921875, -1.11376953125, -1.015869140625, -0.91796875, -0.820068359375, -0.72216796875, -0.624267578125, -0.5263671875, -0.428466796875, -0.33056640625, -0.232666015625, -0.134765625, -0.036865234375, 0.06103515625, 0.158935546875, 0.2568359375, 0.354736328125, 0.45263671875, 0.550537109375, 0.6484375, 0.746337890625, 0.84423828125, 0.942138671875, 1.0400390625, 1.137939453125, 1.23583984375, 1.333740234375, 1.431640625, 1.529541015625, 1.62744140625, 1.725341796875, 1.8232421875, 1.921142578125, 2.01904296875, 2.116943359375, 2.21484375, 2.312744140625, 2.41064453125, 2.508544921875, 2.6064453125, 2.704345703125, 2.80224609375, 2.900146484375, 2.998046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 5.0, 4.0, 11.0, 5.0, 10.0, 19.0, 24.0, 10.0, 28.0, 22.0, 40.0, 34.0, 35.0, 39.0, 50.0, 43.0, 42.0, 53.0, 46.0, 49.0, 49.0, 37.0, 48.0, 29.0, 38.0, 35.0, 36.0, 28.0, 18.0, 19.0, 20.0, 14.0, 10.0, 10.0, 8.0, 9.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.966796875, -2.868255615234375, -2.76971435546875, -2.671173095703125, -2.5726318359375, -2.474090576171875, -2.37554931640625, -2.277008056640625, -2.178466796875, -2.079925537109375, -1.98138427734375, -1.882843017578125, -1.7843017578125, -1.685760498046875, -1.58721923828125, -1.488677978515625, -1.39013671875, -1.291595458984375, -1.19305419921875, -1.094512939453125, -0.9959716796875, -0.897430419921875, -0.79888916015625, -0.700347900390625, -0.601806640625, -0.503265380859375, -0.40472412109375, -0.306182861328125, -0.2076416015625, -0.109100341796875, -0.01055908203125, 0.087982177734375, 0.1865234375, 0.285064697265625, 0.38360595703125, 0.482147216796875, 0.5806884765625, 0.679229736328125, 0.77777099609375, 0.876312255859375, 0.974853515625, 1.073394775390625, 1.17193603515625, 1.270477294921875, 1.3690185546875, 1.467559814453125, 1.56610107421875, 1.664642333984375, 1.76318359375, 1.861724853515625, 1.96026611328125, 2.058807373046875, 2.1573486328125, 2.255889892578125, 2.35443115234375, 2.452972412109375, 2.551513671875, 2.650054931640625, 2.74859619140625, 2.847137451171875, 2.9456787109375, 3.044219970703125, 3.14276123046875, 3.241302490234375, 3.33984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 6.0, 9.0, 7.0, 15.0, 21.0, 22.0, 26.0, 58.0, 98.0, 171.0, 291.0, 585.0, 1416.0, 3615.0, 11328.0, 42348.0, 202293.0, 588810.0, 149580.0, 33189.0, 9181.0, 3117.0, 1172.0, 544.0, 274.0, 144.0, 84.0, 47.0, 36.0, 23.0, 11.0, 12.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.07421875, -2.010223388671875, -1.94622802734375, -1.882232666015625, -1.8182373046875, -1.754241943359375, -1.69024658203125, -1.626251220703125, -1.562255859375, -1.498260498046875, -1.43426513671875, -1.370269775390625, -1.3062744140625, -1.242279052734375, -1.17828369140625, -1.114288330078125, -1.05029296875, -0.986297607421875, -0.92230224609375, -0.858306884765625, -0.7943115234375, -0.730316162109375, -0.66632080078125, -0.602325439453125, -0.538330078125, -0.474334716796875, -0.41033935546875, -0.346343994140625, -0.2823486328125, -0.218353271484375, -0.15435791015625, -0.090362548828125, -0.0263671875, 0.037628173828125, 0.10162353515625, 0.165618896484375, 0.2296142578125, 0.293609619140625, 0.35760498046875, 0.421600341796875, 0.485595703125, 0.549591064453125, 0.61358642578125, 0.677581787109375, 0.7415771484375, 0.805572509765625, 0.86956787109375, 0.933563232421875, 0.99755859375, 1.061553955078125, 1.12554931640625, 1.189544677734375, 1.2535400390625, 1.317535400390625, 1.38153076171875, 1.445526123046875, 1.509521484375, 1.573516845703125, 1.63751220703125, 1.701507568359375, 1.7655029296875, 1.829498291015625, 1.89349365234375, 1.957489013671875, 2.021484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 6.0, 8.0, 15.0, 17.0, 17.0, 29.0, 49.0, 96.0, 209.0, 222.0, 123.0, 67.0, 39.0, 22.0, 17.0, 15.0, 14.0, 5.0, 2.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005578994750976562, -0.0005436614155769348, -0.0005294233560562134, -0.0005151852965354919, -0.0005009472370147705, -0.00048670917749404907, -0.00047247111797332764, -0.0004582330584526062, -0.00044399499893188477, -0.00042975693941116333, -0.0004155188798904419, -0.00040128082036972046, -0.000387042760848999, -0.0003728047013282776, -0.00035856664180755615, -0.0003443285822868347, -0.0003300905227661133, -0.00031585246324539185, -0.0003016144037246704, -0.000287376344203949, -0.00027313828468322754, -0.0002589002251625061, -0.00024466216564178467, -0.00023042410612106323, -0.0002161860466003418, -0.00020194798707962036, -0.00018770992755889893, -0.0001734718680381775, -0.00015923380851745605, -0.00014499574899673462, -0.00013075768947601318, -0.00011651962995529175, -0.00010228157043457031, -8.804351091384888e-05, -7.380545139312744e-05, -5.9567391872406006e-05, -4.532933235168457e-05, -3.1091272830963135e-05, -1.68532133102417e-05, -2.6151537895202637e-06, 1.1622905731201172e-05, 2.5860965251922607e-05, 4.009902477264404e-05, 5.433708429336548e-05, 6.857514381408691e-05, 8.281320333480835e-05, 9.705126285552979e-05, 0.00011128932237625122, 0.00012552738189697266, 0.0001397654414176941, 0.00015400350093841553, 0.00016824156045913696, 0.0001824796199798584, 0.00019671767950057983, 0.00021095573902130127, 0.0002251937985420227, 0.00023943185806274414, 0.0002536699175834656, 0.000267907977104187, 0.00028214603662490845, 0.0002963840961456299, 0.0003106221556663513, 0.00032486021518707275, 0.0003390982747077942, 0.0003533363342285156]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 9.0, 7.0, 13.0, 21.0, 19.0, 31.0, 44.0, 61.0, 97.0, 149.0, 228.0, 324.0, 550.0, 945.0, 1713.0, 3335.0, 7070.0, 16720.0, 42765.0, 121977.0, 377153.0, 313120.0, 99697.0, 35655.0, 13942.0, 6225.0, 2915.0, 1467.0, 844.0, 506.0, 297.0, 207.0, 115.0, 98.0, 66.0, 45.0, 31.0, 18.0, 23.0, 19.0, 8.0, 4.0, 7.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3955078125, -1.3503570556640625, -1.305206298828125, -1.2600555419921875, -1.21490478515625, -1.1697540283203125, -1.124603271484375, -1.0794525146484375, -1.0343017578125, -0.9891510009765625, -0.944000244140625, -0.8988494873046875, -0.85369873046875, -0.8085479736328125, -0.763397216796875, -0.7182464599609375, -0.673095703125, -0.6279449462890625, -0.582794189453125, -0.5376434326171875, -0.49249267578125, -0.4473419189453125, -0.402191162109375, -0.3570404052734375, -0.3118896484375, -0.2667388916015625, -0.221588134765625, -0.1764373779296875, -0.13128662109375, -0.0861358642578125, -0.040985107421875, 0.0041656494140625, 0.04931640625, 0.0944671630859375, 0.139617919921875, 0.1847686767578125, 0.22991943359375, 0.2750701904296875, 0.320220947265625, 0.3653717041015625, 0.4105224609375, 0.4556732177734375, 0.500823974609375, 0.5459747314453125, 0.59112548828125, 0.6362762451171875, 0.681427001953125, 0.7265777587890625, 0.771728515625, 0.8168792724609375, 0.862030029296875, 0.9071807861328125, 0.95233154296875, 0.9974822998046875, 1.042633056640625, 1.0877838134765625, 1.1329345703125, 1.1780853271484375, 1.223236083984375, 1.2683868408203125, 1.31353759765625, 1.3586883544921875, 1.403839111328125, 1.4489898681640625, 1.494140625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 7.0, 4.0, 7.0, 12.0, 6.0, 18.0, 20.0, 15.0, 29.0, 34.0, 38.0, 38.0, 41.0, 55.0, 56.0, 83.0, 93.0, 72.0, 59.0, 48.0, 45.0, 31.0, 27.0, 31.0, 21.0, 30.0, 17.0, 13.0, 12.0, 5.0, 5.0, 6.0, 9.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.259765625, -1.2239227294921875, -1.188079833984375, -1.1522369384765625, -1.11639404296875, -1.0805511474609375, -1.044708251953125, -1.0088653564453125, -0.9730224609375, -0.9371795654296875, -0.901336669921875, -0.8654937744140625, -0.82965087890625, -0.7938079833984375, -0.757965087890625, -0.7221221923828125, -0.686279296875, -0.6504364013671875, -0.614593505859375, -0.5787506103515625, -0.54290771484375, -0.5070648193359375, -0.471221923828125, -0.4353790283203125, -0.3995361328125, -0.3636932373046875, -0.327850341796875, -0.2920074462890625, -0.25616455078125, -0.2203216552734375, -0.184478759765625, -0.1486358642578125, -0.11279296875, -0.0769500732421875, -0.041107177734375, -0.0052642822265625, 0.03057861328125, 0.0664215087890625, 0.102264404296875, 0.1381072998046875, 0.1739501953125, 0.2097930908203125, 0.245635986328125, 0.2814788818359375, 0.31732177734375, 0.3531646728515625, 0.389007568359375, 0.4248504638671875, 0.460693359375, 0.4965362548828125, 0.532379150390625, 0.5682220458984375, 0.60406494140625, 0.6399078369140625, 0.675750732421875, 0.7115936279296875, 0.7474365234375, 0.7832794189453125, 0.819122314453125, 0.8549652099609375, 0.89080810546875, 0.9266510009765625, 0.962493896484375, 0.9983367919921875, 1.0341796875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 30.0, 59.0, 134.0, 207.0, 207.0, 144.0, 116.0, 56.0, 25.0, 12.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.401687622070312, -23.00246810913086, -21.603248596191406, -20.20402717590332, -18.804807662963867, -17.405588150024414, -16.006366729736328, -14.607147216796875, -13.207927703857422, -11.808708190917969, -10.4094877243042, -9.01026725769043, -7.611047744750977, -6.211827754974365, -4.812607765197754, -3.4133872985839844, -2.0141677856445312, -0.6149477958679199, 0.7842721939086914, 2.1834921836853027, 3.582712173461914, 4.981932163238525, 6.381152153015137, 7.780372619628906, 9.17959213256836, 10.578811645507812, 11.978032112121582, 13.377252578735352, 14.776472091674805, 16.175691604614258, 17.574913024902344, 18.974132537841797, 20.37335205078125, 21.772571563720703, 23.171791076660156, 24.571012496948242, 25.970232009887695, 27.36945152282715, 28.768672943115234, 30.167892456054688, 31.56711196899414, 32.966331481933594, 34.36555099487305, 35.7647705078125, 37.16399383544922, 38.56321334838867, 39.962432861328125, 41.36165237426758, 42.76087188720703, 44.160091400146484, 45.55931091308594, 46.95853042602539, 48.357749938964844, 49.75697326660156, 51.156192779541016, 52.55541229248047, 53.95463180541992, 55.353851318359375, 56.75307083129883, 58.15229034423828, 59.551513671875, 60.95073318481445, 62.349952697753906, 63.74917221069336, 65.14839172363281]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 1.0, 5.0, 7.0, 7.0, 10.0, 9.0, 16.0, 14.0, 23.0, 8.0, 18.0, 37.0, 20.0, 22.0, 37.0, 39.0, 46.0, 35.0, 34.0, 44.0, 47.0, 56.0, 26.0, 41.0, 34.0, 45.0, 40.0, 27.0, 38.0, 32.0, 22.0, 22.0, 19.0, 25.0, 17.0, 19.0, 11.0, 6.0, 10.0, 7.0, 10.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.834763526916504, -12.426362037658691, -12.017960548400879, -11.60955810546875, -11.201156616210938, -10.792755126953125, -10.384353637695312, -9.9759521484375, -9.567549705505371, -9.159148216247559, -8.750746726989746, -8.342344284057617, -7.933942794799805, -7.525541305541992, -7.11713981628418, -6.708737850189209, -6.3003363609313965, -5.891934871673584, -5.483532905578613, -5.075131416320801, -4.66672945022583, -4.258327960968018, -3.849926233291626, -3.4415245056152344, -3.0331227779388428, -2.624721050262451, -2.2163193225860596, -1.8079177141189575, -1.399515986442566, -0.9911143779754639, -0.5827126502990723, -0.17431092262268066, 0.23409080505371094, 0.6424925327301025, 1.0508942604064941, 1.4592958688735962, 1.8676975965499878, 2.27609920501709, 2.6845009326934814, 3.092902660369873, 3.5013043880462646, 3.9097061157226562, 4.318107604980469, 4.7265095710754395, 5.134911060333252, 5.543313026428223, 5.951714515686035, 6.360116004943848, 6.768517971038818, 7.176919460296631, 7.585321426391602, 7.993722915649414, 8.402124404907227, 8.810525894165039, 9.218928337097168, 9.62732982635498, 10.035731315612793, 10.444132804870605, 10.852534294128418, 11.260936737060547, 11.66933822631836, 12.077739715576172, 12.486141204833984, 12.894542694091797, 13.302945137023926]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 13.0, 20.0, 29.0, 21.0, 40.0, 66.0, 83.0, 149.0, 188.0, 278.0, 497.0, 805.0, 1432.0, 2720.0, 5951.0, 13761.0, 39175.0, 154765.0, 3353515.0, 501782.0, 77039.0, 23940.0, 9056.0, 4198.0, 2013.0, 1096.0, 595.0, 381.0, 245.0, 132.0, 90.0, 53.0, 45.0, 32.0, 20.0, 16.0, 12.0, 11.0, 9.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9765625, -6.76995849609375, -6.5633544921875, -6.35675048828125, -6.150146484375, -5.94354248046875, -5.7369384765625, -5.53033447265625, -5.32373046875, -5.11712646484375, -4.9105224609375, -4.70391845703125, -4.497314453125, -4.29071044921875, -4.0841064453125, -3.87750244140625, -3.6708984375, -3.46429443359375, -3.2576904296875, -3.05108642578125, -2.844482421875, -2.63787841796875, -2.4312744140625, -2.22467041015625, -2.01806640625, -1.81146240234375, -1.6048583984375, -1.39825439453125, -1.191650390625, -0.98504638671875, -0.7784423828125, -0.57183837890625, -0.365234375, -0.15863037109375, 0.0479736328125, 0.25457763671875, 0.461181640625, 0.66778564453125, 0.8743896484375, 1.08099365234375, 1.28759765625, 1.49420166015625, 1.7008056640625, 1.90740966796875, 2.114013671875, 2.32061767578125, 2.5272216796875, 2.73382568359375, 2.9404296875, 3.14703369140625, 3.3536376953125, 3.56024169921875, 3.766845703125, 3.97344970703125, 4.1800537109375, 4.38665771484375, 4.59326171875, 4.79986572265625, 5.0064697265625, 5.21307373046875, 5.419677734375, 5.62628173828125, 5.8328857421875, 6.03948974609375, 6.24609375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 12.0, 12.0, 16.0, 14.0, 14.0, 16.0, 21.0, 24.0, 26.0, 43.0, 57.0, 36.0, 30.0, 46.0, 50.0, 48.0, 46.0, 51.0, 41.0, 45.0, 48.0, 48.0, 46.0, 33.0, 26.0, 23.0, 28.0, 15.0, 21.0, 15.0, 14.0, 11.0, 2.0, 6.0, 6.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.91552734375, -0.89105224609375, -0.8665771484375, -0.84210205078125, -0.817626953125, -0.79315185546875, -0.7686767578125, -0.74420166015625, -0.7197265625, -0.69525146484375, -0.6707763671875, -0.64630126953125, -0.621826171875, -0.59735107421875, -0.5728759765625, -0.54840087890625, -0.52392578125, -0.49945068359375, -0.4749755859375, -0.45050048828125, -0.426025390625, -0.40155029296875, -0.3770751953125, -0.35260009765625, -0.328125, -0.30364990234375, -0.2791748046875, -0.25469970703125, -0.230224609375, -0.20574951171875, -0.1812744140625, -0.15679931640625, -0.13232421875, -0.10784912109375, -0.0833740234375, -0.05889892578125, -0.034423828125, -0.00994873046875, 0.0145263671875, 0.03900146484375, 0.0634765625, 0.08795166015625, 0.1124267578125, 0.13690185546875, 0.161376953125, 0.18585205078125, 0.2103271484375, 0.23480224609375, 0.25927734375, 0.28375244140625, 0.3082275390625, 0.33270263671875, 0.357177734375, 0.38165283203125, 0.4061279296875, 0.43060302734375, 0.455078125, 0.47955322265625, 0.5040283203125, 0.52850341796875, 0.552978515625, 0.57745361328125, 0.6019287109375, 0.62640380859375, 0.65087890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 7.0, 13.0, 14.0, 26.0, 42.0, 47.0, 91.0, 150.0, 273.0, 497.0, 946.0, 1887.0, 3813.0, 8567.0, 19459.0, 50132.0, 161168.0, 2185521.0, 1525138.0, 153459.0, 48225.0, 18947.0, 8270.0, 3718.0, 1838.0, 905.0, 482.0, 270.0, 135.0, 78.0, 47.0, 37.0, 21.0, 18.0, 6.0, 10.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.638671875, -3.508636474609375, -3.37860107421875, -3.248565673828125, -3.1185302734375, -2.988494873046875, -2.85845947265625, -2.728424072265625, -2.598388671875, -2.468353271484375, -2.33831787109375, -2.208282470703125, -2.0782470703125, -1.948211669921875, -1.81817626953125, -1.688140869140625, -1.55810546875, -1.428070068359375, -1.29803466796875, -1.167999267578125, -1.0379638671875, -0.907928466796875, -0.77789306640625, -0.647857666015625, -0.517822265625, -0.387786865234375, -0.25775146484375, -0.127716064453125, 0.0023193359375, 0.132354736328125, 0.26239013671875, 0.392425537109375, 0.5224609375, 0.652496337890625, 0.78253173828125, 0.912567138671875, 1.0426025390625, 1.172637939453125, 1.30267333984375, 1.432708740234375, 1.562744140625, 1.692779541015625, 1.82281494140625, 1.952850341796875, 2.0828857421875, 2.212921142578125, 2.34295654296875, 2.472991943359375, 2.60302734375, 2.733062744140625, 2.86309814453125, 2.993133544921875, 3.1231689453125, 3.253204345703125, 3.38323974609375, 3.513275146484375, 3.643310546875, 3.773345947265625, 3.90338134765625, 4.033416748046875, 4.1634521484375, 4.293487548828125, 4.42352294921875, 4.553558349609375, 4.68359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 6.0, 3.0, 9.0, 14.0, 16.0, 21.0, 30.0, 36.0, 60.0, 69.0, 109.0, 176.0, 349.0, 1415.0, 928.0, 310.0, 179.0, 88.0, 58.0, 55.0, 33.0, 25.0, 11.0, 17.0, 14.0, 9.0, 5.0, 11.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.658203125, -1.602783203125, -1.54736328125, -1.491943359375, -1.4365234375, -1.381103515625, -1.32568359375, -1.270263671875, -1.21484375, -1.159423828125, -1.10400390625, -1.048583984375, -0.9931640625, -0.937744140625, -0.88232421875, -0.826904296875, -0.771484375, -0.716064453125, -0.66064453125, -0.605224609375, -0.5498046875, -0.494384765625, -0.43896484375, -0.383544921875, -0.328125, -0.272705078125, -0.21728515625, -0.161865234375, -0.1064453125, -0.051025390625, 0.00439453125, 0.059814453125, 0.115234375, 0.170654296875, 0.22607421875, 0.281494140625, 0.3369140625, 0.392333984375, 0.44775390625, 0.503173828125, 0.55859375, 0.614013671875, 0.66943359375, 0.724853515625, 0.7802734375, 0.835693359375, 0.89111328125, 0.946533203125, 1.001953125, 1.057373046875, 1.11279296875, 1.168212890625, 1.2236328125, 1.279052734375, 1.33447265625, 1.389892578125, 1.4453125, 1.500732421875, 1.55615234375, 1.611572265625, 1.6669921875, 1.722412109375, 1.77783203125, 1.833251953125, 1.888671875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 8.0, 7.0, 14.0, 20.0, 49.0, 52.0, 88.0, 133.0, 122.0, 110.0, 110.0, 94.0, 69.0, 41.0, 31.0, 17.0, 16.0, 3.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.941224098205566, -10.575727462768555, -10.210230827331543, -9.844734191894531, -9.47923755645752, -9.113740921020508, -8.748244285583496, -8.382747650146484, -8.017251014709473, -7.651754379272461, -7.286257743835449, -6.9207611083984375, -6.555264472961426, -6.189767837524414, -5.824271202087402, -5.458774566650391, -5.093277931213379, -4.727781295776367, -4.3622846603393555, -3.9967880249023438, -3.631291389465332, -3.2657947540283203, -2.9002981185913086, -2.534801483154297, -2.169304847717285, -1.8038082122802734, -1.4383115768432617, -1.07281494140625, -0.7073183059692383, -0.34182167053222656, 0.023674964904785156, 0.3891716003417969, 0.754669189453125, 1.1201658248901367, 1.4856624603271484, 1.8511590957641602, 2.216655731201172, 2.5821523666381836, 2.9476490020751953, 3.313145637512207, 3.6786422729492188, 4.0441389083862305, 4.409635543823242, 4.775132179260254, 5.140628814697266, 5.506125450134277, 5.871622085571289, 6.237118721008301, 6.6026153564453125, 6.968111991882324, 7.333608627319336, 7.699105262756348, 8.06460189819336, 8.430098533630371, 8.795595169067383, 9.161091804504395, 9.526588439941406, 9.892085075378418, 10.25758171081543, 10.623078346252441, 10.988574981689453, 11.354071617126465, 11.719568252563477, 12.085064888000488, 12.4505615234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 7.0, 9.0, 10.0, 14.0, 19.0, 24.0, 32.0, 41.0, 37.0, 37.0, 39.0, 39.0, 55.0, 58.0, 45.0, 30.0, 50.0, 61.0, 46.0, 52.0, 44.0, 32.0, 37.0, 35.0, 35.0, 29.0, 20.0, 15.0, 15.0, 9.0, 5.0, 11.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.829183578491211, -7.616166591644287, -7.403149127960205, -7.190132141113281, -6.977114677429199, -6.764097690582275, -6.551080703735352, -6.3380632400512695, -6.125046253204346, -5.912029266357422, -5.69901180267334, -5.485994815826416, -5.272977828979492, -5.05996036529541, -4.846943378448486, -4.6339263916015625, -4.4209089279174805, -4.207891941070557, -3.9948744773864746, -3.781857490539551, -3.568840265274048, -3.355823040008545, -3.142806053161621, -2.929788827896118, -2.7167716026306152, -2.5037543773651123, -2.2907371520996094, -2.0777201652526855, -1.8647029399871826, -1.6516857147216797, -1.4386686086654663, -1.225651502609253, -1.01263427734375, -0.7996171116828918, -0.5865999460220337, -0.37358278036117554, -0.16056561470031738, 0.05245161056518555, 0.2654687166213989, 0.4784858226776123, 0.6915030479431152, 0.9045202136039734, 1.1175373792648315, 1.330554485321045, 1.5435717105865479, 1.7565889358520508, 1.9696060419082642, 2.1826231479644775, 2.3956403732299805, 2.6086575984954834, 2.8216748237609863, 3.03469181060791, 3.247709035873413, 3.460726261138916, 3.67374324798584, 3.8867604732513428, 4.099777698516846, 4.3127946853637695, 4.525812149047852, 4.738829135894775, 4.951846122741699, 5.164863586425781, 5.377880573272705, 5.590897560119629, 5.803915023803711]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 13.0, 15.0, 15.0, 27.0, 60.0, 79.0, 155.0, 269.0, 390.0, 705.0, 1215.0, 2376.0, 4786.0, 10146.0, 23351.0, 55005.0, 126989.0, 282772.0, 298065.0, 136768.0, 58620.0, 25175.0, 10829.0, 5049.0, 2489.0, 1357.0, 769.0, 414.0, 260.0, 131.0, 113.0, 60.0, 35.0, 15.0, 14.0, 4.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7578125, -3.62841796875, -3.4990234375, -3.36962890625, -3.240234375, -3.11083984375, -2.9814453125, -2.85205078125, -2.72265625, -2.59326171875, -2.4638671875, -2.33447265625, -2.205078125, -2.07568359375, -1.9462890625, -1.81689453125, -1.6875, -1.55810546875, -1.4287109375, -1.29931640625, -1.169921875, -1.04052734375, -0.9111328125, -0.78173828125, -0.65234375, -0.52294921875, -0.3935546875, -0.26416015625, -0.134765625, -0.00537109375, 0.1240234375, 0.25341796875, 0.3828125, 0.51220703125, 0.6416015625, 0.77099609375, 0.900390625, 1.02978515625, 1.1591796875, 1.28857421875, 1.41796875, 1.54736328125, 1.6767578125, 1.80615234375, 1.935546875, 2.06494140625, 2.1943359375, 2.32373046875, 2.453125, 2.58251953125, 2.7119140625, 2.84130859375, 2.970703125, 3.10009765625, 3.2294921875, 3.35888671875, 3.48828125, 3.61767578125, 3.7470703125, 3.87646484375, 4.005859375, 4.13525390625, 4.2646484375, 4.39404296875, 4.5234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 5.0, 15.0, 10.0, 20.0, 20.0, 24.0, 24.0, 25.0, 36.0, 35.0, 42.0, 36.0, 50.0, 56.0, 34.0, 60.0, 55.0, 51.0, 52.0, 44.0, 35.0, 37.0, 39.0, 32.0, 29.0, 28.0, 22.0, 16.0, 13.0, 13.0, 7.0, 8.0, 7.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9638671875, -0.9376373291015625, -0.911407470703125, -0.8851776123046875, -0.85894775390625, -0.8327178955078125, -0.806488037109375, -0.7802581787109375, -0.7540283203125, -0.7277984619140625, -0.701568603515625, -0.6753387451171875, -0.64910888671875, -0.6228790283203125, -0.596649169921875, -0.5704193115234375, -0.544189453125, -0.5179595947265625, -0.491729736328125, -0.4654998779296875, -0.43927001953125, -0.4130401611328125, -0.386810302734375, -0.3605804443359375, -0.3343505859375, -0.3081207275390625, -0.281890869140625, -0.2556610107421875, -0.22943115234375, -0.2032012939453125, -0.176971435546875, -0.1507415771484375, -0.12451171875, -0.0982818603515625, -0.072052001953125, -0.0458221435546875, -0.01959228515625, 0.0066375732421875, 0.032867431640625, 0.0590972900390625, 0.0853271484375, 0.1115570068359375, 0.137786865234375, 0.1640167236328125, 0.19024658203125, 0.2164764404296875, 0.242706298828125, 0.2689361572265625, 0.295166015625, 0.3213958740234375, 0.347625732421875, 0.3738555908203125, 0.40008544921875, 0.4263153076171875, 0.452545166015625, 0.4787750244140625, 0.5050048828125, 0.5312347412109375, 0.557464599609375, 0.5836944580078125, 0.60992431640625, 0.6361541748046875, 0.662384033203125, 0.6886138916015625, 0.71484375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 7.0, 6.0, 12.0, 11.0, 21.0, 14.0, 25.0, 31.0, 51.0, 60.0, 72.0, 95.0, 141.0, 162.0, 239.0, 309.0, 401.0, 585.0, 1149.0, 2454.0, 7887.0, 30124.0, 119548.0, 401434.0, 348159.0, 98692.0, 24904.0, 6599.0, 2227.0, 1026.0, 575.0, 395.0, 277.0, 206.0, 144.0, 121.0, 93.0, 75.0, 55.0, 40.0, 30.0, 22.0, 22.0, 14.0, 10.0, 13.0, 10.0, 6.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0], "bins": [-4.63671875, -4.50006103515625, -4.3634033203125, -4.22674560546875, -4.090087890625, -3.95343017578125, -3.8167724609375, -3.68011474609375, -3.54345703125, -3.40679931640625, -3.2701416015625, -3.13348388671875, -2.996826171875, -2.86016845703125, -2.7235107421875, -2.58685302734375, -2.4501953125, -2.31353759765625, -2.1768798828125, -2.04022216796875, -1.903564453125, -1.76690673828125, -1.6302490234375, -1.49359130859375, -1.35693359375, -1.22027587890625, -1.0836181640625, -0.94696044921875, -0.810302734375, -0.67364501953125, -0.5369873046875, -0.40032958984375, -0.263671875, -0.12701416015625, 0.0096435546875, 0.14630126953125, 0.282958984375, 0.41961669921875, 0.5562744140625, 0.69293212890625, 0.82958984375, 0.96624755859375, 1.1029052734375, 1.23956298828125, 1.376220703125, 1.51287841796875, 1.6495361328125, 1.78619384765625, 1.9228515625, 2.05950927734375, 2.1961669921875, 2.33282470703125, 2.469482421875, 2.60614013671875, 2.7427978515625, 2.87945556640625, 3.01611328125, 3.15277099609375, 3.2894287109375, 3.42608642578125, 3.562744140625, 3.69940185546875, 3.8360595703125, 3.97271728515625, 4.109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 4.0, 3.0, 7.0, 4.0, 10.0, 11.0, 14.0, 14.0, 13.0, 15.0, 27.0, 21.0, 18.0, 27.0, 21.0, 35.0, 28.0, 35.0, 30.0, 42.0, 37.0, 34.0, 40.0, 46.0, 43.0, 38.0, 30.0, 23.0, 36.0, 25.0, 35.0, 28.0, 25.0, 25.0, 20.0, 16.0, 9.0, 20.0, 15.0, 11.0, 11.0, 10.0, 5.0, 8.0, 6.0, 8.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.69921875, -2.61529541015625, -2.5313720703125, -2.44744873046875, -2.363525390625, -2.27960205078125, -2.1956787109375, -2.11175537109375, -2.02783203125, -1.94390869140625, -1.8599853515625, -1.77606201171875, -1.692138671875, -1.60821533203125, -1.5242919921875, -1.44036865234375, -1.3564453125, -1.27252197265625, -1.1885986328125, -1.10467529296875, -1.020751953125, -0.93682861328125, -0.8529052734375, -0.76898193359375, -0.68505859375, -0.60113525390625, -0.5172119140625, -0.43328857421875, -0.349365234375, -0.26544189453125, -0.1815185546875, -0.09759521484375, -0.013671875, 0.07025146484375, 0.1541748046875, 0.23809814453125, 0.322021484375, 0.40594482421875, 0.4898681640625, 0.57379150390625, 0.65771484375, 0.74163818359375, 0.8255615234375, 0.90948486328125, 0.993408203125, 1.07733154296875, 1.1612548828125, 1.24517822265625, 1.3291015625, 1.41302490234375, 1.4969482421875, 1.58087158203125, 1.664794921875, 1.74871826171875, 1.8326416015625, 1.91656494140625, 2.00048828125, 2.08441162109375, 2.1683349609375, 2.25225830078125, 2.336181640625, 2.42010498046875, 2.5040283203125, 2.58795166015625, 2.671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 7.0, 8.0, 13.0, 20.0, 34.0, 84.0, 150.0, 347.0, 949.0, 3109.0, 12875.0, 75536.0, 542480.0, 352276.0, 48088.0, 9005.0, 2271.0, 736.0, 282.0, 122.0, 66.0, 37.0, 26.0, 13.0, 9.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.447265625, -3.34552001953125, -3.2437744140625, -3.14202880859375, -3.040283203125, -2.93853759765625, -2.8367919921875, -2.73504638671875, -2.63330078125, -2.53155517578125, -2.4298095703125, -2.32806396484375, -2.226318359375, -2.12457275390625, -2.0228271484375, -1.92108154296875, -1.8193359375, -1.71759033203125, -1.6158447265625, -1.51409912109375, -1.412353515625, -1.31060791015625, -1.2088623046875, -1.10711669921875, -1.00537109375, -0.90362548828125, -0.8018798828125, -0.70013427734375, -0.598388671875, -0.49664306640625, -0.3948974609375, -0.29315185546875, -0.19140625, -0.08966064453125, 0.0120849609375, 0.11383056640625, 0.215576171875, 0.31732177734375, 0.4190673828125, 0.52081298828125, 0.62255859375, 0.72430419921875, 0.8260498046875, 0.92779541015625, 1.029541015625, 1.13128662109375, 1.2330322265625, 1.33477783203125, 1.4365234375, 1.53826904296875, 1.6400146484375, 1.74176025390625, 1.843505859375, 1.94525146484375, 2.0469970703125, 2.14874267578125, 2.25048828125, 2.35223388671875, 2.4539794921875, 2.55572509765625, 2.657470703125, 2.75921630859375, 2.8609619140625, 2.96270751953125, 3.064453125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 11.0, 7.0, 12.0, 14.0, 14.0, 24.0, 23.0, 34.0, 50.0, 52.0, 70.0, 115.0, 141.0, 97.0, 68.0, 57.0, 56.0, 41.0, 16.0, 18.0, 18.0, 12.0, 12.0, 9.0, 8.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003597736358642578, -0.0003486238420009613, -0.0003374740481376648, -0.0003263242542743683, -0.0003151744604110718, -0.00030402466654777527, -0.00029287487268447876, -0.00028172507882118225, -0.00027057528495788574, -0.00025942549109458923, -0.0002482756972312927, -0.00023712590336799622, -0.0002259761095046997, -0.0002148263156414032, -0.0002036765217781067, -0.00019252672791481018, -0.00018137693405151367, -0.00017022714018821716, -0.00015907734632492065, -0.00014792755246162415, -0.00013677775859832764, -0.00012562796473503113, -0.00011447817087173462, -0.00010332837700843811, -9.21785831451416e-05, -8.102878928184509e-05, -6.987899541854858e-05, -5.8729201555252075e-05, -4.7579407691955566e-05, -3.642961382865906e-05, -2.527981996536255e-05, -1.413002610206604e-05, -2.9802322387695312e-06, 8.169561624526978e-06, 1.9319355487823486e-05, 3.0469149351119995e-05, 4.1618943214416504e-05, 5.276873707771301e-05, 6.391853094100952e-05, 7.506832480430603e-05, 8.621811866760254e-05, 9.736791253089905e-05, 0.00010851770639419556, 0.00011966750025749207, 0.00013081729412078857, 0.00014196708798408508, 0.0001531168818473816, 0.0001642666757106781, 0.0001754164695739746, 0.00018656626343727112, 0.00019771605730056763, 0.00020886585116386414, 0.00022001564502716064, 0.00023116543889045715, 0.00024231523275375366, 0.00025346502661705017, 0.0002646148204803467, 0.0002757646143436432, 0.0002869144082069397, 0.0002980642020702362, 0.0003092139959335327, 0.0003203637897968292, 0.00033151358366012573, 0.00034266337752342224, 0.00035381317138671875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 2.0, 5.0, 10.0, 18.0, 21.0, 49.0, 61.0, 178.0, 291.0, 579.0, 1510.0, 7453.0, 83461.0, 802126.0, 139032.0, 10368.0, 1938.0, 705.0, 308.0, 188.0, 97.0, 65.0, 35.0, 24.0, 13.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32421875, -4.16156005859375, -3.9989013671875, -3.83624267578125, -3.673583984375, -3.51092529296875, -3.3482666015625, -3.18560791015625, -3.02294921875, -2.86029052734375, -2.6976318359375, -2.53497314453125, -2.372314453125, -2.20965576171875, -2.0469970703125, -1.88433837890625, -1.7216796875, -1.55902099609375, -1.3963623046875, -1.23370361328125, -1.071044921875, -0.90838623046875, -0.7457275390625, -0.58306884765625, -0.42041015625, -0.25775146484375, -0.0950927734375, 0.06756591796875, 0.230224609375, 0.39288330078125, 0.5555419921875, 0.71820068359375, 0.880859375, 1.04351806640625, 1.2061767578125, 1.36883544921875, 1.531494140625, 1.69415283203125, 1.8568115234375, 2.01947021484375, 2.18212890625, 2.34478759765625, 2.5074462890625, 2.67010498046875, 2.832763671875, 2.99542236328125, 3.1580810546875, 3.32073974609375, 3.4833984375, 3.64605712890625, 3.8087158203125, 3.97137451171875, 4.134033203125, 4.29669189453125, 4.4593505859375, 4.62200927734375, 4.78466796875, 4.94732666015625, 5.1099853515625, 5.27264404296875, 5.435302734375, 5.59796142578125, 5.7606201171875, 5.92327880859375, 6.0859375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 12.0, 15.0, 18.0, 23.0, 43.0, 47.0, 79.0, 79.0, 101.0, 134.0, 103.0, 79.0, 74.0, 48.0, 43.0, 25.0, 21.0, 16.0, 7.0, 12.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.712890625, -3.6252593994140625, -3.537628173828125, -3.4499969482421875, -3.36236572265625, -3.2747344970703125, -3.187103271484375, -3.0994720458984375, -3.0118408203125, -2.9242095947265625, -2.836578369140625, -2.7489471435546875, -2.66131591796875, -2.5736846923828125, -2.486053466796875, -2.3984222412109375, -2.310791015625, -2.2231597900390625, -2.135528564453125, -2.0478973388671875, -1.96026611328125, -1.8726348876953125, -1.785003662109375, -1.6973724365234375, -1.6097412109375, -1.5221099853515625, -1.434478759765625, -1.3468475341796875, -1.25921630859375, -1.1715850830078125, -1.083953857421875, -0.9963226318359375, -0.90869140625, -0.8210601806640625, -0.733428955078125, -0.6457977294921875, -0.55816650390625, -0.4705352783203125, -0.382904052734375, -0.2952728271484375, -0.2076416015625, -0.1200103759765625, -0.032379150390625, 0.0552520751953125, 0.14288330078125, 0.2305145263671875, 0.318145751953125, 0.4057769775390625, 0.493408203125, 0.5810394287109375, 0.668670654296875, 0.7563018798828125, 0.84393310546875, 0.9315643310546875, 1.019195556640625, 1.1068267822265625, 1.1944580078125, 1.2820892333984375, 1.369720458984375, 1.4573516845703125, 1.54498291015625, 1.6326141357421875, 1.720245361328125, 1.8078765869140625, 1.8955078125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 15.0, 45.0, 90.0, 143.0, 188.0, 194.0, 135.0, 88.0, 51.0, 27.0, 10.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-77.40587615966797, -75.85062408447266, -74.29537200927734, -72.7401123046875, -71.18486022949219, -69.62960815429688, -68.07435607910156, -66.51910400390625, -64.96385192871094, -63.408599853515625, -61.85334396362305, -60.298091888427734, -58.74283981323242, -57.187583923339844, -55.63233184814453, -54.07707977294922, -52.52182388305664, -50.96657180786133, -49.41131591796875, -47.85606384277344, -46.300811767578125, -44.74555969238281, -43.190303802490234, -41.63505172729492, -40.079795837402344, -38.52454376220703, -36.96928787231445, -35.41403579711914, -33.85878372192383, -32.30352783203125, -30.748275756835938, -29.193023681640625, -27.637771606445312, -26.082517623901367, -24.527265548706055, -22.97201156616211, -21.416759490966797, -19.86150550842285, -18.306251525878906, -16.750999450683594, -15.195745468139648, -13.64049243927002, -12.08523941040039, -10.529985427856445, -8.974732398986816, -7.4194793701171875, -5.864225387573242, -4.308972358703613, -2.7537193298339844, -1.1984660625457764, 0.35678720474243164, 1.9120407104492188, 3.4672937393188477, 5.022546768188477, 6.577800750732422, 8.13305377960205, 9.68830680847168, 11.243559837341309, 12.798812866210938, 14.354066848754883, 15.909319877624512, 17.46457290649414, 19.019826889038086, 20.57508087158203, 22.130332946777344]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 3.0, 9.0, 6.0, 11.0, 14.0, 10.0, 21.0, 14.0, 24.0, 17.0, 25.0, 33.0, 22.0, 36.0, 39.0, 39.0, 36.0, 48.0, 46.0, 47.0, 43.0, 40.0, 48.0, 28.0, 40.0, 27.0, 44.0, 23.0, 39.0, 25.0, 22.0, 17.0, 17.0, 17.0, 13.0, 10.0, 5.0, 6.0, 5.0, 8.0, 2.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.491778373718262, -14.00961971282959, -13.527462005615234, -13.045303344726562, -12.56314468383789, -12.080986022949219, -11.598828315734863, -11.116669654846191, -10.634511947631836, -10.152353286743164, -9.670195579528809, -9.188036918640137, -8.705878257751465, -8.22372055053711, -7.7415618896484375, -7.259403228759766, -6.777244567871094, -6.29508638381958, -5.812927722930908, -5.3307695388793945, -4.848610877990723, -4.366452693939209, -3.8842945098876953, -3.4021360874176025, -2.9199776649475098, -2.437819242477417, -1.9556609392166138, -1.4735026359558105, -0.9913442134857178, -0.509185791015625, -0.027027606964111328, 0.45513081550598145, 0.9372882843017578, 1.4194467067718506, 1.9016050100326538, 2.383763313293457, 2.86592173576355, 3.3480801582336426, 3.8302383422851562, 4.312397003173828, 4.794555187225342, 5.2767133712768555, 5.758872032165527, 6.241030216217041, 6.723188400268555, 7.205347061157227, 7.68750524520874, 8.169663429260254, 8.651822090148926, 9.133980751037598, 9.616138458251953, 10.098297119140625, 10.580455780029297, 11.062614440917969, 11.544772148132324, 12.026930809020996, 12.509088516235352, 12.991247177124023, 13.473404884338379, 13.95556354522705, 14.437722206115723, 14.919879913330078, 15.40203857421875, 15.884197235107422, 16.366355895996094]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 7.0, 5.0, 16.0, 6.0, 14.0, 18.0, 31.0, 63.0, 93.0, 138.0, 215.0, 380.0, 615.0, 1164.0, 2210.0, 4621.0, 10457.0, 27132.0, 80971.0, 356018.0, 3137388.0, 428415.0, 92200.0, 30137.0, 11760.0, 5063.0, 2437.0, 1170.0, 609.0, 386.0, 221.0, 123.0, 84.0, 49.0, 25.0, 12.0, 9.0, 10.0, 7.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.4140625, -5.26593017578125, -5.1177978515625, -4.96966552734375, -4.821533203125, -4.67340087890625, -4.5252685546875, -4.37713623046875, -4.22900390625, -4.08087158203125, -3.9327392578125, -3.78460693359375, -3.636474609375, -3.48834228515625, -3.3402099609375, -3.19207763671875, -3.0439453125, -2.89581298828125, -2.7476806640625, -2.59954833984375, -2.451416015625, -2.30328369140625, -2.1551513671875, -2.00701904296875, -1.85888671875, -1.71075439453125, -1.5626220703125, -1.41448974609375, -1.266357421875, -1.11822509765625, -0.9700927734375, -0.82196044921875, -0.673828125, -0.52569580078125, -0.3775634765625, -0.22943115234375, -0.081298828125, 0.06683349609375, 0.2149658203125, 0.36309814453125, 0.51123046875, 0.65936279296875, 0.8074951171875, 0.95562744140625, 1.103759765625, 1.25189208984375, 1.4000244140625, 1.54815673828125, 1.6962890625, 1.84442138671875, 1.9925537109375, 2.14068603515625, 2.288818359375, 2.43695068359375, 2.5850830078125, 2.73321533203125, 2.88134765625, 3.02947998046875, 3.1776123046875, 3.32574462890625, 3.473876953125, 3.62200927734375, 3.7701416015625, 3.91827392578125, 4.06640625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 8.0, 6.0, 7.0, 14.0, 25.0, 19.0, 30.0, 24.0, 29.0, 45.0, 36.0, 45.0, 38.0, 49.0, 51.0, 42.0, 52.0, 49.0, 59.0, 42.0, 44.0, 43.0, 39.0, 33.0, 26.0, 35.0, 22.0, 17.0, 12.0, 13.0, 7.0, 12.0, 7.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.98486328125, -0.9590682983398438, -0.9332733154296875, -0.9074783325195312, -0.881683349609375, -0.8558883666992188, -0.8300933837890625, -0.8042984008789062, -0.77850341796875, -0.7527084350585938, -0.7269134521484375, -0.7011184692382812, -0.675323486328125, -0.6495285034179688, -0.6237335205078125, -0.5979385375976562, -0.5721435546875, -0.5463485717773438, -0.5205535888671875, -0.49475860595703125, -0.468963623046875, -0.44316864013671875, -0.4173736572265625, -0.39157867431640625, -0.36578369140625, -0.33998870849609375, -0.3141937255859375, -0.28839874267578125, -0.262603759765625, -0.23680877685546875, -0.2110137939453125, -0.18521881103515625, -0.159423828125, -0.13362884521484375, -0.1078338623046875, -0.08203887939453125, -0.056243896484375, -0.03044891357421875, -0.0046539306640625, 0.02114105224609375, 0.04693603515625, 0.07273101806640625, 0.0985260009765625, 0.12432098388671875, 0.150115966796875, 0.17591094970703125, 0.2017059326171875, 0.22750091552734375, 0.2532958984375, 0.27909088134765625, 0.3048858642578125, 0.33068084716796875, 0.356475830078125, 0.38227081298828125, 0.4080657958984375, 0.43386077880859375, 0.45965576171875, 0.48545074462890625, 0.5112457275390625, 0.5370407104492188, 0.562835693359375, 0.5886306762695312, 0.6144256591796875, 0.6402206420898438, 0.666015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 11.0, 4.0, 4.0, 10.0, 11.0, 6.0, 22.0, 32.0, 31.0, 56.0, 101.0, 127.0, 241.0, 365.0, 586.0, 937.0, 1701.0, 3035.0, 5711.0, 11309.0, 23028.0, 50178.0, 124389.0, 393808.0, 2395041.0, 834677.0, 206992.0, 75928.0, 32903.0, 15526.0, 7856.0, 4239.0, 2219.0, 1232.0, 744.0, 464.0, 250.0, 156.0, 118.0, 76.0, 51.0, 32.0, 19.0, 13.0, 9.0, 13.0, 11.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.580078125, -2.493316650390625, -2.40655517578125, -2.319793701171875, -2.2330322265625, -2.146270751953125, -2.05950927734375, -1.972747802734375, -1.885986328125, -1.799224853515625, -1.71246337890625, -1.625701904296875, -1.5389404296875, -1.452178955078125, -1.36541748046875, -1.278656005859375, -1.19189453125, -1.105133056640625, -1.01837158203125, -0.931610107421875, -0.8448486328125, -0.758087158203125, -0.67132568359375, -0.584564208984375, -0.497802734375, -0.411041259765625, -0.32427978515625, -0.237518310546875, -0.1507568359375, -0.063995361328125, 0.02276611328125, 0.109527587890625, 0.1962890625, 0.283050537109375, 0.36981201171875, 0.456573486328125, 0.5433349609375, 0.630096435546875, 0.71685791015625, 0.803619384765625, 0.890380859375, 0.977142333984375, 1.06390380859375, 1.150665283203125, 1.2374267578125, 1.324188232421875, 1.41094970703125, 1.497711181640625, 1.58447265625, 1.671234130859375, 1.75799560546875, 1.844757080078125, 1.9315185546875, 2.018280029296875, 2.10504150390625, 2.191802978515625, 2.278564453125, 2.365325927734375, 2.45208740234375, 2.538848876953125, 2.6256103515625, 2.712371826171875, 2.79913330078125, 2.885894775390625, 2.97265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 8.0, 3.0, 9.0, 10.0, 21.0, 22.0, 25.0, 38.0, 37.0, 81.0, 88.0, 121.0, 192.0, 340.0, 608.0, 1155.0, 472.0, 259.0, 129.0, 141.0, 81.0, 70.0, 44.0, 34.0, 21.0, 17.0, 12.0, 11.0, 11.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.9970703125, -1.9354095458984375, -1.873748779296875, -1.8120880126953125, -1.75042724609375, -1.6887664794921875, -1.627105712890625, -1.5654449462890625, -1.5037841796875, -1.4421234130859375, -1.380462646484375, -1.3188018798828125, -1.25714111328125, -1.1954803466796875, -1.133819580078125, -1.0721588134765625, -1.010498046875, -0.9488372802734375, -0.887176513671875, -0.8255157470703125, -0.76385498046875, -0.7021942138671875, -0.640533447265625, -0.5788726806640625, -0.5172119140625, -0.4555511474609375, -0.393890380859375, -0.3322296142578125, -0.27056884765625, -0.2089080810546875, -0.147247314453125, -0.0855865478515625, -0.02392578125, 0.0377349853515625, 0.099395751953125, 0.1610565185546875, 0.22271728515625, 0.2843780517578125, 0.346038818359375, 0.4076995849609375, 0.4693603515625, 0.5310211181640625, 0.592681884765625, 0.6543426513671875, 0.71600341796875, 0.7776641845703125, 0.839324951171875, 0.9009857177734375, 0.962646484375, 1.0243072509765625, 1.085968017578125, 1.1476287841796875, 1.20928955078125, 1.2709503173828125, 1.332611083984375, 1.3942718505859375, 1.4559326171875, 1.5175933837890625, 1.579254150390625, 1.6409149169921875, 1.70257568359375, 1.7642364501953125, 1.825897216796875, 1.8875579833984375, 1.94921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 16.0, 19.0, 23.0, 33.0, 54.0, 87.0, 84.0, 119.0, 125.0, 85.0, 100.0, 77.0, 55.0, 32.0, 30.0, 19.0, 11.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.284547805786133, -17.84395980834961, -17.40337371826172, -16.962785720825195, -16.522197723388672, -16.08161163330078, -15.641023635864258, -15.200435638427734, -14.759848594665527, -14.31926155090332, -13.878673553466797, -13.43808650970459, -12.997499465942383, -12.55691146850586, -12.116324424743652, -11.675737380981445, -11.235149383544922, -10.794562339782715, -10.353974342346191, -9.913387298583984, -9.472800254821777, -9.032212257385254, -8.591625213623047, -8.151037216186523, -7.710451126098633, -7.269863605499268, -6.8292765617370605, -6.388689041137695, -5.94810152053833, -5.507513999938965, -5.066926956176758, -4.626339435577393, -4.185751914978027, -3.745164632797241, -3.304577112197876, -2.86398983001709, -2.4234023094177246, -1.9828150272369385, -1.5422277450561523, -1.101640224456787, -0.661052942276001, -0.22046557068824768, 0.22012180089950562, 0.6607091426849365, 1.1012965440750122, 1.541883945465088, 1.982471227645874, 2.4230587482452393, 2.8636460304260254, 3.3042333126068115, 3.7448208332061768, 4.185408115386963, 4.625995635986328, 5.066582679748535, 5.5071702003479, 5.947757720947266, 6.388344764709473, 6.828932285308838, 7.269519329071045, 7.71010684967041, 8.150693893432617, 8.59128189086914, 9.031868934631348, 9.472455978393555, 9.913043975830078]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 10.0, 16.0, 14.0, 14.0, 25.0, 32.0, 20.0, 23.0, 29.0, 40.0, 28.0, 41.0, 29.0, 43.0, 40.0, 43.0, 41.0, 45.0, 54.0, 35.0, 36.0, 27.0, 34.0, 34.0, 29.0, 38.0, 34.0, 13.0, 21.0, 16.0, 16.0, 14.0, 13.0, 7.0, 8.0, 8.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.650493621826172, -7.420549392700195, -7.190605640411377, -6.9606614112854, -6.730717658996582, -6.5007734298706055, -6.270829200744629, -6.0408854484558105, -5.810941219329834, -5.580996990203857, -5.351053237915039, -5.1211090087890625, -4.891165256500244, -4.661221027374268, -4.431277275085449, -4.201333045959473, -3.971389055252075, -3.7414450645446777, -3.5115010738372803, -3.281557083129883, -3.0516128540039062, -2.821668863296509, -2.5917248725891113, -2.3617806434631348, -2.1318368911743164, -1.901892900466919, -1.671948790550232, -1.4420047998428345, -1.2120606899261475, -0.98211669921875, -0.7521727085113525, -0.5222285985946655, -0.2922844886779785, -0.06234045326709747, 0.16760358214378357, 0.3975476026535034, 0.6274916529655457, 0.8574357032775879, 1.0873796939849854, 1.3173238039016724, 1.5472677946090698, 1.7772117853164673, 2.0071558952331543, 2.2370998859405518, 2.467043876647949, 2.696988105773926, 2.926931858062744, 3.1568760871887207, 3.386820077896118, 3.6167640686035156, 3.846708059310913, 4.0766520500183105, 4.306596279144287, 4.5365400314331055, 4.766484260559082, 4.996428489685059, 5.226372241973877, 5.4563164710998535, 5.686260223388672, 5.916204452514648, 6.146148204803467, 6.376092433929443, 6.606036186218262, 6.835980415344238, 7.065924644470215]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 12.0, 12.0, 14.0, 16.0, 28.0, 38.0, 63.0, 69.0, 115.0, 147.0, 253.0, 374.0, 572.0, 893.0, 1452.0, 2294.0, 3889.0, 6867.0, 12672.0, 23852.0, 46673.0, 92229.0, 166855.0, 233197.0, 202409.0, 120829.0, 63017.0, 31883.0, 16504.0, 8776.0, 4888.0, 2880.0, 1685.0, 1069.0, 691.0, 404.0, 296.0, 192.0, 154.0, 80.0, 64.0, 31.0, 35.0, 24.0, 14.0, 17.0, 5.0, 4.0, 8.0, 2.0, 1.0, 5.0], "bins": [-2.94921875, -2.86663818359375, -2.7840576171875, -2.70147705078125, -2.618896484375, -2.53631591796875, -2.4537353515625, -2.37115478515625, -2.28857421875, -2.20599365234375, -2.1234130859375, -2.04083251953125, -1.958251953125, -1.87567138671875, -1.7930908203125, -1.71051025390625, -1.6279296875, -1.54534912109375, -1.4627685546875, -1.38018798828125, -1.297607421875, -1.21502685546875, -1.1324462890625, -1.04986572265625, -0.96728515625, -0.88470458984375, -0.8021240234375, -0.71954345703125, -0.636962890625, -0.55438232421875, -0.4718017578125, -0.38922119140625, -0.306640625, -0.22406005859375, -0.1414794921875, -0.05889892578125, 0.023681640625, 0.10626220703125, 0.1888427734375, 0.27142333984375, 0.35400390625, 0.43658447265625, 0.5191650390625, 0.60174560546875, 0.684326171875, 0.76690673828125, 0.8494873046875, 0.93206787109375, 1.0146484375, 1.09722900390625, 1.1798095703125, 1.26239013671875, 1.344970703125, 1.42755126953125, 1.5101318359375, 1.59271240234375, 1.67529296875, 1.75787353515625, 1.8404541015625, 1.92303466796875, 2.005615234375, 2.08819580078125, 2.1707763671875, 2.25335693359375, 2.3359375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 11.0, 8.0, 6.0, 10.0, 25.0, 16.0, 21.0, 34.0, 25.0, 33.0, 40.0, 33.0, 55.0, 48.0, 44.0, 50.0, 47.0, 51.0, 49.0, 37.0, 50.0, 40.0, 44.0, 39.0, 39.0, 27.0, 25.0, 20.0, 16.0, 13.0, 9.0, 12.0, 8.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.037109375, -1.0096511840820312, -0.9821929931640625, -0.9547348022460938, -0.927276611328125, -0.8998184204101562, -0.8723602294921875, -0.8449020385742188, -0.81744384765625, -0.7899856567382812, -0.7625274658203125, -0.7350692749023438, -0.707611083984375, -0.6801528930664062, -0.6526947021484375, -0.6252365112304688, -0.5977783203125, -0.5703201293945312, -0.5428619384765625, -0.5154037475585938, -0.487945556640625, -0.46048736572265625, -0.4330291748046875, -0.40557098388671875, -0.37811279296875, -0.35065460205078125, -0.3231964111328125, -0.29573822021484375, -0.268280029296875, -0.24082183837890625, -0.2133636474609375, -0.18590545654296875, -0.158447265625, -0.13098907470703125, -0.1035308837890625, -0.07607269287109375, -0.048614501953125, -0.02115631103515625, 0.0063018798828125, 0.03376007080078125, 0.06121826171875, 0.08867645263671875, 0.1161346435546875, 0.14359283447265625, 0.171051025390625, 0.19850921630859375, 0.2259674072265625, 0.25342559814453125, 0.2808837890625, 0.30834197998046875, 0.3358001708984375, 0.36325836181640625, 0.390716552734375, 0.41817474365234375, 0.4456329345703125, 0.47309112548828125, 0.50054931640625, 0.5280075073242188, 0.5554656982421875, 0.5829238891601562, 0.610382080078125, 0.6378402709960938, 0.6652984619140625, 0.6927566528320312, 0.72021484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 11.0, 25.0, 21.0, 28.0, 38.0, 51.0, 62.0, 99.0, 157.0, 216.0, 276.0, 421.0, 638.0, 1212.0, 3435.0, 16036.0, 115001.0, 605115.0, 261858.0, 33715.0, 5958.0, 1748.0, 821.0, 509.0, 312.0, 209.0, 175.0, 108.0, 81.0, 58.0, 42.0, 34.0, 23.0, 16.0, 10.0, 9.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.5703125, -6.363037109375, -6.15576171875, -5.948486328125, -5.7412109375, -5.533935546875, -5.32666015625, -5.119384765625, -4.912109375, -4.704833984375, -4.49755859375, -4.290283203125, -4.0830078125, -3.875732421875, -3.66845703125, -3.461181640625, -3.25390625, -3.046630859375, -2.83935546875, -2.632080078125, -2.4248046875, -2.217529296875, -2.01025390625, -1.802978515625, -1.595703125, -1.388427734375, -1.18115234375, -0.973876953125, -0.7666015625, -0.559326171875, -0.35205078125, -0.144775390625, 0.0625, 0.269775390625, 0.47705078125, 0.684326171875, 0.8916015625, 1.098876953125, 1.30615234375, 1.513427734375, 1.720703125, 1.927978515625, 2.13525390625, 2.342529296875, 2.5498046875, 2.757080078125, 2.96435546875, 3.171630859375, 3.37890625, 3.586181640625, 3.79345703125, 4.000732421875, 4.2080078125, 4.415283203125, 4.62255859375, 4.829833984375, 5.037109375, 5.244384765625, 5.45166015625, 5.658935546875, 5.8662109375, 6.073486328125, 6.28076171875, 6.488037109375, 6.6953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 3.0, 8.0, 4.0, 5.0, 10.0, 9.0, 16.0, 21.0, 14.0, 9.0, 30.0, 22.0, 30.0, 33.0, 36.0, 47.0, 35.0, 35.0, 48.0, 40.0, 52.0, 39.0, 54.0, 51.0, 38.0, 34.0, 47.0, 34.0, 32.0, 25.0, 26.0, 31.0, 11.0, 8.0, 18.0, 9.0, 14.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.515625, -3.399932861328125, -3.28424072265625, -3.168548583984375, -3.0528564453125, -2.937164306640625, -2.82147216796875, -2.705780029296875, -2.590087890625, -2.474395751953125, -2.35870361328125, -2.243011474609375, -2.1273193359375, -2.011627197265625, -1.89593505859375, -1.780242919921875, -1.66455078125, -1.548858642578125, -1.43316650390625, -1.317474365234375, -1.2017822265625, -1.086090087890625, -0.97039794921875, -0.854705810546875, -0.739013671875, -0.623321533203125, -0.50762939453125, -0.391937255859375, -0.2762451171875, -0.160552978515625, -0.04486083984375, 0.070831298828125, 0.1865234375, 0.302215576171875, 0.41790771484375, 0.533599853515625, 0.6492919921875, 0.764984130859375, 0.88067626953125, 0.996368408203125, 1.112060546875, 1.227752685546875, 1.34344482421875, 1.459136962890625, 1.5748291015625, 1.690521240234375, 1.80621337890625, 1.921905517578125, 2.03759765625, 2.153289794921875, 2.26898193359375, 2.384674072265625, 2.5003662109375, 2.616058349609375, 2.73175048828125, 2.847442626953125, 2.963134765625, 3.078826904296875, 3.19451904296875, 3.310211181640625, 3.4259033203125, 3.541595458984375, 3.65728759765625, 3.772979736328125, 3.888671875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 11.0, 16.0, 26.0, 33.0, 40.0, 91.0, 138.0, 245.0, 524.0, 1373.0, 4625.0, 19471.0, 103487.0, 440109.0, 375860.0, 80921.0, 15568.0, 3653.0, 1248.0, 479.0, 269.0, 125.0, 73.0, 51.0, 29.0, 18.0, 8.0, 11.0, 9.0, 9.0, 5.0, 2.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.5, -2.424072265625, -2.34814453125, -2.272216796875, -2.1962890625, -2.120361328125, -2.04443359375, -1.968505859375, -1.892578125, -1.816650390625, -1.74072265625, -1.664794921875, -1.5888671875, -1.512939453125, -1.43701171875, -1.361083984375, -1.28515625, -1.209228515625, -1.13330078125, -1.057373046875, -0.9814453125, -0.905517578125, -0.82958984375, -0.753662109375, -0.677734375, -0.601806640625, -0.52587890625, -0.449951171875, -0.3740234375, -0.298095703125, -0.22216796875, -0.146240234375, -0.0703125, 0.005615234375, 0.08154296875, 0.157470703125, 0.2333984375, 0.309326171875, 0.38525390625, 0.461181640625, 0.537109375, 0.613037109375, 0.68896484375, 0.764892578125, 0.8408203125, 0.916748046875, 0.99267578125, 1.068603515625, 1.14453125, 1.220458984375, 1.29638671875, 1.372314453125, 1.4482421875, 1.524169921875, 1.60009765625, 1.676025390625, 1.751953125, 1.827880859375, 1.90380859375, 1.979736328125, 2.0556640625, 2.131591796875, 2.20751953125, 2.283447265625, 2.359375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 8.0, 8.0, 7.0, 8.0, 8.0, 8.0, 14.0, 22.0, 37.0, 33.0, 31.0, 45.0, 48.0, 54.0, 44.0, 79.0, 75.0, 62.0, 66.0, 44.0, 43.0, 37.0, 42.0, 27.0, 14.0, 22.0, 23.0, 14.0, 22.0, 8.0, 12.0, 6.0, 7.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002522468566894531, -0.0002439543604850769, -0.00023566186428070068, -0.00022736936807632446, -0.00021907687187194824, -0.00021078437566757202, -0.0002024918794631958, -0.00019419938325881958, -0.00018590688705444336, -0.00017761439085006714, -0.00016932189464569092, -0.0001610293984413147, -0.00015273690223693848, -0.00014444440603256226, -0.00013615190982818604, -0.00012785941362380981, -0.0001195669174194336, -0.00011127442121505737, -0.00010298192501068115, -9.468942880630493e-05, -8.639693260192871e-05, -7.810443639755249e-05, -6.981194019317627e-05, -6.151944398880005e-05, -5.322694778442383e-05, -4.493445158004761e-05, -3.664195537567139e-05, -2.8349459171295166e-05, -2.0056962966918945e-05, -1.1764466762542725e-05, -3.471970558166504e-06, 4.820525646209717e-06, 1.3113021850585938e-05, 2.1405518054962158e-05, 2.969801425933838e-05, 3.79905104637146e-05, 4.628300666809082e-05, 5.457550287246704e-05, 6.286799907684326e-05, 7.116049528121948e-05, 7.94529914855957e-05, 8.774548768997192e-05, 9.603798389434814e-05, 0.00010433048009872437, 0.00011262297630310059, 0.0001209154725074768, 0.00012920796871185303, 0.00013750046491622925, 0.00014579296112060547, 0.0001540854573249817, 0.0001623779535293579, 0.00017067044973373413, 0.00017896294593811035, 0.00018725544214248657, 0.0001955479383468628, 0.00020384043455123901, 0.00021213293075561523, 0.00022042542695999146, 0.00022871792316436768, 0.0002370104193687439, 0.0002453029155731201, 0.00025359541177749634, 0.00026188790798187256, 0.0002701804041862488, 0.000278472900390625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 3.0, 8.0, 13.0, 24.0, 25.0, 38.0, 58.0, 89.0, 132.0, 198.0, 318.0, 605.0, 1206.0, 3050.0, 12633.0, 90787.0, 499662.0, 370947.0, 55511.0, 8559.0, 2289.0, 1010.0, 532.0, 315.0, 182.0, 113.0, 78.0, 52.0, 33.0, 22.0, 13.0, 9.0, 8.0, 1.0, 7.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.85546875, -2.765899658203125, -2.67633056640625, -2.586761474609375, -2.4971923828125, -2.407623291015625, -2.31805419921875, -2.228485107421875, -2.138916015625, -2.049346923828125, -1.95977783203125, -1.870208740234375, -1.7806396484375, -1.691070556640625, -1.60150146484375, -1.511932373046875, -1.42236328125, -1.332794189453125, -1.24322509765625, -1.153656005859375, -1.0640869140625, -0.974517822265625, -0.88494873046875, -0.795379638671875, -0.705810546875, -0.616241455078125, -0.52667236328125, -0.437103271484375, -0.3475341796875, -0.257965087890625, -0.16839599609375, -0.078826904296875, 0.0107421875, 0.100311279296875, 0.18988037109375, 0.279449462890625, 0.3690185546875, 0.458587646484375, 0.54815673828125, 0.637725830078125, 0.727294921875, 0.816864013671875, 0.90643310546875, 0.996002197265625, 1.0855712890625, 1.175140380859375, 1.26470947265625, 1.354278564453125, 1.44384765625, 1.533416748046875, 1.62298583984375, 1.712554931640625, 1.8021240234375, 1.891693115234375, 1.98126220703125, 2.070831298828125, 2.160400390625, 2.249969482421875, 2.33953857421875, 2.429107666015625, 2.5186767578125, 2.608245849609375, 2.69781494140625, 2.787384033203125, 2.876953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 10.0, 16.0, 20.0, 29.0, 34.0, 44.0, 65.0, 45.0, 66.0, 92.0, 95.0, 87.0, 75.0, 65.0, 63.0, 40.0, 39.0, 30.0, 24.0, 20.0, 12.0, 13.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3994140625, -1.3372344970703125, -1.275054931640625, -1.2128753662109375, -1.15069580078125, -1.0885162353515625, -1.026336669921875, -0.9641571044921875, -0.9019775390625, -0.8397979736328125, -0.777618408203125, -0.7154388427734375, -0.65325927734375, -0.5910797119140625, -0.528900146484375, -0.4667205810546875, -0.404541015625, -0.3423614501953125, -0.280181884765625, -0.2180023193359375, -0.15582275390625, -0.0936431884765625, -0.031463623046875, 0.0307159423828125, 0.0928955078125, 0.1550750732421875, 0.217254638671875, 0.2794342041015625, 0.34161376953125, 0.4037933349609375, 0.465972900390625, 0.5281524658203125, 0.59033203125, 0.6525115966796875, 0.714691162109375, 0.7768707275390625, 0.83905029296875, 0.9012298583984375, 0.963409423828125, 1.0255889892578125, 1.0877685546875, 1.1499481201171875, 1.212127685546875, 1.2743072509765625, 1.33648681640625, 1.3986663818359375, 1.460845947265625, 1.5230255126953125, 1.585205078125, 1.6473846435546875, 1.709564208984375, 1.7717437744140625, 1.83392333984375, 1.8961029052734375, 1.958282470703125, 2.0204620361328125, 2.0826416015625, 2.1448211669921875, 2.207000732421875, 2.2691802978515625, 2.33135986328125, 2.3935394287109375, 2.455718994140625, 2.5178985595703125, 2.580078125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 12.0, 21.0, 46.0, 85.0, 165.0, 219.0, 206.0, 144.0, 58.0, 31.0, 16.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.44492721557617, -60.64997482299805, -58.855018615722656, -57.06006622314453, -55.26511001586914, -53.470157623291016, -51.675201416015625, -49.8802490234375, -48.085296630859375, -46.29034423828125, -44.49538803100586, -42.700435638427734, -40.905479431152344, -39.11052703857422, -37.315574645996094, -35.5206184387207, -33.72566223144531, -31.930707931518555, -30.135753631591797, -28.340801239013672, -26.54584503173828, -24.750892639160156, -22.9559383392334, -21.16098403930664, -19.366029739379883, -17.571075439453125, -15.776121139526367, -13.981167793273926, -12.186213493347168, -10.39125919342041, -8.596305847167969, -6.801351547241211, -5.006401062011719, -3.21144700050354, -1.4164929389953613, 0.3784608840942383, 2.173415184020996, 3.968369483947754, 5.763322830200195, 7.558277130126953, 9.353231430053711, 11.148185729980469, 12.943140029907227, 14.738093376159668, 16.53304672241211, 18.3280029296875, 20.122955322265625, 21.917909622192383, 23.71286392211914, 25.5078182220459, 27.302772521972656, 29.09772491455078, 30.892681121826172, 32.6876335144043, 34.48258972167969, 36.27754211425781, 38.07249450683594, 39.86744689941406, 41.66240310668945, 43.45735549926758, 45.25231170654297, 47.047264099121094, 48.84221649169922, 50.63717269897461, 52.43212890625]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 2.0, 9.0, 5.0, 12.0, 11.0, 10.0, 17.0, 14.0, 27.0, 25.0, 18.0, 18.0, 40.0, 43.0, 41.0, 39.0, 36.0, 43.0, 41.0, 40.0, 39.0, 45.0, 40.0, 38.0, 51.0, 39.0, 34.0, 32.0, 20.0, 32.0, 27.0, 20.0, 11.0, 18.0, 14.0, 8.0, 7.0, 14.0, 7.0, 6.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.701343536376953, -16.108783721923828, -15.516223907470703, -14.923663139343262, -14.331103324890137, -13.738543510437012, -13.14598274230957, -12.553422927856445, -11.96086311340332, -11.368303298950195, -10.77574348449707, -10.183182716369629, -9.590622901916504, -8.998063087463379, -8.405502319335938, -7.8129425048828125, -7.2203826904296875, -6.6278228759765625, -6.035262584686279, -5.442702293395996, -4.850142478942871, -4.257582664489746, -3.665022373199463, -3.0724620819091797, -2.4799022674560547, -1.8873422145843506, -1.2947821617126465, -0.7022221088409424, -0.10966205596923828, 0.4828979969024658, 1.07545804977417, 1.6680183410644531, 2.260580062866211, 2.853140115737915, 3.445700168609619, 4.038260459899902, 4.630820274353027, 5.223380088806152, 5.8159403800964355, 6.408500671386719, 7.001060485839844, 7.593620300292969, 8.186180114746094, 8.778740882873535, 9.37130069732666, 9.963860511779785, 10.556421279907227, 11.148981094360352, 11.741540908813477, 12.334100723266602, 12.926660537719727, 13.519221305847168, 14.111781120300293, 14.704340934753418, 15.29690170288086, 15.889461517333984, 16.48202133178711, 17.074581146240234, 17.66714096069336, 18.259700775146484, 18.85226058959961, 19.444822311401367, 20.037382125854492, 20.629941940307617, 21.222501754760742]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 6.0, 6.0, 5.0, 7.0, 18.0, 29.0, 34.0, 50.0, 79.0, 120.0, 154.0, 232.0, 327.0, 595.0, 1151.0, 2432.0, 7658.0, 56968.0, 4056076.0, 55495.0, 7590.0, 2500.0, 1086.0, 606.0, 324.0, 228.0, 153.0, 97.0, 70.0, 50.0, 41.0, 21.0, 13.0, 14.0, 13.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4921875, -13.112060546875, -12.73193359375, -12.351806640625, -11.9716796875, -11.591552734375, -11.21142578125, -10.831298828125, -10.451171875, -10.071044921875, -9.69091796875, -9.310791015625, -8.9306640625, -8.550537109375, -8.17041015625, -7.790283203125, -7.41015625, -7.030029296875, -6.64990234375, -6.269775390625, -5.8896484375, -5.509521484375, -5.12939453125, -4.749267578125, -4.369140625, -3.989013671875, -3.60888671875, -3.228759765625, -2.8486328125, -2.468505859375, -2.08837890625, -1.708251953125, -1.328125, -0.947998046875, -0.56787109375, -0.187744140625, 0.1923828125, 0.572509765625, 0.95263671875, 1.332763671875, 1.712890625, 2.093017578125, 2.47314453125, 2.853271484375, 3.2333984375, 3.613525390625, 3.99365234375, 4.373779296875, 4.75390625, 5.134033203125, 5.51416015625, 5.894287109375, 6.2744140625, 6.654541015625, 7.03466796875, 7.414794921875, 7.794921875, 8.175048828125, 8.55517578125, 8.935302734375, 9.3154296875, 9.695556640625, 10.07568359375, 10.455810546875, 10.8359375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 8.0, 9.0, 15.0, 13.0, 18.0, 28.0, 31.0, 39.0, 39.0, 40.0, 53.0, 52.0, 52.0, 48.0, 64.0, 54.0, 53.0, 58.0, 59.0, 46.0, 39.0, 36.0, 31.0, 25.0, 19.0, 22.0, 12.0, 6.0, 10.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.138671875, -1.1056976318359375, -1.072723388671875, -1.0397491455078125, -1.00677490234375, -0.9738006591796875, -0.940826416015625, -0.9078521728515625, -0.8748779296875, -0.8419036865234375, -0.808929443359375, -0.7759552001953125, -0.74298095703125, -0.7100067138671875, -0.677032470703125, -0.6440582275390625, -0.611083984375, -0.5781097412109375, -0.545135498046875, -0.5121612548828125, -0.47918701171875, -0.4462127685546875, -0.413238525390625, -0.3802642822265625, -0.3472900390625, -0.3143157958984375, -0.281341552734375, -0.2483673095703125, -0.21539306640625, -0.1824188232421875, -0.149444580078125, -0.1164703369140625, -0.08349609375, -0.0505218505859375, -0.017547607421875, 0.0154266357421875, 0.04840087890625, 0.0813751220703125, 0.114349365234375, 0.1473236083984375, 0.1802978515625, 0.2132720947265625, 0.246246337890625, 0.2792205810546875, 0.31219482421875, 0.3451690673828125, 0.378143310546875, 0.4111175537109375, 0.444091796875, 0.4770660400390625, 0.510040283203125, 0.5430145263671875, 0.57598876953125, 0.6089630126953125, 0.641937255859375, 0.6749114990234375, 0.7078857421875, 0.7408599853515625, 0.773834228515625, 0.8068084716796875, 0.83978271484375, 0.8727569580078125, 0.905731201171875, 0.9387054443359375, 0.9716796875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 7.0, 11.0, 6.0, 7.0, 19.0, 12.0, 22.0, 36.0, 52.0, 97.0, 108.0, 148.0, 199.0, 319.0, 475.0, 671.0, 947.0, 1582.0, 2391.0, 4012.0, 7718.0, 16817.0, 48571.0, 310606.0, 3637294.0, 108453.0, 28110.0, 11180.0, 5499.0, 3089.0, 1892.0, 1243.0, 824.0, 533.0, 370.0, 310.0, 200.0, 134.0, 87.0, 70.0, 48.0, 39.0, 27.0, 18.0, 16.0, 10.0, 5.0, 1.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.44921875, -3.33135986328125, -3.2135009765625, -3.09564208984375, -2.977783203125, -2.85992431640625, -2.7420654296875, -2.62420654296875, -2.50634765625, -2.38848876953125, -2.2706298828125, -2.15277099609375, -2.034912109375, -1.91705322265625, -1.7991943359375, -1.68133544921875, -1.5634765625, -1.44561767578125, -1.3277587890625, -1.20989990234375, -1.092041015625, -0.97418212890625, -0.8563232421875, -0.73846435546875, -0.62060546875, -0.50274658203125, -0.3848876953125, -0.26702880859375, -0.149169921875, -0.03131103515625, 0.0865478515625, 0.20440673828125, 0.322265625, 0.44012451171875, 0.5579833984375, 0.67584228515625, 0.793701171875, 0.91156005859375, 1.0294189453125, 1.14727783203125, 1.26513671875, 1.38299560546875, 1.5008544921875, 1.61871337890625, 1.736572265625, 1.85443115234375, 1.9722900390625, 2.09014892578125, 2.2080078125, 2.32586669921875, 2.4437255859375, 2.56158447265625, 2.679443359375, 2.79730224609375, 2.9151611328125, 3.03302001953125, 3.15087890625, 3.26873779296875, 3.3865966796875, 3.50445556640625, 3.622314453125, 3.74017333984375, 3.8580322265625, 3.97589111328125, 4.09375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 3.0, 4.0, 5.0, 17.0, 20.0, 33.0, 48.0, 82.0, 204.0, 2525.0, 761.0, 173.0, 66.0, 41.0, 25.0, 8.0, 11.0, 7.0, 6.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.0282745361328125, -0.995025634765625, -0.9617767333984375, -0.92852783203125, -0.8952789306640625, -0.862030029296875, -0.8287811279296875, -0.7955322265625, -0.7622833251953125, -0.729034423828125, -0.6957855224609375, -0.66253662109375, -0.6292877197265625, -0.596038818359375, -0.5627899169921875, -0.529541015625, -0.4962921142578125, -0.463043212890625, -0.4297943115234375, -0.39654541015625, -0.3632965087890625, -0.330047607421875, -0.2967987060546875, -0.2635498046875, -0.2303009033203125, -0.197052001953125, -0.1638031005859375, -0.13055419921875, -0.0973052978515625, -0.064056396484375, -0.0308074951171875, 0.00244140625, 0.0356903076171875, 0.068939208984375, 0.1021881103515625, 0.13543701171875, 0.1686859130859375, 0.201934814453125, 0.2351837158203125, 0.2684326171875, 0.3016815185546875, 0.334930419921875, 0.3681793212890625, 0.40142822265625, 0.4346771240234375, 0.467926025390625, 0.5011749267578125, 0.534423828125, 0.5676727294921875, 0.600921630859375, 0.6341705322265625, 0.66741943359375, 0.7006683349609375, 0.733917236328125, 0.7671661376953125, 0.8004150390625, 0.8336639404296875, 0.866912841796875, 0.9001617431640625, 0.93341064453125, 0.9666595458984375, 0.999908447265625, 1.0331573486328125, 1.06640625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 8.0, 9.0, 28.0, 24.0, 47.0, 67.0, 82.0, 94.0, 124.0, 116.0, 98.0, 87.0, 72.0, 50.0, 41.0, 24.0, 11.0, 5.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.908100605010986, -5.762397766113281, -5.616695404052734, -5.470992565155029, -5.325289726257324, -5.179587364196777, -5.033884525299072, -4.888181686401367, -4.74247932434082, -4.596776485443115, -4.451074123382568, -4.305371284484863, -4.159668445587158, -4.013966083526611, -3.8682632446289062, -3.7225606441497803, -3.576857805252075, -3.431155204772949, -3.285452365875244, -3.139749765396118, -2.994047164916992, -2.848344326019287, -2.702641725540161, -2.556939125061035, -2.41123628616333, -2.265533685684204, -2.119830846786499, -1.974128246307373, -1.828425645828247, -1.6827229261398315, -1.537020206451416, -1.39131760597229, -1.2456152439117432, -1.0999125242233276, -0.9542099237442017, -0.8085072040557861, -0.6628045439720154, -0.5171018838882446, -0.3713991641998291, -0.22569656372070312, -0.0799938440322876, 0.06570883095264435, 0.2114115059375763, 0.35711419582366943, 0.5028168559074402, 0.6485195159912109, 0.7942222356796265, 0.9399248361587524, 1.085627555847168, 1.2313302755355835, 1.3770328760147095, 1.522735595703125, 1.668438196182251, 1.8141409158706665, 1.959843635559082, 2.105546236038208, 2.251248836517334, 2.39695143699646, 2.542654275894165, 2.688356876373291, 2.834059476852417, 2.979762077331543, 3.125464916229248, 3.271167516708374, 3.416870355606079]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 9.0, 3.0, 5.0, 9.0, 12.0, 17.0, 15.0, 17.0, 22.0, 22.0, 25.0, 39.0, 31.0, 40.0, 42.0, 31.0, 48.0, 37.0, 42.0, 47.0, 45.0, 39.0, 41.0, 36.0, 33.0, 36.0, 38.0, 28.0, 36.0, 21.0, 20.0, 24.0, 13.0, 23.0, 11.0, 11.0, 5.0, 6.0, 3.0, 4.0, 3.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.091492176055908, -2.0252082347869873, -1.9589242935180664, -1.892640233039856, -1.826356291770935, -1.7600723505020142, -1.6937882900238037, -1.6275043487548828, -1.561220407485962, -1.494936466217041, -1.4286525249481201, -1.3623684644699097, -1.2960845232009888, -1.2298005819320679, -1.1635165214538574, -1.0972325801849365, -1.0309486389160156, -0.9646646976470947, -0.898380696773529, -0.8320966958999634, -0.7658127546310425, -0.6995288133621216, -0.6332448124885559, -0.5669608116149902, -0.5006768703460693, -0.43439289927482605, -0.36810892820358276, -0.3018249571323395, -0.2355409860610962, -0.1692570149898529, -0.10297304391860962, -0.03668907284736633, 0.029594898223876953, 0.09587886929512024, 0.16216284036636353, 0.2284468114376068, 0.2947307825088501, 0.3610147535800934, 0.42729872465133667, 0.49358269572257996, 0.5598666667938232, 0.6261506080627441, 0.6924346089363098, 0.7587186098098755, 0.8250025510787964, 0.8912864923477173, 0.957570493221283, 1.0238544940948486, 1.0901384353637695, 1.1564223766326904, 1.2227063179016113, 1.2889903783798218, 1.3552743196487427, 1.4215582609176636, 1.487842321395874, 1.554126262664795, 1.6204102039337158, 1.6866941452026367, 1.7529780864715576, 1.819262146949768, 1.885546088218689, 1.9518300294876099, 2.0181140899658203, 2.084398031234741, 2.150681972503662]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 7.0, 11.0, 22.0, 20.0, 36.0, 50.0, 56.0, 80.0, 152.0, 196.0, 292.0, 416.0, 614.0, 882.0, 1437.0, 2347.0, 3807.0, 6543.0, 11223.0, 19991.0, 35392.0, 62593.0, 106021.0, 159207.0, 190370.0, 168950.0, 115348.0, 69321.0, 39810.0, 22100.0, 12557.0, 7291.0, 4189.0, 2537.0, 1636.0, 1020.0, 616.0, 443.0, 308.0, 207.0, 123.0, 82.0, 73.0, 45.0, 40.0, 30.0, 23.0, 13.0, 9.0, 5.0, 5.0, 5.0, 2.0, 0.0, 4.0, 2.0], "bins": [-2.03515625, -1.97271728515625, -1.9102783203125, -1.84783935546875, -1.785400390625, -1.72296142578125, -1.6605224609375, -1.59808349609375, -1.53564453125, -1.47320556640625, -1.4107666015625, -1.34832763671875, -1.285888671875, -1.22344970703125, -1.1610107421875, -1.09857177734375, -1.0361328125, -0.97369384765625, -0.9112548828125, -0.84881591796875, -0.786376953125, -0.72393798828125, -0.6614990234375, -0.59906005859375, -0.53662109375, -0.47418212890625, -0.4117431640625, -0.34930419921875, -0.286865234375, -0.22442626953125, -0.1619873046875, -0.09954833984375, -0.037109375, 0.02532958984375, 0.0877685546875, 0.15020751953125, 0.212646484375, 0.27508544921875, 0.3375244140625, 0.39996337890625, 0.46240234375, 0.52484130859375, 0.5872802734375, 0.64971923828125, 0.712158203125, 0.77459716796875, 0.8370361328125, 0.89947509765625, 0.9619140625, 1.02435302734375, 1.0867919921875, 1.14923095703125, 1.211669921875, 1.27410888671875, 1.3365478515625, 1.39898681640625, 1.46142578125, 1.52386474609375, 1.5863037109375, 1.64874267578125, 1.711181640625, 1.77362060546875, 1.8360595703125, 1.89849853515625, 1.9609375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 7.0, 5.0, 11.0, 13.0, 17.0, 12.0, 19.0, 24.0, 36.0, 42.0, 42.0, 44.0, 45.0, 56.0, 49.0, 54.0, 58.0, 52.0, 64.0, 54.0, 68.0, 32.0, 31.0, 25.0, 34.0, 23.0, 20.0, 12.0, 14.0, 10.0, 10.0, 10.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.232421875, -1.1984634399414062, -1.1645050048828125, -1.1305465698242188, -1.096588134765625, -1.0626296997070312, -1.0286712646484375, -0.9947128295898438, -0.96075439453125, -0.9267959594726562, -0.8928375244140625, -0.8588790893554688, -0.824920654296875, -0.7909622192382812, -0.7570037841796875, -0.7230453491210938, -0.6890869140625, -0.6551284790039062, -0.6211700439453125, -0.5872116088867188, -0.553253173828125, -0.5192947387695312, -0.4853363037109375, -0.45137786865234375, -0.41741943359375, -0.38346099853515625, -0.3495025634765625, -0.31554412841796875, -0.281585693359375, -0.24762725830078125, -0.2136688232421875, -0.17971038818359375, -0.145751953125, -0.11179351806640625, -0.0778350830078125, -0.04387664794921875, -0.009918212890625, 0.02404022216796875, 0.0579986572265625, 0.09195709228515625, 0.12591552734375, 0.15987396240234375, 0.1938323974609375, 0.22779083251953125, 0.261749267578125, 0.29570770263671875, 0.3296661376953125, 0.36362457275390625, 0.3975830078125, 0.43154144287109375, 0.4654998779296875, 0.49945831298828125, 0.533416748046875, 0.5673751831054688, 0.6013336181640625, 0.6352920532226562, 0.66925048828125, 0.7032089233398438, 0.7371673583984375, 0.7711257934570312, 0.805084228515625, 0.8390426635742188, 0.8730010986328125, 0.9069595336914062, 0.94091796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 5.0, 6.0, 4.0, 14.0, 17.0, 31.0, 32.0, 46.0, 57.0, 68.0, 117.0, 128.0, 172.0, 290.0, 351.0, 482.0, 729.0, 1333.0, 3850.0, 23571.0, 215127.0, 659666.0, 122507.0, 13759.0, 2708.0, 1134.0, 681.0, 446.0, 315.0, 223.0, 173.0, 124.0, 91.0, 65.0, 61.0, 51.0, 28.0, 22.0, 22.0, 14.0, 8.0, 9.0, 6.0, 1.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2265625, -5.0423583984375, -4.858154296875, -4.6739501953125, -4.48974609375, -4.3055419921875, -4.121337890625, -3.9371337890625, -3.7529296875, -3.5687255859375, -3.384521484375, -3.2003173828125, -3.01611328125, -2.8319091796875, -2.647705078125, -2.4635009765625, -2.279296875, -2.0950927734375, -1.910888671875, -1.7266845703125, -1.54248046875, -1.3582763671875, -1.174072265625, -0.9898681640625, -0.8056640625, -0.6214599609375, -0.437255859375, -0.2530517578125, -0.06884765625, 0.1153564453125, 0.299560546875, 0.4837646484375, 0.66796875, 0.8521728515625, 1.036376953125, 1.2205810546875, 1.40478515625, 1.5889892578125, 1.773193359375, 1.9573974609375, 2.1416015625, 2.3258056640625, 2.510009765625, 2.6942138671875, 2.87841796875, 3.0626220703125, 3.246826171875, 3.4310302734375, 3.615234375, 3.7994384765625, 3.983642578125, 4.1678466796875, 4.35205078125, 4.5362548828125, 4.720458984375, 4.9046630859375, 5.0888671875, 5.2730712890625, 5.457275390625, 5.6414794921875, 5.82568359375, 6.0098876953125, 6.194091796875, 6.3782958984375, 6.5625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 8.0, 5.0, 9.0, 9.0, 13.0, 15.0, 12.0, 14.0, 20.0, 21.0, 26.0, 25.0, 34.0, 32.0, 33.0, 32.0, 47.0, 31.0, 42.0, 36.0, 40.0, 38.0, 45.0, 45.0, 50.0, 35.0, 38.0, 27.0, 29.0, 43.0, 24.0, 25.0, 11.0, 13.0, 13.0, 8.0, 14.0, 9.0, 6.0, 5.0, 6.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.427734375, -3.3203125, -3.212890625, -3.10546875, -2.998046875, -2.890625, -2.783203125, -2.67578125, -2.568359375, -2.4609375, -2.353515625, -2.24609375, -2.138671875, -2.03125, -1.923828125, -1.81640625, -1.708984375, -1.6015625, -1.494140625, -1.38671875, -1.279296875, -1.171875, -1.064453125, -0.95703125, -0.849609375, -0.7421875, -0.634765625, -0.52734375, -0.419921875, -0.3125, -0.205078125, -0.09765625, 0.009765625, 0.1171875, 0.224609375, 0.33203125, 0.439453125, 0.546875, 0.654296875, 0.76171875, 0.869140625, 0.9765625, 1.083984375, 1.19140625, 1.298828125, 1.40625, 1.513671875, 1.62109375, 1.728515625, 1.8359375, 1.943359375, 2.05078125, 2.158203125, 2.265625, 2.373046875, 2.48046875, 2.587890625, 2.6953125, 2.802734375, 2.91015625, 3.017578125, 3.125, 3.232421875, 3.33984375, 3.447265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 0.0, 6.0, 9.0, 7.0, 14.0, 14.0, 23.0, 28.0, 33.0, 63.0, 78.0, 148.0, 249.0, 484.0, 935.0, 2139.0, 6184.0, 23619.0, 109645.0, 469940.0, 339800.0, 71344.0, 15750.0, 4578.0, 1649.0, 767.0, 431.0, 205.0, 132.0, 84.0, 51.0, 39.0, 20.0, 17.0, 9.0, 16.0, 9.0, 15.0, 6.0, 5.0, 1.0, 5.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.11328125, -2.046966552734375, -1.98065185546875, -1.914337158203125, -1.8480224609375, -1.781707763671875, -1.71539306640625, -1.649078369140625, -1.582763671875, -1.516448974609375, -1.45013427734375, -1.383819580078125, -1.3175048828125, -1.251190185546875, -1.18487548828125, -1.118560791015625, -1.05224609375, -0.985931396484375, -0.91961669921875, -0.853302001953125, -0.7869873046875, -0.720672607421875, -0.65435791015625, -0.588043212890625, -0.521728515625, -0.455413818359375, -0.38909912109375, -0.322784423828125, -0.2564697265625, -0.190155029296875, -0.12384033203125, -0.057525634765625, 0.0087890625, 0.075103759765625, 0.14141845703125, 0.207733154296875, 0.2740478515625, 0.340362548828125, 0.40667724609375, 0.472991943359375, 0.539306640625, 0.605621337890625, 0.67193603515625, 0.738250732421875, 0.8045654296875, 0.870880126953125, 0.93719482421875, 1.003509521484375, 1.06982421875, 1.136138916015625, 1.20245361328125, 1.268768310546875, 1.3350830078125, 1.401397705078125, 1.46771240234375, 1.534027099609375, 1.600341796875, 1.666656494140625, 1.73297119140625, 1.799285888671875, 1.8656005859375, 1.931915283203125, 1.99822998046875, 2.064544677734375, 2.130859375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 9.0, 5.0, 13.0, 10.0, 20.0, 18.0, 16.0, 29.0, 32.0, 48.0, 52.0, 67.0, 68.0, 97.0, 76.0, 64.0, 70.0, 58.0, 51.0, 42.0, 28.0, 32.0, 15.0, 26.0, 8.0, 11.0, 10.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024330615997314453, -0.00023430772125720978, -0.00022530928254127502, -0.00021631084382534027, -0.00020731240510940552, -0.00019831396639347076, -0.000189315527677536, -0.00018031708896160126, -0.0001713186502456665, -0.00016232021152973175, -0.000153321772813797, -0.00014432333409786224, -0.0001353248953819275, -0.00012632645666599274, -0.00011732801795005798, -0.00010832957923412323, -9.933114051818848e-05, -9.033270180225372e-05, -8.133426308631897e-05, -7.233582437038422e-05, -6.333738565444946e-05, -5.433894693851471e-05, -4.5340508222579956e-05, -3.63420695066452e-05, -2.734363079071045e-05, -1.8345192074775696e-05, -9.346753358840942e-06, -3.4831464290618896e-07, 8.650124073028564e-06, 1.7648562788963318e-05, 2.664700150489807e-05, 3.5645440220832825e-05, 4.464387893676758e-05, 5.364231765270233e-05, 6.264075636863708e-05, 7.163919508457184e-05, 8.063763380050659e-05, 8.963607251644135e-05, 9.86345112323761e-05, 0.00010763294994831085, 0.0001166313886642456, 0.00012562982738018036, 0.0001346282660961151, 0.00014362670481204987, 0.00015262514352798462, 0.00016162358224391937, 0.00017062202095985413, 0.00017962045967578888, 0.00018861889839172363, 0.00019761733710765839, 0.00020661577582359314, 0.0002156142145395279, 0.00022461265325546265, 0.0002336110919713974, 0.00024260953068733215, 0.0002516079694032669, 0.00026060640811920166, 0.0002696048468351364, 0.00027860328555107117, 0.0002876017242670059, 0.0002966001629829407, 0.00030559860169887543, 0.0003145970404148102, 0.00032359547913074493, 0.0003325939178466797]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 3.0, 7.0, 2.0, 11.0, 9.0, 16.0, 32.0, 46.0, 55.0, 109.0, 128.0, 213.0, 373.0, 690.0, 1421.0, 3668.0, 14514.0, 108972.0, 640992.0, 239670.0, 27998.0, 5651.0, 1909.0, 917.0, 463.0, 231.0, 140.0, 90.0, 64.0, 49.0, 32.0, 26.0, 12.0, 12.0, 9.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.87890625, -2.78802490234375, -2.6971435546875, -2.60626220703125, -2.515380859375, -2.42449951171875, -2.3336181640625, -2.24273681640625, -2.15185546875, -2.06097412109375, -1.9700927734375, -1.87921142578125, -1.788330078125, -1.69744873046875, -1.6065673828125, -1.51568603515625, -1.4248046875, -1.33392333984375, -1.2430419921875, -1.15216064453125, -1.061279296875, -0.97039794921875, -0.8795166015625, -0.78863525390625, -0.69775390625, -0.60687255859375, -0.5159912109375, -0.42510986328125, -0.334228515625, -0.24334716796875, -0.1524658203125, -0.06158447265625, 0.029296875, 0.12017822265625, 0.2110595703125, 0.30194091796875, 0.392822265625, 0.48370361328125, 0.5745849609375, 0.66546630859375, 0.75634765625, 0.84722900390625, 0.9381103515625, 1.02899169921875, 1.119873046875, 1.21075439453125, 1.3016357421875, 1.39251708984375, 1.4833984375, 1.57427978515625, 1.6651611328125, 1.75604248046875, 1.846923828125, 1.93780517578125, 2.0286865234375, 2.11956787109375, 2.21044921875, 2.30133056640625, 2.3922119140625, 2.48309326171875, 2.573974609375, 2.66485595703125, 2.7557373046875, 2.84661865234375, 2.9375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 5.0, 12.0, 10.0, 21.0, 26.0, 28.0, 42.0, 42.0, 54.0, 94.0, 89.0, 83.0, 91.0, 80.0, 66.0, 72.0, 39.0, 45.0, 30.0, 21.0, 15.0, 9.0, 9.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.025390625, -1.955474853515625, -1.88555908203125, -1.815643310546875, -1.7457275390625, -1.675811767578125, -1.60589599609375, -1.535980224609375, -1.466064453125, -1.396148681640625, -1.32623291015625, -1.256317138671875, -1.1864013671875, -1.116485595703125, -1.04656982421875, -0.976654052734375, -0.90673828125, -0.836822509765625, -0.76690673828125, -0.696990966796875, -0.6270751953125, -0.557159423828125, -0.48724365234375, -0.417327880859375, -0.347412109375, -0.277496337890625, -0.20758056640625, -0.137664794921875, -0.0677490234375, 0.002166748046875, 0.07208251953125, 0.141998291015625, 0.2119140625, 0.281829833984375, 0.35174560546875, 0.421661376953125, 0.4915771484375, 0.561492919921875, 0.63140869140625, 0.701324462890625, 0.771240234375, 0.841156005859375, 0.91107177734375, 0.980987548828125, 1.0509033203125, 1.120819091796875, 1.19073486328125, 1.260650634765625, 1.33056640625, 1.400482177734375, 1.47039794921875, 1.540313720703125, 1.6102294921875, 1.680145263671875, 1.75006103515625, 1.819976806640625, 1.889892578125, 1.959808349609375, 2.02972412109375, 2.099639892578125, 2.1695556640625, 2.239471435546875, 2.30938720703125, 2.379302978515625, 2.44921875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 15.0, 24.0, 69.0, 109.0, 187.0, 231.0, 155.0, 103.0, 59.0, 33.0, 9.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.95857238769531, -39.29039764404297, -37.62221908569336, -35.95404052734375, -34.285865783691406, -32.61769104003906, -30.949512481689453, -29.281335830688477, -27.6131591796875, -25.944982528686523, -24.276805877685547, -22.60862922668457, -20.940452575683594, -19.272275924682617, -17.60409927368164, -15.935922622680664, -14.267745971679688, -12.599569320678711, -10.931392669677734, -9.263216018676758, -7.595039367675781, -5.926862716674805, -4.258686065673828, -2.5905094146728516, -0.922332763671875, 0.7458438873291016, 2.414020538330078, 4.082197189331055, 5.750373840332031, 7.418550491333008, 9.086727142333984, 10.754903793334961, 12.423080444335938, 14.091257095336914, 15.75943374633789, 17.427610397338867, 19.095787048339844, 20.76396369934082, 22.432140350341797, 24.100317001342773, 25.76849365234375, 27.436670303344727, 29.104846954345703, 30.77302360534668, 32.441200256347656, 34.109375, 35.77755355834961, 37.44573211669922, 39.11390686035156, 40.782081604003906, 42.450260162353516, 44.118438720703125, 45.78661346435547, 47.45478820800781, 49.12296676635742, 50.79114532470703, 52.459320068359375, 54.12749481201172, 55.79567337036133, 57.46385192871094, 59.13202667236328, 60.800201416015625, 62.468379974365234, 64.13655853271484, 65.80473327636719]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 3.0, 3.0, 9.0, 18.0, 9.0, 9.0, 19.0, 20.0, 18.0, 30.0, 25.0, 27.0, 47.0, 24.0, 39.0, 51.0, 48.0, 52.0, 45.0, 52.0, 51.0, 44.0, 45.0, 40.0, 37.0, 37.0, 34.0, 30.0, 23.0, 18.0, 20.0, 14.0, 18.0, 9.0, 9.0, 11.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-23.52798843383789, -22.886945724487305, -22.24590301513672, -21.604860305786133, -20.963817596435547, -20.322772979736328, -19.681730270385742, -19.040687561035156, -18.39964485168457, -17.758602142333984, -17.1175594329834, -16.476516723632812, -15.83547306060791, -15.194430351257324, -14.553386688232422, -13.912343978881836, -13.27130126953125, -12.630258560180664, -11.989215850830078, -11.348172187805176, -10.70712947845459, -10.066086769104004, -9.425043106079102, -8.784000396728516, -8.14295768737793, -7.501914978027344, -6.8608717918396, -6.2198286056518555, -5.5787858963012695, -4.937743186950684, -4.2967000007629395, -3.6556568145751953, -3.0146141052246094, -2.3735711574554443, -1.7325282096862793, -1.0914852619171143, -0.4504423141479492, 0.19060063362121582, 0.8316435813903809, 1.472686767578125, 2.113729476928711, 2.754772424697876, 3.395815372467041, 4.036858558654785, 4.677901268005371, 5.318943977355957, 5.959987163543701, 6.601030349731445, 7.242073059082031, 7.883115768432617, 8.524158477783203, 9.165202140808105, 9.806244850158691, 10.447287559509277, 11.08833122253418, 11.729373931884766, 12.370416641235352, 13.011459350585938, 13.652502059936523, 14.293545722961426, 14.934588432312012, 15.575631141662598, 16.2166748046875, 16.857717514038086, 17.498760223388672]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 6.0, 12.0, 11.0, 7.0, 11.0, 26.0, 46.0, 53.0, 101.0, 165.0, 230.0, 387.0, 813.0, 1509.0, 3364.0, 10120.0, 53889.0, 3962686.0, 134930.0, 16948.0, 4787.0, 1951.0, 910.0, 528.0, 303.0, 166.0, 97.0, 70.0, 54.0, 36.0, 26.0, 9.0, 8.0, 5.0, 8.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3984375, -8.13330078125, -7.8681640625, -7.60302734375, -7.337890625, -7.07275390625, -6.8076171875, -6.54248046875, -6.27734375, -6.01220703125, -5.7470703125, -5.48193359375, -5.216796875, -4.95166015625, -4.6865234375, -4.42138671875, -4.15625, -3.89111328125, -3.6259765625, -3.36083984375, -3.095703125, -2.83056640625, -2.5654296875, -2.30029296875, -2.03515625, -1.77001953125, -1.5048828125, -1.23974609375, -0.974609375, -0.70947265625, -0.4443359375, -0.17919921875, 0.0859375, 0.35107421875, 0.6162109375, 0.88134765625, 1.146484375, 1.41162109375, 1.6767578125, 1.94189453125, 2.20703125, 2.47216796875, 2.7373046875, 3.00244140625, 3.267578125, 3.53271484375, 3.7978515625, 4.06298828125, 4.328125, 4.59326171875, 4.8583984375, 5.12353515625, 5.388671875, 5.65380859375, 5.9189453125, 6.18408203125, 6.44921875, 6.71435546875, 6.9794921875, 7.24462890625, 7.509765625, 7.77490234375, 8.0400390625, 8.30517578125, 8.5703125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 13.0, 11.0, 10.0, 24.0, 11.0, 26.0, 35.0, 32.0, 33.0, 53.0, 36.0, 50.0, 45.0, 82.0, 50.0, 61.0, 52.0, 58.0, 47.0, 35.0, 46.0, 34.0, 26.0, 26.0, 21.0, 16.0, 19.0, 6.0, 10.0, 8.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2490234375, -1.2156448364257812, -1.1822662353515625, -1.1488876342773438, -1.115509033203125, -1.0821304321289062, -1.0487518310546875, -1.0153732299804688, -0.98199462890625, -0.9486160278320312, -0.9152374267578125, -0.8818588256835938, -0.848480224609375, -0.8151016235351562, -0.7817230224609375, -0.7483444213867188, -0.7149658203125, -0.6815872192382812, -0.6482086181640625, -0.6148300170898438, -0.581451416015625, -0.5480728149414062, -0.5146942138671875, -0.48131561279296875, -0.44793701171875, -0.41455841064453125, -0.3811798095703125, -0.34780120849609375, -0.314422607421875, -0.28104400634765625, -0.2476654052734375, -0.21428680419921875, -0.180908203125, -0.14752960205078125, -0.1141510009765625, -0.08077239990234375, -0.047393798828125, -0.01401519775390625, 0.0193634033203125, 0.05274200439453125, 0.08612060546875, 0.11949920654296875, 0.1528778076171875, 0.18625640869140625, 0.219635009765625, 0.25301361083984375, 0.2863922119140625, 0.31977081298828125, 0.3531494140625, 0.38652801513671875, 0.4199066162109375, 0.45328521728515625, 0.486663818359375, 0.5200424194335938, 0.5534210205078125, 0.5867996215820312, 0.62017822265625, 0.6535568237304688, 0.6869354248046875, 0.7203140258789062, 0.753692626953125, 0.7870712280273438, 0.8204498291015625, 0.8538284301757812, 0.88720703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 7.0, 5.0, 18.0, 21.0, 18.0, 34.0, 39.0, 48.0, 86.0, 114.0, 162.0, 216.0, 357.0, 542.0, 881.0, 1259.0, 2220.0, 3754.0, 7062.0, 14941.0, 40439.0, 186033.0, 3663301.0, 197990.0, 42090.0, 15557.0, 7305.0, 3749.0, 2169.0, 1283.0, 834.0, 563.0, 389.0, 231.0, 161.0, 106.0, 93.0, 58.0, 33.0, 40.0, 18.0, 15.0, 9.0, 13.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.611328125, -3.49298095703125, -3.3746337890625, -3.25628662109375, -3.137939453125, -3.01959228515625, -2.9012451171875, -2.78289794921875, -2.66455078125, -2.54620361328125, -2.4278564453125, -2.30950927734375, -2.191162109375, -2.07281494140625, -1.9544677734375, -1.83612060546875, -1.7177734375, -1.59942626953125, -1.4810791015625, -1.36273193359375, -1.244384765625, -1.12603759765625, -1.0076904296875, -0.88934326171875, -0.77099609375, -0.65264892578125, -0.5343017578125, -0.41595458984375, -0.297607421875, -0.17926025390625, -0.0609130859375, 0.05743408203125, 0.17578125, 0.29412841796875, 0.4124755859375, 0.53082275390625, 0.649169921875, 0.76751708984375, 0.8858642578125, 1.00421142578125, 1.12255859375, 1.24090576171875, 1.3592529296875, 1.47760009765625, 1.595947265625, 1.71429443359375, 1.8326416015625, 1.95098876953125, 2.0693359375, 2.18768310546875, 2.3060302734375, 2.42437744140625, 2.542724609375, 2.66107177734375, 2.7794189453125, 2.89776611328125, 3.01611328125, 3.13446044921875, 3.2528076171875, 3.37115478515625, 3.489501953125, 3.60784912109375, 3.7261962890625, 3.84454345703125, 3.962890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 12.0, 13.0, 21.0, 29.0, 43.0, 53.0, 110.0, 273.0, 2450.0, 592.0, 186.0, 92.0, 52.0, 36.0, 24.0, 12.0, 11.0, 9.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.95751953125, -0.9242630004882812, -0.8910064697265625, -0.8577499389648438, -0.824493408203125, -0.7912368774414062, -0.7579803466796875, -0.7247238159179688, -0.69146728515625, -0.6582107543945312, -0.6249542236328125, -0.5916976928710938, -0.558441162109375, -0.5251846313476562, -0.4919281005859375, -0.45867156982421875, -0.4254150390625, -0.39215850830078125, -0.3589019775390625, -0.32564544677734375, -0.292388916015625, -0.25913238525390625, -0.2258758544921875, -0.19261932373046875, -0.15936279296875, -0.12610626220703125, -0.0928497314453125, -0.05959320068359375, -0.026336669921875, 0.00691986083984375, 0.0401763916015625, 0.07343292236328125, 0.106689453125, 0.13994598388671875, 0.1732025146484375, 0.20645904541015625, 0.239715576171875, 0.27297210693359375, 0.3062286376953125, 0.33948516845703125, 0.37274169921875, 0.40599822998046875, 0.4392547607421875, 0.47251129150390625, 0.505767822265625, 0.5390243530273438, 0.5722808837890625, 0.6055374145507812, 0.6387939453125, 0.6720504760742188, 0.7053070068359375, 0.7385635375976562, 0.771820068359375, 0.8050765991210938, 0.8383331298828125, 0.8715896606445312, 0.90484619140625, 0.9381027221679688, 0.9713592529296875, 1.0046157836914062, 1.037872314453125, 1.0711288452148438, 1.1043853759765625, 1.1376419067382812, 1.1708984375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 3.0, 12.0, 9.0, 13.0, 21.0, 32.0, 49.0, 66.0, 69.0, 89.0, 109.0, 99.0, 105.0, 99.0, 65.0, 51.0, 38.0, 23.0, 23.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.423069000244141, -4.252223014831543, -4.081377029418945, -3.910531520843506, -3.739685535430908, -3.5688395500183105, -3.397993803024292, -3.2271480560302734, -3.056302070617676, -2.885456085205078, -2.7146103382110596, -2.543764591217041, -2.3729186058044434, -2.2020726203918457, -2.031226873397827, -1.860381007194519, -1.689535140991211, -1.5186892747879028, -1.3478434085845947, -1.1769975423812866, -1.0061516761779785, -0.8353058099746704, -0.6644599437713623, -0.4936140775680542, -0.3227682113647461, -0.151922345161438, 0.018923521041870117, 0.18976938724517822, 0.36061525344848633, 0.5314611196517944, 0.7023069858551025, 0.8731528520584106, 1.0439987182617188, 1.2148445844650269, 1.385690450668335, 1.556536316871643, 1.7273821830749512, 1.8982280492782593, 2.0690739154815674, 2.239919662475586, 2.4107656478881836, 2.5816116333007812, 2.7524573802948, 2.9233031272888184, 3.094149112701416, 3.2649950981140137, 3.4358408451080322, 3.606686592102051, 3.7775325775146484, 3.948378562927246, 4.119224548339844, 4.290070056915283, 4.460916042327881, 4.6317620277404785, 4.802607536315918, 4.973453521728516, 5.144299507141113, 5.315145492553711, 5.485991477966309, 5.656836986541748, 5.827682971954346, 5.998528957366943, 6.169374465942383, 6.3402204513549805, 6.511066436767578]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 5.0, 6.0, 10.0, 5.0, 18.0, 8.0, 12.0, 8.0, 14.0, 32.0, 23.0, 29.0, 22.0, 22.0, 41.0, 42.0, 33.0, 36.0, 44.0, 38.0, 43.0, 51.0, 47.0, 35.0, 43.0, 26.0, 40.0, 28.0, 32.0, 33.0, 20.0, 25.0, 32.0, 25.0, 10.0, 11.0, 9.0, 12.0, 6.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4137866497039795, -2.3262338638305664, -2.2386810779571533, -2.1511282920837402, -2.063575506210327, -1.976022720336914, -1.8884700536727905, -1.8009172677993774, -1.7133644819259644, -1.6258116960525513, -1.5382589101791382, -1.4507062435150146, -1.3631534576416016, -1.2756006717681885, -1.1880478858947754, -1.1004951000213623, -1.0129423141479492, -0.9253895282745361, -0.837836742401123, -0.7502840161323547, -0.6627312302589417, -0.5751784443855286, -0.48762571811676025, -0.40007293224334717, -0.3125201463699341, -0.2249673753976822, -0.1374146044254303, -0.0498618483543396, 0.037690937519073486, 0.12524372339248657, 0.21279644966125488, 0.30034923553466797, 0.38790202140808105, 0.47545480728149414, 0.5630075931549072, 0.6505603194236755, 0.7381131052970886, 0.8256658911705017, 0.91321861743927, 1.000771403312683, 1.0883241891860962, 1.1758769750595093, 1.2634297609329224, 1.350982427597046, 1.438535213470459, 1.526087999343872, 1.6136407852172852, 1.7011935710906982, 1.7887463569641113, 1.8762991428375244, 1.9638519287109375, 2.0514047145843506, 2.1389575004577637, 2.2265102863311768, 2.31406307220459, 2.401615619659424, 2.489168643951416, 2.576721429824829, 2.664274215698242, 2.7518270015716553, 2.8393797874450684, 2.9269325733184814, 3.0144853591918945, 3.1020379066467285, 3.1895906925201416]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 8.0, 8.0, 10.0, 17.0, 15.0, 21.0, 36.0, 72.0, 74.0, 95.0, 177.0, 255.0, 348.0, 562.0, 795.0, 1287.0, 2115.0, 3371.0, 5910.0, 10692.0, 19213.0, 36375.0, 68102.0, 119240.0, 179148.0, 203712.0, 164462.0, 104237.0, 58008.0, 31052.0, 16749.0, 8971.0, 5136.0, 3012.0, 1861.0, 1141.0, 793.0, 456.0, 328.0, 204.0, 159.0, 101.0, 73.0, 50.0, 37.0, 24.0, 15.0, 9.0, 8.0, 7.0, 4.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7060546875, -1.65167236328125, -1.5972900390625, -1.54290771484375, -1.488525390625, -1.43414306640625, -1.3797607421875, -1.32537841796875, -1.27099609375, -1.21661376953125, -1.1622314453125, -1.10784912109375, -1.053466796875, -0.99908447265625, -0.9447021484375, -0.89031982421875, -0.8359375, -0.78155517578125, -0.7271728515625, -0.67279052734375, -0.618408203125, -0.56402587890625, -0.5096435546875, -0.45526123046875, -0.40087890625, -0.34649658203125, -0.2921142578125, -0.23773193359375, -0.183349609375, -0.12896728515625, -0.0745849609375, -0.02020263671875, 0.0341796875, 0.08856201171875, 0.1429443359375, 0.19732666015625, 0.251708984375, 0.30609130859375, 0.3604736328125, 0.41485595703125, 0.46923828125, 0.52362060546875, 0.5780029296875, 0.63238525390625, 0.686767578125, 0.74114990234375, 0.7955322265625, 0.84991455078125, 0.904296875, 0.95867919921875, 1.0130615234375, 1.06744384765625, 1.121826171875, 1.17620849609375, 1.2305908203125, 1.28497314453125, 1.33935546875, 1.39373779296875, 1.4481201171875, 1.50250244140625, 1.556884765625, 1.61126708984375, 1.6656494140625, 1.72003173828125, 1.7744140625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 5.0, 11.0, 16.0, 16.0, 16.0, 26.0, 17.0, 30.0, 25.0, 28.0, 41.0, 43.0, 55.0, 45.0, 40.0, 55.0, 56.0, 57.0, 49.0, 42.0, 52.0, 44.0, 43.0, 29.0, 24.0, 17.0, 28.0, 15.0, 12.0, 13.0, 8.0, 9.0, 8.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.263671875, -1.2305068969726562, -1.1973419189453125, -1.1641769409179688, -1.131011962890625, -1.0978469848632812, -1.0646820068359375, -1.0315170288085938, -0.99835205078125, -0.9651870727539062, -0.9320220947265625, -0.8988571166992188, -0.865692138671875, -0.8325271606445312, -0.7993621826171875, -0.7661972045898438, -0.7330322265625, -0.6998672485351562, -0.6667022705078125, -0.6335372924804688, -0.600372314453125, -0.5672073364257812, -0.5340423583984375, -0.5008773803710938, -0.46771240234375, -0.43454742431640625, -0.4013824462890625, -0.36821746826171875, -0.335052490234375, -0.30188751220703125, -0.2687225341796875, -0.23555755615234375, -0.202392578125, -0.16922760009765625, -0.1360626220703125, -0.10289764404296875, -0.069732666015625, -0.03656768798828125, -0.0034027099609375, 0.02976226806640625, 0.06292724609375, 0.09609222412109375, 0.1292572021484375, 0.16242218017578125, 0.195587158203125, 0.22875213623046875, 0.2619171142578125, 0.29508209228515625, 0.3282470703125, 0.36141204833984375, 0.3945770263671875, 0.42774200439453125, 0.460906982421875, 0.49407196044921875, 0.5272369384765625, 0.5604019165039062, 0.59356689453125, 0.6267318725585938, 0.6598968505859375, 0.6930618286132812, 0.726226806640625, 0.7593917846679688, 0.7925567626953125, 0.8257217407226562, 0.85888671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 10.0, 9.0, 14.0, 20.0, 27.0, 41.0, 63.0, 81.0, 104.0, 138.0, 229.0, 300.0, 410.0, 597.0, 960.0, 1627.0, 5708.0, 66551.0, 744790.0, 208564.0, 12524.0, 2377.0, 1090.0, 693.0, 447.0, 331.0, 251.0, 190.0, 128.0, 99.0, 58.0, 36.0, 29.0, 22.0, 12.0, 10.0, 10.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.72265625, -6.510498046875, -6.29833984375, -6.086181640625, -5.8740234375, -5.661865234375, -5.44970703125, -5.237548828125, -5.025390625, -4.813232421875, -4.60107421875, -4.388916015625, -4.1767578125, -3.964599609375, -3.75244140625, -3.540283203125, -3.328125, -3.115966796875, -2.90380859375, -2.691650390625, -2.4794921875, -2.267333984375, -2.05517578125, -1.843017578125, -1.630859375, -1.418701171875, -1.20654296875, -0.994384765625, -0.7822265625, -0.570068359375, -0.35791015625, -0.145751953125, 0.06640625, 0.278564453125, 0.49072265625, 0.702880859375, 0.9150390625, 1.127197265625, 1.33935546875, 1.551513671875, 1.763671875, 1.975830078125, 2.18798828125, 2.400146484375, 2.6123046875, 2.824462890625, 3.03662109375, 3.248779296875, 3.4609375, 3.673095703125, 3.88525390625, 4.097412109375, 4.3095703125, 4.521728515625, 4.73388671875, 4.946044921875, 5.158203125, 5.370361328125, 5.58251953125, 5.794677734375, 6.0068359375, 6.218994140625, 6.43115234375, 6.643310546875, 6.85546875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 5.0, 1.0, 7.0, 10.0, 5.0, 3.0, 14.0, 16.0, 19.0, 23.0, 16.0, 21.0, 33.0, 27.0, 27.0, 29.0, 34.0, 35.0, 43.0, 50.0, 42.0, 35.0, 35.0, 50.0, 38.0, 42.0, 29.0, 36.0, 36.0, 32.0, 34.0, 28.0, 18.0, 14.0, 19.0, 12.0, 14.0, 10.0, 13.0, 10.0, 3.0, 6.0, 5.0, 5.0, 2.0, 2.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.908203125, -3.787078857421875, -3.66595458984375, -3.544830322265625, -3.4237060546875, -3.302581787109375, -3.18145751953125, -3.060333251953125, -2.939208984375, -2.818084716796875, -2.69696044921875, -2.575836181640625, -2.4547119140625, -2.333587646484375, -2.21246337890625, -2.091339111328125, -1.97021484375, -1.849090576171875, -1.72796630859375, -1.606842041015625, -1.4857177734375, -1.364593505859375, -1.24346923828125, -1.122344970703125, -1.001220703125, -0.880096435546875, -0.75897216796875, -0.637847900390625, -0.5167236328125, -0.395599365234375, -0.27447509765625, -0.153350830078125, -0.0322265625, 0.088897705078125, 0.21002197265625, 0.331146240234375, 0.4522705078125, 0.573394775390625, 0.69451904296875, 0.815643310546875, 0.936767578125, 1.057891845703125, 1.17901611328125, 1.300140380859375, 1.4212646484375, 1.542388916015625, 1.66351318359375, 1.784637451171875, 1.90576171875, 2.026885986328125, 2.14801025390625, 2.269134521484375, 2.3902587890625, 2.511383056640625, 2.63250732421875, 2.753631591796875, 2.874755859375, 2.995880126953125, 3.11700439453125, 3.238128662109375, 3.3592529296875, 3.480377197265625, 3.60150146484375, 3.722625732421875, 3.84375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 0.0, 6.0, 7.0, 7.0, 7.0, 6.0, 15.0, 25.0, 23.0, 45.0, 56.0, 74.0, 127.0, 178.0, 320.0, 550.0, 1146.0, 3256.0, 16739.0, 177337.0, 743416.0, 90221.0, 10266.0, 2455.0, 991.0, 482.0, 284.0, 164.0, 98.0, 78.0, 48.0, 33.0, 29.0, 20.0, 10.0, 8.0, 7.0, 7.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.82421875, -2.731231689453125, -2.63824462890625, -2.545257568359375, -2.4522705078125, -2.359283447265625, -2.26629638671875, -2.173309326171875, -2.080322265625, -1.987335205078125, -1.89434814453125, -1.801361083984375, -1.7083740234375, -1.615386962890625, -1.52239990234375, -1.429412841796875, -1.33642578125, -1.243438720703125, -1.15045166015625, -1.057464599609375, -0.9644775390625, -0.871490478515625, -0.77850341796875, -0.685516357421875, -0.592529296875, -0.499542236328125, -0.40655517578125, -0.313568115234375, -0.2205810546875, -0.127593994140625, -0.03460693359375, 0.058380126953125, 0.1513671875, 0.244354248046875, 0.33734130859375, 0.430328369140625, 0.5233154296875, 0.616302490234375, 0.70928955078125, 0.802276611328125, 0.895263671875, 0.988250732421875, 1.08123779296875, 1.174224853515625, 1.2672119140625, 1.360198974609375, 1.45318603515625, 1.546173095703125, 1.63916015625, 1.732147216796875, 1.82513427734375, 1.918121337890625, 2.0111083984375, 2.104095458984375, 2.19708251953125, 2.290069580078125, 2.383056640625, 2.476043701171875, 2.56903076171875, 2.662017822265625, 2.7550048828125, 2.847991943359375, 2.94097900390625, 3.033966064453125, 3.126953125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 5.0, 4.0, 14.0, 19.0, 29.0, 27.0, 63.0, 70.0, 81.0, 117.0, 113.0, 108.0, 96.0, 69.0, 49.0, 31.0, 30.0, 18.0, 13.0, 10.0, 8.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003783702850341797, -0.0003658905625343323, -0.00035341084003448486, -0.00034093111753463745, -0.00032845139503479004, -0.0003159716725349426, -0.0003034919500350952, -0.0002910122275352478, -0.0002785325050354004, -0.000266052782535553, -0.00025357306003570557, -0.00024109333753585815, -0.00022861361503601074, -0.00021613389253616333, -0.00020365417003631592, -0.0001911744475364685, -0.0001786947250366211, -0.00016621500253677368, -0.00015373528003692627, -0.00014125555753707886, -0.00012877583503723145, -0.00011629611253738403, -0.00010381639003753662, -9.133666753768921e-05, -7.88569450378418e-05, -6.637722253799438e-05, -5.389750003814697e-05, -4.141777753829956e-05, -2.893805503845215e-05, -1.6458332538604736e-05, -3.978610038757324e-06, 8.501112461090088e-06, 2.09808349609375e-05, 3.346055746078491e-05, 4.5940279960632324e-05, 5.8420002460479736e-05, 7.089972496032715e-05, 8.337944746017456e-05, 9.585916996002197e-05, 0.00010833889245986938, 0.0001208186149597168, 0.0001332983374595642, 0.00014577805995941162, 0.00015825778245925903, 0.00017073750495910645, 0.00018321722745895386, 0.00019569694995880127, 0.00020817667245864868, 0.0002206563949584961, 0.0002331361174583435, 0.0002456158399581909, 0.00025809556245803833, 0.00027057528495788574, 0.00028305500745773315, 0.00029553472995758057, 0.000308014452457428, 0.0003204941749572754, 0.0003329738974571228, 0.0003454536199569702, 0.0003579333424568176, 0.00037041306495666504, 0.00038289278745651245, 0.00039537250995635986, 0.0004078522324562073, 0.0004203319549560547]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 11.0, 22.0, 28.0, 49.0, 86.0, 179.0, 343.0, 942.0, 3163.0, 45279.0, 950823.0, 42858.0, 3127.0, 914.0, 349.0, 158.0, 84.0, 55.0, 21.0, 9.0, 17.0, 11.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.07421875, -5.88134765625, -5.6884765625, -5.49560546875, -5.302734375, -5.10986328125, -4.9169921875, -4.72412109375, -4.53125, -4.33837890625, -4.1455078125, -3.95263671875, -3.759765625, -3.56689453125, -3.3740234375, -3.18115234375, -2.98828125, -2.79541015625, -2.6025390625, -2.40966796875, -2.216796875, -2.02392578125, -1.8310546875, -1.63818359375, -1.4453125, -1.25244140625, -1.0595703125, -0.86669921875, -0.673828125, -0.48095703125, -0.2880859375, -0.09521484375, 0.09765625, 0.29052734375, 0.4833984375, 0.67626953125, 0.869140625, 1.06201171875, 1.2548828125, 1.44775390625, 1.640625, 1.83349609375, 2.0263671875, 2.21923828125, 2.412109375, 2.60498046875, 2.7978515625, 2.99072265625, 3.18359375, 3.37646484375, 3.5693359375, 3.76220703125, 3.955078125, 4.14794921875, 4.3408203125, 4.53369140625, 4.7265625, 4.91943359375, 5.1123046875, 5.30517578125, 5.498046875, 5.69091796875, 5.8837890625, 6.07666015625, 6.26953125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 4.0, 12.0, 23.0, 41.0, 61.0, 91.0, 116.0, 132.0, 155.0, 111.0, 98.0, 42.0, 37.0, 26.0, 21.0, 8.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41796875, -2.3128662109375, -2.207763671875, -2.1026611328125, -1.99755859375, -1.8924560546875, -1.787353515625, -1.6822509765625, -1.5771484375, -1.4720458984375, -1.366943359375, -1.2618408203125, -1.15673828125, -1.0516357421875, -0.946533203125, -0.8414306640625, -0.736328125, -0.6312255859375, -0.526123046875, -0.4210205078125, -0.31591796875, -0.2108154296875, -0.105712890625, -0.0006103515625, 0.1044921875, 0.2095947265625, 0.314697265625, 0.4197998046875, 0.52490234375, 0.6300048828125, 0.735107421875, 0.8402099609375, 0.9453125, 1.0504150390625, 1.155517578125, 1.2606201171875, 1.36572265625, 1.4708251953125, 1.575927734375, 1.6810302734375, 1.7861328125, 1.8912353515625, 1.996337890625, 2.1014404296875, 2.20654296875, 2.3116455078125, 2.416748046875, 2.5218505859375, 2.626953125, 2.7320556640625, 2.837158203125, 2.9422607421875, 3.04736328125, 3.1524658203125, 3.257568359375, 3.3626708984375, 3.4677734375, 3.5728759765625, 3.677978515625, 3.7830810546875, 3.88818359375, 3.9932861328125, 4.098388671875, 4.2034912109375, 4.30859375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 7.0, 10.0, 16.0, 42.0, 100.0, 154.0, 216.0, 189.0, 146.0, 77.0, 28.0, 8.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.998624801635742, -30.387989044189453, -28.777353286743164, -27.166717529296875, -25.556081771850586, -23.945446014404297, -22.334808349609375, -20.72417449951172, -19.113536834716797, -17.502901077270508, -15.892265319824219, -14.28162956237793, -12.67099380493164, -11.060357093811035, -9.449721336364746, -7.839085578918457, -6.228450775146484, -4.617815017700195, -3.007179021835327, -1.396543025970459, 0.21409273147583008, 1.8247289657592773, 3.4353647232055664, 5.0460004806518555, 6.6566362380981445, 8.267271995544434, 9.877907752990723, 11.488544464111328, 13.099180221557617, 14.709815979003906, 16.320451736450195, 17.931087493896484, 19.54172134399414, 21.15235710144043, 22.76299285888672, 24.373628616333008, 25.984264373779297, 27.59490203857422, 29.205535888671875, 30.816173553466797, 32.42680740356445, 34.037445068359375, 35.64807891845703, 37.25871658325195, 38.86935043334961, 40.47998809814453, 42.09062194824219, 43.70125961303711, 45.31189727783203, 46.92253494262695, 48.53316879272461, 50.14380645751953, 51.75444030761719, 53.36507797241211, 54.975711822509766, 56.58634948730469, 58.196983337402344, 59.807621002197266, 61.41825485229492, 63.028892517089844, 64.6395263671875, 66.25016021728516, 67.86080169677734, 69.471435546875, 71.08206939697266]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 9.0, 4.0, 2.0, 8.0, 10.0, 8.0, 6.0, 16.0, 19.0, 17.0, 25.0, 29.0, 30.0, 33.0, 27.0, 41.0, 51.0, 45.0, 37.0, 46.0, 44.0, 44.0, 43.0, 47.0, 52.0, 43.0, 30.0, 33.0, 37.0, 20.0, 16.0, 23.0, 12.0, 16.0, 19.0, 12.0, 12.0, 5.0, 6.0, 10.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0], "bins": [-21.228343963623047, -20.62083625793457, -20.013328552246094, -19.405818939208984, -18.798311233520508, -18.19080352783203, -17.583295822143555, -16.975788116455078, -16.36827850341797, -15.760770797729492, -15.1532621383667, -14.545754432678223, -13.93824577331543, -13.330738067626953, -12.723230361938477, -12.115721702575684, -11.508213996887207, -10.90070629119873, -10.293197631835938, -9.685689926147461, -9.078181266784668, -8.470673561096191, -7.863165378570557, -7.255657196044922, -6.648149013519287, -6.040640830993652, -5.433132648468018, -4.825624465942383, -4.218116760253906, -3.6106083393096924, -3.0031003952026367, -2.395592212677002, -1.7880840301513672, -1.1805758476257324, -0.5730677843093872, 0.03444027900695801, 0.6419484615325928, 1.2494566440582275, 1.8569645881652832, 2.464472770690918, 3.0719809532165527, 3.6794891357421875, 4.286997318267822, 4.894505500793457, 5.502013206481934, 6.109521865844727, 6.717029571533203, 7.324537754058838, 7.932045936584473, 8.53955364227295, 9.147062301635742, 9.754570007324219, 10.362078666687012, 10.969586372375488, 11.577095031738281, 12.184602737426758, 12.792110443115234, 13.399618148803711, 14.007126808166504, 14.61463451385498, 15.222143173217773, 15.82965087890625, 16.437158584594727, 17.044666290283203, 17.652175903320312]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 4.0, 9.0, 5.0, 14.0, 13.0, 25.0, 31.0, 58.0, 54.0, 74.0, 113.0, 187.0, 226.0, 365.0, 563.0, 837.0, 1380.0, 2568.0, 6388.0, 26817.0, 4045600.0, 88670.0, 11486.0, 3883.0, 1722.0, 1040.0, 667.0, 442.0, 325.0, 208.0, 131.0, 92.0, 71.0, 53.0, 39.0, 31.0, 17.0, 21.0, 10.0, 7.0, 6.0, 6.0, 3.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.09375, -7.86077880859375, -7.6278076171875, -7.39483642578125, -7.161865234375, -6.92889404296875, -6.6959228515625, -6.46295166015625, -6.22998046875, -5.99700927734375, -5.7640380859375, -5.53106689453125, -5.298095703125, -5.06512451171875, -4.8321533203125, -4.59918212890625, -4.3662109375, -4.13323974609375, -3.9002685546875, -3.66729736328125, -3.434326171875, -3.20135498046875, -2.9683837890625, -2.73541259765625, -2.50244140625, -2.26947021484375, -2.0364990234375, -1.80352783203125, -1.570556640625, -1.33758544921875, -1.1046142578125, -0.87164306640625, -0.638671875, -0.40570068359375, -0.1727294921875, 0.06024169921875, 0.293212890625, 0.52618408203125, 0.7591552734375, 0.99212646484375, 1.22509765625, 1.45806884765625, 1.6910400390625, 1.92401123046875, 2.156982421875, 2.38995361328125, 2.6229248046875, 2.85589599609375, 3.0888671875, 3.32183837890625, 3.5548095703125, 3.78778076171875, 4.020751953125, 4.25372314453125, 4.4866943359375, 4.71966552734375, 4.95263671875, 5.18560791015625, 5.4185791015625, 5.65155029296875, 5.884521484375, 6.11749267578125, 6.3504638671875, 6.58343505859375, 6.81640625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 6.0, 5.0, 9.0, 15.0, 8.0, 16.0, 17.0, 21.0, 27.0, 26.0, 36.0, 38.0, 44.0, 45.0, 46.0, 52.0, 53.0, 43.0, 52.0, 52.0, 49.0, 39.0, 55.0, 40.0, 31.0, 25.0, 30.0, 25.0, 18.0, 21.0, 5.0, 12.0, 7.0, 11.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1767578125, -1.141571044921875, -1.10638427734375, -1.071197509765625, -1.0360107421875, -1.000823974609375, -0.96563720703125, -0.930450439453125, -0.895263671875, -0.860076904296875, -0.82489013671875, -0.789703369140625, -0.7545166015625, -0.719329833984375, -0.68414306640625, -0.648956298828125, -0.61376953125, -0.578582763671875, -0.54339599609375, -0.508209228515625, -0.4730224609375, -0.437835693359375, -0.40264892578125, -0.367462158203125, -0.332275390625, -0.297088623046875, -0.26190185546875, -0.226715087890625, -0.1915283203125, -0.156341552734375, -0.12115478515625, -0.085968017578125, -0.05078125, -0.015594482421875, 0.01959228515625, 0.054779052734375, 0.0899658203125, 0.125152587890625, 0.16033935546875, 0.195526123046875, 0.230712890625, 0.265899658203125, 0.30108642578125, 0.336273193359375, 0.3714599609375, 0.406646728515625, 0.44183349609375, 0.477020263671875, 0.51220703125, 0.547393798828125, 0.58258056640625, 0.617767333984375, 0.6529541015625, 0.688140869140625, 0.72332763671875, 0.758514404296875, 0.793701171875, 0.828887939453125, 0.86407470703125, 0.899261474609375, 0.9344482421875, 0.969635009765625, 1.00482177734375, 1.040008544921875, 1.0751953125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 10.0, 15.0, 19.0, 34.0, 44.0, 46.0, 64.0, 108.0, 124.0, 202.0, 270.0, 477.0, 656.0, 997.0, 1626.0, 2714.0, 4854.0, 10669.0, 34460.0, 3882871.0, 212630.0, 22695.0, 8196.0, 4106.0, 2282.0, 1339.0, 912.0, 561.0, 410.0, 282.0, 188.0, 126.0, 91.0, 50.0, 41.0, 34.0, 16.0, 19.0, 14.0, 8.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.15625, -5.00830078125, -4.8603515625, -4.71240234375, -4.564453125, -4.41650390625, -4.2685546875, -4.12060546875, -3.97265625, -3.82470703125, -3.6767578125, -3.52880859375, -3.380859375, -3.23291015625, -3.0849609375, -2.93701171875, -2.7890625, -2.64111328125, -2.4931640625, -2.34521484375, -2.197265625, -2.04931640625, -1.9013671875, -1.75341796875, -1.60546875, -1.45751953125, -1.3095703125, -1.16162109375, -1.013671875, -0.86572265625, -0.7177734375, -0.56982421875, -0.421875, -0.27392578125, -0.1259765625, 0.02197265625, 0.169921875, 0.31787109375, 0.4658203125, 0.61376953125, 0.76171875, 0.90966796875, 1.0576171875, 1.20556640625, 1.353515625, 1.50146484375, 1.6494140625, 1.79736328125, 1.9453125, 2.09326171875, 2.2412109375, 2.38916015625, 2.537109375, 2.68505859375, 2.8330078125, 2.98095703125, 3.12890625, 3.27685546875, 3.4248046875, 3.57275390625, 3.720703125, 3.86865234375, 4.0166015625, 4.16455078125, 4.3125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 8.0, 9.0, 15.0, 22.0, 64.0, 146.0, 3379.0, 250.0, 63.0, 26.0, 20.0, 8.0, 11.0, 2.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1796875, -1.1446990966796875, -1.109710693359375, -1.0747222900390625, -1.03973388671875, -1.0047454833984375, -0.969757080078125, -0.9347686767578125, -0.8997802734375, -0.8647918701171875, -0.829803466796875, -0.7948150634765625, -0.75982666015625, -0.7248382568359375, -0.689849853515625, -0.6548614501953125, -0.619873046875, -0.5848846435546875, -0.549896240234375, -0.5149078369140625, -0.47991943359375, -0.4449310302734375, -0.409942626953125, -0.3749542236328125, -0.3399658203125, -0.3049774169921875, -0.269989013671875, -0.2350006103515625, -0.20001220703125, -0.1650238037109375, -0.130035400390625, -0.0950469970703125, -0.06005859375, -0.0250701904296875, 0.009918212890625, 0.0449066162109375, 0.07989501953125, 0.1148834228515625, 0.149871826171875, 0.1848602294921875, 0.2198486328125, 0.2548370361328125, 0.289825439453125, 0.3248138427734375, 0.35980224609375, 0.3947906494140625, 0.429779052734375, 0.4647674560546875, 0.499755859375, 0.5347442626953125, 0.569732666015625, 0.6047210693359375, 0.63970947265625, 0.6746978759765625, 0.709686279296875, 0.7446746826171875, 0.7796630859375, 0.8146514892578125, 0.849639892578125, 0.8846282958984375, 0.91961669921875, 0.9546051025390625, 0.989593505859375, 1.0245819091796875, 1.0595703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 12.0, 26.0, 40.0, 79.0, 120.0, 151.0, 189.0, 171.0, 89.0, 63.0, 31.0, 14.0, 10.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-11.44223403930664, -11.214584350585938, -10.986934661865234, -10.759284973144531, -10.531635284423828, -10.303985595703125, -10.076335906982422, -9.848686218261719, -9.621036529541016, -9.393386840820312, -9.16573715209961, -8.938087463378906, -8.710437774658203, -8.4827880859375, -8.255138397216797, -8.027488708496094, -7.799838066101074, -7.572188377380371, -7.344538688659668, -7.116888999938965, -6.889239311218262, -6.661589622497559, -6.433939456939697, -6.206289768218994, -5.978640079498291, -5.750990390777588, -5.523340702056885, -5.295691013336182, -5.06804084777832, -4.840391159057617, -4.612741470336914, -4.385091781616211, -4.157442092895508, -3.9297924041748047, -3.7021427154541016, -3.4744927883148193, -3.246843099594116, -3.019193410873413, -2.791543483734131, -2.5638937950134277, -2.3362441062927246, -2.1085944175720215, -1.8809446096420288, -1.6532948017120361, -1.425645112991333, -1.1979954242706299, -0.9703456163406372, -0.7426958084106445, -0.5150461196899414, -0.2873963713645935, -0.059746623039245605, 0.1679031252861023, 0.3955528736114502, 0.6232025623321533, 0.850852370262146, 1.0785021781921387, 1.3061518669128418, 1.533801555633545, 1.7614513635635376, 1.9891011714935303, 2.2167508602142334, 2.4444005489349365, 2.6720504760742188, 2.899700164794922, 3.127349853515625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 6.0, 1.0, 5.0, 6.0, 9.0, 9.0, 6.0, 17.0, 14.0, 13.0, 20.0, 21.0, 33.0, 32.0, 29.0, 28.0, 29.0, 39.0, 46.0, 62.0, 46.0, 55.0, 41.0, 51.0, 41.0, 33.0, 40.0, 29.0, 33.0, 30.0, 27.0, 29.0, 22.0, 19.0, 14.0, 12.0, 14.0, 11.0, 10.0, 5.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2060015201568604, -2.131774425506592, -2.0575475692749023, -1.9833204746246338, -1.9090934991836548, -1.8348665237426758, -1.7606394290924072, -1.6864124536514282, -1.6121854782104492, -1.5379585027694702, -1.4637315273284912, -1.3895044326782227, -1.3152774572372437, -1.2410504817962646, -1.166823387145996, -1.092596411705017, -1.018369436264038, -0.9441424608230591, -0.8699154257774353, -0.7956883907318115, -0.7214614152908325, -0.6472344398498535, -0.5730074048042297, -0.49878036975860596, -0.42455339431762695, -0.35032638907432556, -0.27609938383102417, -0.20187237858772278, -0.1276453733444214, -0.053418368101119995, 0.020808637142181396, 0.09503567218780518, 0.16926240921020508, 0.24348941445350647, 0.31771641969680786, 0.39194342494010925, 0.46617043018341064, 0.5403974056243896, 0.6146244406700134, 0.6888514757156372, 0.7630784511566162, 0.8373054265975952, 0.911532461643219, 0.9857594966888428, 1.0599864721298218, 1.1342134475708008, 1.2084405422210693, 1.2826675176620483, 1.3568944931030273, 1.4311214685440063, 1.5053484439849854, 1.579575538635254, 1.653802514076233, 1.728029489517212, 1.8022565841674805, 1.8764835596084595, 1.9507105350494385, 2.024937629699707, 2.0991644859313965, 2.173391580581665, 2.2476186752319336, 2.321845531463623, 2.3960726261138916, 2.47029972076416, 2.5445265769958496]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 7.0, 1.0, 2.0, 6.0, 9.0, 7.0, 7.0, 10.0, 24.0, 28.0, 41.0, 83.0, 123.0, 192.0, 434.0, 1030.0, 3065.0, 11161.0, 47959.0, 222451.0, 508720.0, 196301.0, 42307.0, 9876.0, 2818.0, 969.0, 408.0, 206.0, 101.0, 73.0, 30.0, 30.0, 19.0, 13.0, 18.0, 13.0, 7.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9375, -4.798248291015625, -4.65899658203125, -4.519744873046875, -4.3804931640625, -4.241241455078125, -4.10198974609375, -3.962738037109375, -3.823486328125, -3.684234619140625, -3.54498291015625, -3.405731201171875, -3.2664794921875, -3.127227783203125, -2.98797607421875, -2.848724365234375, -2.70947265625, -2.570220947265625, -2.43096923828125, -2.291717529296875, -2.1524658203125, -2.013214111328125, -1.87396240234375, -1.734710693359375, -1.595458984375, -1.456207275390625, -1.31695556640625, -1.177703857421875, -1.0384521484375, -0.899200439453125, -0.75994873046875, -0.620697021484375, -0.4814453125, -0.342193603515625, -0.20294189453125, -0.063690185546875, 0.0755615234375, 0.214813232421875, 0.35406494140625, 0.493316650390625, 0.632568359375, 0.771820068359375, 0.91107177734375, 1.050323486328125, 1.1895751953125, 1.328826904296875, 1.46807861328125, 1.607330322265625, 1.74658203125, 1.885833740234375, 2.02508544921875, 2.164337158203125, 2.3035888671875, 2.442840576171875, 2.58209228515625, 2.721343994140625, 2.860595703125, 2.999847412109375, 3.13909912109375, 3.278350830078125, 3.4176025390625, 3.556854248046875, 3.69610595703125, 3.835357666015625, 3.974609375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 3.0, 7.0, 8.0, 7.0, 10.0, 9.0, 14.0, 15.0, 25.0, 22.0, 26.0, 33.0, 34.0, 32.0, 33.0, 41.0, 50.0, 46.0, 42.0, 40.0, 38.0, 40.0, 50.0, 51.0, 43.0, 39.0, 37.0, 28.0, 30.0, 22.0, 16.0, 18.0, 16.0, 17.0, 16.0, 12.0, 8.0, 9.0, 3.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1142578125, -1.080352783203125, -1.04644775390625, -1.012542724609375, -0.9786376953125, -0.944732666015625, -0.91082763671875, -0.876922607421875, -0.843017578125, -0.809112548828125, -0.77520751953125, -0.741302490234375, -0.7073974609375, -0.673492431640625, -0.63958740234375, -0.605682373046875, -0.57177734375, -0.537872314453125, -0.50396728515625, -0.470062255859375, -0.4361572265625, -0.402252197265625, -0.36834716796875, -0.334442138671875, -0.300537109375, -0.266632080078125, -0.23272705078125, -0.198822021484375, -0.1649169921875, -0.131011962890625, -0.09710693359375, -0.063201904296875, -0.029296875, 0.004608154296875, 0.03851318359375, 0.072418212890625, 0.1063232421875, 0.140228271484375, 0.17413330078125, 0.208038330078125, 0.241943359375, 0.275848388671875, 0.30975341796875, 0.343658447265625, 0.3775634765625, 0.411468505859375, 0.44537353515625, 0.479278564453125, 0.51318359375, 0.547088623046875, 0.58099365234375, 0.614898681640625, 0.6488037109375, 0.682708740234375, 0.71661376953125, 0.750518798828125, 0.784423828125, 0.818328857421875, 0.85223388671875, 0.886138916015625, 0.9200439453125, 0.953948974609375, 0.98785400390625, 1.021759033203125, 1.0556640625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 6.0, 6.0, 9.0, 7.0, 11.0, 29.0, 43.0, 57.0, 79.0, 146.0, 228.0, 352.0, 619.0, 999.0, 2454.0, 11699.0, 188197.0, 782042.0, 52263.0, 5564.0, 1670.0, 787.0, 481.0, 304.0, 198.0, 109.0, 80.0, 52.0, 25.0, 22.0, 5.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.875, -8.64324951171875, -8.4114990234375, -8.17974853515625, -7.947998046875, -7.71624755859375, -7.4844970703125, -7.25274658203125, -7.02099609375, -6.78924560546875, -6.5574951171875, -6.32574462890625, -6.093994140625, -5.86224365234375, -5.6304931640625, -5.39874267578125, -5.1669921875, -4.93524169921875, -4.7034912109375, -4.47174072265625, -4.239990234375, -4.00823974609375, -3.7764892578125, -3.54473876953125, -3.31298828125, -3.08123779296875, -2.8494873046875, -2.61773681640625, -2.385986328125, -2.15423583984375, -1.9224853515625, -1.69073486328125, -1.458984375, -1.22723388671875, -0.9954833984375, -0.76373291015625, -0.531982421875, -0.30023193359375, -0.0684814453125, 0.16326904296875, 0.39501953125, 0.62677001953125, 0.8585205078125, 1.09027099609375, 1.322021484375, 1.55377197265625, 1.7855224609375, 2.01727294921875, 2.2490234375, 2.48077392578125, 2.7125244140625, 2.94427490234375, 3.176025390625, 3.40777587890625, 3.6395263671875, 3.87127685546875, 4.10302734375, 4.33477783203125, 4.5665283203125, 4.79827880859375, 5.030029296875, 5.26177978515625, 5.4935302734375, 5.72528076171875, 5.95703125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 9.0, 4.0, 10.0, 2.0, 9.0, 8.0, 9.0, 13.0, 23.0, 22.0, 24.0, 35.0, 39.0, 37.0, 40.0, 35.0, 43.0, 52.0, 38.0, 49.0, 49.0, 49.0, 56.0, 38.0, 39.0, 41.0, 32.0, 32.0, 29.0, 21.0, 27.0, 20.0, 17.0, 12.0, 9.0, 10.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.21875, -5.05987548828125, -4.9010009765625, -4.74212646484375, -4.583251953125, -4.42437744140625, -4.2655029296875, -4.10662841796875, -3.94775390625, -3.78887939453125, -3.6300048828125, -3.47113037109375, -3.312255859375, -3.15338134765625, -2.9945068359375, -2.83563232421875, -2.6767578125, -2.51788330078125, -2.3590087890625, -2.20013427734375, -2.041259765625, -1.88238525390625, -1.7235107421875, -1.56463623046875, -1.40576171875, -1.24688720703125, -1.0880126953125, -0.92913818359375, -0.770263671875, -0.61138916015625, -0.4525146484375, -0.29364013671875, -0.134765625, 0.02410888671875, 0.1829833984375, 0.34185791015625, 0.500732421875, 0.65960693359375, 0.8184814453125, 0.97735595703125, 1.13623046875, 1.29510498046875, 1.4539794921875, 1.61285400390625, 1.771728515625, 1.93060302734375, 2.0894775390625, 2.24835205078125, 2.4072265625, 2.56610107421875, 2.7249755859375, 2.88385009765625, 3.042724609375, 3.20159912109375, 3.3604736328125, 3.51934814453125, 3.67822265625, 3.83709716796875, 3.9959716796875, 4.15484619140625, 4.313720703125, 4.47259521484375, 4.6314697265625, 4.79034423828125, 4.94921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 7.0, 7.0, 19.0, 24.0, 20.0, 24.0, 37.0, 44.0, 75.0, 102.0, 156.0, 287.0, 580.0, 1765.0, 9214.0, 125510.0, 847694.0, 54967.0, 5576.0, 1222.0, 491.0, 240.0, 136.0, 81.0, 74.0, 53.0, 23.0, 26.0, 20.0, 22.0, 8.0, 5.0, 9.0, 8.0, 4.0, 7.0, 0.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.46875, -4.3262939453125, -4.183837890625, -4.0413818359375, -3.89892578125, -3.7564697265625, -3.614013671875, -3.4715576171875, -3.3291015625, -3.1866455078125, -3.044189453125, -2.9017333984375, -2.75927734375, -2.6168212890625, -2.474365234375, -2.3319091796875, -2.189453125, -2.0469970703125, -1.904541015625, -1.7620849609375, -1.61962890625, -1.4771728515625, -1.334716796875, -1.1922607421875, -1.0498046875, -0.9073486328125, -0.764892578125, -0.6224365234375, -0.47998046875, -0.3375244140625, -0.195068359375, -0.0526123046875, 0.08984375, 0.2322998046875, 0.374755859375, 0.5172119140625, 0.65966796875, 0.8021240234375, 0.944580078125, 1.0870361328125, 1.2294921875, 1.3719482421875, 1.514404296875, 1.6568603515625, 1.79931640625, 1.9417724609375, 2.084228515625, 2.2266845703125, 2.369140625, 2.5115966796875, 2.654052734375, 2.7965087890625, 2.93896484375, 3.0814208984375, 3.223876953125, 3.3663330078125, 3.5087890625, 3.6512451171875, 3.793701171875, 3.9361572265625, 4.07861328125, 4.2210693359375, 4.363525390625, 4.5059814453125, 4.6484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 3.0, 6.0, 9.0, 8.0, 26.0, 26.0, 28.0, 39.0, 47.0, 64.0, 83.0, 123.0, 123.0, 108.0, 74.0, 60.0, 37.0, 27.0, 23.0, 14.0, 13.0, 13.0, 10.0, 8.0, 6.0, 3.0, 1.0, 7.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0004513263702392578, -0.0004377886652946472, -0.0004242509603500366, -0.000410713255405426, -0.00039717555046081543, -0.00038363784551620483, -0.00037010014057159424, -0.00035656243562698364, -0.00034302473068237305, -0.00032948702573776245, -0.00031594932079315186, -0.00030241161584854126, -0.00028887391090393066, -0.00027533620595932007, -0.00026179850101470947, -0.0002482607960700989, -0.00023472309112548828, -0.00022118538618087769, -0.0002076476812362671, -0.0001941099762916565, -0.0001805722713470459, -0.0001670345664024353, -0.0001534968614578247, -0.0001399591565132141, -0.00012642145156860352, -0.00011288374662399292, -9.934604167938232e-05, -8.580833673477173e-05, -7.227063179016113e-05, -5.873292684555054e-05, -4.519522190093994e-05, -3.1657516956329346e-05, -1.811981201171875e-05, -4.582107067108154e-06, 8.955597877502441e-06, 2.2493302822113037e-05, 3.603100776672363e-05, 4.956871271133423e-05, 6.310641765594482e-05, 7.664412260055542e-05, 9.018182754516602e-05, 0.00010371953248977661, 0.00011725723743438721, 0.0001307949423789978, 0.0001443326473236084, 0.000157870352268219, 0.0001714080572128296, 0.00018494576215744019, 0.00019848346710205078, 0.00021202117204666138, 0.00022555887699127197, 0.00023909658193588257, 0.00025263428688049316, 0.00026617199182510376, 0.00027970969676971436, 0.00029324740171432495, 0.00030678510665893555, 0.00032032281160354614, 0.00033386051654815674, 0.00034739822149276733, 0.00036093592643737793, 0.0003744736313819885, 0.0003880113363265991, 0.0004015490412712097, 0.0004150867462158203]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 9.0, 11.0, 14.0, 26.0, 37.0, 46.0, 74.0, 129.0, 177.0, 297.0, 501.0, 1012.0, 2383.0, 7918.0, 46797.0, 561104.0, 383969.0, 33690.0, 6215.0, 1981.0, 891.0, 521.0, 243.0, 157.0, 104.0, 76.0, 38.0, 40.0, 17.0, 9.0, 18.0, 5.0, 4.0, 3.0, 3.0, 5.0, 3.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.36328125, -3.2545166015625, -3.145751953125, -3.0369873046875, -2.92822265625, -2.8194580078125, -2.710693359375, -2.6019287109375, -2.4931640625, -2.3843994140625, -2.275634765625, -2.1668701171875, -2.05810546875, -1.9493408203125, -1.840576171875, -1.7318115234375, -1.623046875, -1.5142822265625, -1.405517578125, -1.2967529296875, -1.18798828125, -1.0792236328125, -0.970458984375, -0.8616943359375, -0.7529296875, -0.6441650390625, -0.535400390625, -0.4266357421875, -0.31787109375, -0.2091064453125, -0.100341796875, 0.0084228515625, 0.1171875, 0.2259521484375, 0.334716796875, 0.4434814453125, 0.55224609375, 0.6610107421875, 0.769775390625, 0.8785400390625, 0.9873046875, 1.0960693359375, 1.204833984375, 1.3135986328125, 1.42236328125, 1.5311279296875, 1.639892578125, 1.7486572265625, 1.857421875, 1.9661865234375, 2.074951171875, 2.1837158203125, 2.29248046875, 2.4012451171875, 2.510009765625, 2.6187744140625, 2.7275390625, 2.8363037109375, 2.945068359375, 3.0538330078125, 3.16259765625, 3.2713623046875, 3.380126953125, 3.4888916015625, 3.59765625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 6.0, 10.0, 12.0, 14.0, 24.0, 26.0, 32.0, 52.0, 60.0, 112.0, 120.0, 104.0, 101.0, 88.0, 70.0, 47.0, 33.0, 31.0, 15.0, 9.0, 10.0, 6.0, 4.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.056640625, -1.964080810546875, -1.87152099609375, -1.778961181640625, -1.6864013671875, -1.593841552734375, -1.50128173828125, -1.408721923828125, -1.316162109375, -1.223602294921875, -1.13104248046875, -1.038482666015625, -0.9459228515625, -0.853363037109375, -0.76080322265625, -0.668243408203125, -0.57568359375, -0.483123779296875, -0.39056396484375, -0.298004150390625, -0.2054443359375, -0.112884521484375, -0.02032470703125, 0.072235107421875, 0.164794921875, 0.257354736328125, 0.34991455078125, 0.442474365234375, 0.5350341796875, 0.627593994140625, 0.72015380859375, 0.812713623046875, 0.9052734375, 0.997833251953125, 1.09039306640625, 1.182952880859375, 1.2755126953125, 1.368072509765625, 1.46063232421875, 1.553192138671875, 1.645751953125, 1.738311767578125, 1.83087158203125, 1.923431396484375, 2.0159912109375, 2.108551025390625, 2.20111083984375, 2.293670654296875, 2.38623046875, 2.478790283203125, 2.57135009765625, 2.663909912109375, 2.7564697265625, 2.849029541015625, 2.94158935546875, 3.034149169921875, 3.126708984375, 3.219268798828125, 3.31182861328125, 3.404388427734375, 3.4969482421875, 3.589508056640625, 3.68206787109375, 3.774627685546875, 3.8671875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 11.0, 33.0, 132.0, 256.0, 317.0, 172.0, 51.0, 13.0, 7.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.981239318847656, -50.22185134887695, -47.462459564208984, -44.70307159423828, -41.94367980957031, -39.18429183959961, -36.424903869628906, -33.66551208496094, -30.906124114990234, -28.1467342376709, -25.387344360351562, -22.62795639038086, -19.868566513061523, -17.109176635742188, -14.349788665771484, -11.590398788452148, -8.831008911132812, -6.071619510650635, -3.312230110168457, -0.5528411865234375, 2.2065486907958984, 4.965938568115234, 7.7253265380859375, 10.484716415405273, 13.24410629272461, 16.003496170043945, 18.76288604736328, 21.522274017333984, 24.28166389465332, 27.041053771972656, 29.80044174194336, 32.55982971191406, 35.31922149658203, 38.078609466552734, 40.8380012512207, 43.597389221191406, 46.356781005859375, 49.11616897583008, 51.87555694580078, 54.63494873046875, 57.39433670043945, 60.153724670410156, 62.913116455078125, 65.67250061035156, 68.43189239501953, 71.1912841796875, 73.95066833496094, 76.7100601196289, 79.46945190429688, 82.22884368896484, 84.98822784423828, 87.74761962890625, 90.50701141357422, 93.26640319824219, 96.02578735351562, 98.7851791381836, 101.54457092285156, 104.30396270751953, 107.06334686279297, 109.82273864746094, 112.5821304321289, 115.34152221679688, 118.10090637207031, 120.86029815673828, 123.61968231201172]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 11.0, 8.0, 17.0, 13.0, 10.0, 9.0, 19.0, 12.0, 26.0, 20.0, 22.0, 35.0, 37.0, 30.0, 38.0, 45.0, 42.0, 34.0, 44.0, 46.0, 52.0, 39.0, 47.0, 39.0, 23.0, 28.0, 28.0, 23.0, 25.0, 26.0, 28.0, 13.0, 13.0, 15.0, 12.0, 13.0, 15.0, 8.0, 9.0, 2.0, 6.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-22.928943634033203, -22.27569007873535, -21.6224365234375, -20.969181060791016, -20.315927505493164, -19.662673950195312, -19.009418487548828, -18.356164932250977, -17.702911376953125, -17.049657821655273, -16.396404266357422, -15.743148803710938, -15.089895248413086, -14.436641693115234, -13.783387184143066, -13.130132675170898, -12.476879119873047, -11.823625564575195, -11.170371055603027, -10.51711654663086, -9.863862991333008, -9.210609436035156, -8.557354927062988, -7.9041008949279785, -7.250846862792969, -6.597592830657959, -5.944338798522949, -5.2910847663879395, -4.63783073425293, -3.98457670211792, -3.33132266998291, -2.6780686378479004, -2.0248146057128906, -1.3715605735778809, -0.7183065414428711, -0.06505250930786133, 0.5882015228271484, 1.2414555549621582, 1.894709587097168, 2.5479636192321777, 3.2012176513671875, 3.8544716835021973, 4.507725715637207, 5.160979747772217, 5.814233779907227, 6.467487812042236, 7.120741844177246, 7.773995876312256, 8.427249908447266, 9.080503463745117, 9.733757972717285, 10.387012481689453, 11.040266036987305, 11.693519592285156, 12.346774101257324, 13.000028610229492, 13.653282165527344, 14.306535720825195, 14.959790229797363, 15.613044738769531, 16.266298294067383, 16.919551849365234, 17.57280731201172, 18.22606086730957, 18.879314422607422]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 9.0, 10.0, 13.0, 19.0, 21.0, 31.0, 46.0, 70.0, 65.0, 116.0, 174.0, 255.0, 359.0, 570.0, 888.0, 1474.0, 2514.0, 4841.0, 11158.0, 35015.0, 376870.0, 3685841.0, 47475.0, 13480.0, 5474.0, 2863.0, 1647.0, 967.0, 666.0, 410.0, 275.0, 206.0, 119.0, 93.0, 65.0, 34.0, 32.0, 22.0, 25.0, 19.0, 13.0, 6.0, 6.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.3046875, -4.16168212890625, -4.0186767578125, -3.87567138671875, -3.732666015625, -3.58966064453125, -3.4466552734375, -3.30364990234375, -3.16064453125, -3.01763916015625, -2.8746337890625, -2.73162841796875, -2.588623046875, -2.44561767578125, -2.3026123046875, -2.15960693359375, -2.0166015625, -1.87359619140625, -1.7305908203125, -1.58758544921875, -1.444580078125, -1.30157470703125, -1.1585693359375, -1.01556396484375, -0.87255859375, -0.72955322265625, -0.5865478515625, -0.44354248046875, -0.300537109375, -0.15753173828125, -0.0145263671875, 0.12847900390625, 0.271484375, 0.41448974609375, 0.5574951171875, 0.70050048828125, 0.843505859375, 0.98651123046875, 1.1295166015625, 1.27252197265625, 1.41552734375, 1.55853271484375, 1.7015380859375, 1.84454345703125, 1.987548828125, 2.13055419921875, 2.2735595703125, 2.41656494140625, 2.5595703125, 2.70257568359375, 2.8455810546875, 2.98858642578125, 3.131591796875, 3.27459716796875, 3.4176025390625, 3.56060791015625, 3.70361328125, 3.84661865234375, 3.9896240234375, 4.13262939453125, 4.275634765625, 4.41864013671875, 4.5616455078125, 4.70465087890625, 4.84765625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 8.0, 4.0, 12.0, 8.0, 10.0, 15.0, 16.0, 32.0, 40.0, 41.0, 44.0, 56.0, 60.0, 56.0, 72.0, 76.0, 89.0, 57.0, 61.0, 47.0, 50.0, 39.0, 21.0, 27.0, 15.0, 13.0, 9.0, 13.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.642578125, -1.5931549072265625, -1.543731689453125, -1.4943084716796875, -1.44488525390625, -1.3954620361328125, -1.346038818359375, -1.2966156005859375, -1.2471923828125, -1.1977691650390625, -1.148345947265625, -1.0989227294921875, -1.04949951171875, -1.0000762939453125, -0.950653076171875, -0.9012298583984375, -0.851806640625, -0.8023834228515625, -0.752960205078125, -0.7035369873046875, -0.65411376953125, -0.6046905517578125, -0.555267333984375, -0.5058441162109375, -0.4564208984375, -0.4069976806640625, -0.357574462890625, -0.3081512451171875, -0.25872802734375, -0.2093048095703125, -0.159881591796875, -0.1104583740234375, -0.06103515625, -0.0116119384765625, 0.037811279296875, 0.0872344970703125, 0.13665771484375, 0.1860809326171875, 0.235504150390625, 0.2849273681640625, 0.3343505859375, 0.3837738037109375, 0.433197021484375, 0.4826202392578125, 0.53204345703125, 0.5814666748046875, 0.630889892578125, 0.6803131103515625, 0.729736328125, 0.7791595458984375, 0.828582763671875, 0.8780059814453125, 0.92742919921875, 0.9768524169921875, 1.026275634765625, 1.0756988525390625, 1.1251220703125, 1.1745452880859375, 1.223968505859375, 1.2733917236328125, 1.32281494140625, 1.3722381591796875, 1.421661376953125, 1.4710845947265625, 1.5205078125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 9.0, 9.0, 11.0, 17.0, 23.0, 28.0, 30.0, 56.0, 72.0, 98.0, 142.0, 199.0, 319.0, 470.0, 728.0, 1223.0, 2029.0, 3717.0, 6797.0, 14681.0, 39620.0, 237176.0, 3743246.0, 94353.0, 25854.0, 10536.0, 5365.0, 2865.0, 1650.0, 1025.0, 628.0, 421.0, 251.0, 189.0, 132.0, 80.0, 54.0, 40.0, 27.0, 30.0, 14.0, 11.0, 13.0, 12.0, 9.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-3.318359375, -3.21234130859375, -3.1063232421875, -3.00030517578125, -2.894287109375, -2.78826904296875, -2.6822509765625, -2.57623291015625, -2.47021484375, -2.36419677734375, -2.2581787109375, -2.15216064453125, -2.046142578125, -1.94012451171875, -1.8341064453125, -1.72808837890625, -1.6220703125, -1.51605224609375, -1.4100341796875, -1.30401611328125, -1.197998046875, -1.09197998046875, -0.9859619140625, -0.87994384765625, -0.77392578125, -0.66790771484375, -0.5618896484375, -0.45587158203125, -0.349853515625, -0.24383544921875, -0.1378173828125, -0.03179931640625, 0.07421875, 0.18023681640625, 0.2862548828125, 0.39227294921875, 0.498291015625, 0.60430908203125, 0.7103271484375, 0.81634521484375, 0.92236328125, 1.02838134765625, 1.1343994140625, 1.24041748046875, 1.346435546875, 1.45245361328125, 1.5584716796875, 1.66448974609375, 1.7705078125, 1.87652587890625, 1.9825439453125, 2.08856201171875, 2.194580078125, 2.30059814453125, 2.4066162109375, 2.51263427734375, 2.61865234375, 2.72467041015625, 2.8306884765625, 2.93670654296875, 3.042724609375, 3.14874267578125, 3.2547607421875, 3.36077880859375, 3.466796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 7.0, 3.0, 9.0, 9.0, 14.0, 15.0, 26.0, 28.0, 56.0, 94.0, 248.0, 2852.0, 360.0, 144.0, 59.0, 29.0, 25.0, 21.0, 10.0, 13.0, 11.0, 8.0, 7.0, 5.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6748046875, -1.62347412109375, -1.5721435546875, -1.52081298828125, -1.469482421875, -1.41815185546875, -1.3668212890625, -1.31549072265625, -1.26416015625, -1.21282958984375, -1.1614990234375, -1.11016845703125, -1.058837890625, -1.00750732421875, -0.9561767578125, -0.90484619140625, -0.853515625, -0.80218505859375, -0.7508544921875, -0.69952392578125, -0.648193359375, -0.59686279296875, -0.5455322265625, -0.49420166015625, -0.44287109375, -0.39154052734375, -0.3402099609375, -0.28887939453125, -0.237548828125, -0.18621826171875, -0.1348876953125, -0.08355712890625, -0.0322265625, 0.01910400390625, 0.0704345703125, 0.12176513671875, 0.173095703125, 0.22442626953125, 0.2757568359375, 0.32708740234375, 0.37841796875, 0.42974853515625, 0.4810791015625, 0.53240966796875, 0.583740234375, 0.63507080078125, 0.6864013671875, 0.73773193359375, 0.7890625, 0.84039306640625, 0.8917236328125, 0.94305419921875, 0.994384765625, 1.04571533203125, 1.0970458984375, 1.14837646484375, 1.19970703125, 1.25103759765625, 1.3023681640625, 1.35369873046875, 1.405029296875, 1.45635986328125, 1.5076904296875, 1.55902099609375, 1.6103515625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 10.0, 14.0, 13.0, 22.0, 23.0, 50.0, 53.0, 81.0, 102.0, 98.0, 123.0, 79.0, 68.0, 63.0, 45.0, 47.0, 28.0, 17.0, 13.0, 16.0, 10.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.317131042480469, -6.099594593048096, -5.882058620452881, -5.664522171020508, -5.446985721588135, -5.229449272155762, -5.011913299560547, -4.794376850128174, -4.576840400695801, -4.359303951263428, -4.141767978668213, -3.92423152923584, -3.706695079803467, -3.489158868789673, -3.271622657775879, -3.054086208343506, -2.836549997329712, -2.619013786315918, -2.401477336883545, -2.183941125869751, -1.966404676437378, -1.748868465423584, -1.5313321352005005, -1.313795804977417, -1.0962594747543335, -0.87872314453125, -0.6611868143081665, -0.4436505436897278, -0.2261142134666443, -0.008577942848205566, 0.20895838737487793, 0.4264947175979614, 0.6440310478210449, 0.8615673780441284, 1.079103708267212, 1.2966399192810059, 1.514176368713379, 1.7317125797271729, 1.9492489099502563, 2.16678524017334, 2.384321689605713, 2.601857900619507, 2.81939435005188, 3.036930561065674, 3.254467010498047, 3.472003221511841, 3.6895394325256348, 3.907075881958008, 4.124611854553223, 4.342148303985596, 4.5596842765808105, 4.777220726013184, 4.994757175445557, 5.21229362487793, 5.4298295974731445, 5.647366046905518, 5.864902496337891, 6.082438945770264, 6.2999749183654785, 6.517511367797852, 6.735047817230225, 6.952584266662598, 7.1701202392578125, 7.3876566886901855, 7.605193138122559]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 7.0, 2.0, 5.0, 6.0, 10.0, 11.0, 17.0, 26.0, 15.0, 23.0, 25.0, 33.0, 31.0, 46.0, 42.0, 38.0, 39.0, 46.0, 51.0, 54.0, 39.0, 36.0, 47.0, 43.0, 26.0, 39.0, 37.0, 31.0, 40.0, 20.0, 25.0, 24.0, 14.0, 11.0, 7.0, 8.0, 7.0, 2.0, 8.0, 3.0, 4.0, 2.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.618462562561035, -4.480080604553223, -4.341698169708252, -4.2033162117004395, -4.064933776855469, -3.9265518188476562, -3.7881698608398438, -3.649787664413452, -3.5114054679870605, -3.373023271560669, -3.2346410751342773, -3.096259117126465, -2.9578769207000732, -2.8194947242736816, -2.681112766265869, -2.5427305698394775, -2.404348373413086, -2.2659661769866943, -2.1275839805603027, -1.9892020225524902, -1.8508198261260986, -1.712437629699707, -1.574055552482605, -1.435673475265503, -1.2972912788391113, -1.1589090824127197, -1.0205270051956177, -0.8821448683738708, -0.743762731552124, -0.6053805947303772, -0.46699845790863037, -0.32861632108688354, -0.19023466110229492, -0.051852524280548096, 0.08652961254119873, 0.22491174936294556, 0.3632938861846924, 0.5016760230064392, 0.640058159828186, 0.7784402966499329, 0.9168224334716797, 1.0552046298980713, 1.1935867071151733, 1.3319687843322754, 1.470350980758667, 1.6087331771850586, 1.7471152544021606, 1.8854973316192627, 2.0238795280456543, 2.162261724472046, 2.3006439208984375, 2.43902587890625, 2.5774080753326416, 2.715790271759033, 2.8541722297668457, 2.9925544261932373, 3.130936622619629, 3.2693188190460205, 3.407701015472412, 3.5460829734802246, 3.684465169906616, 3.822847366333008, 3.9612293243408203, 4.099611759185791, 4.2379937171936035]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 11.0, 9.0, 15.0, 20.0, 20.0, 47.0, 58.0, 96.0, 165.0, 360.0, 578.0, 1136.0, 2419.0, 5618.0, 14408.0, 41607.0, 124600.0, 343318.0, 331931.0, 118411.0, 39637.0, 13982.0, 5386.0, 2362.0, 1063.0, 558.0, 274.0, 197.0, 99.0, 52.0, 47.0, 23.0, 16.0, 6.0, 14.0, 5.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1875, -4.067779541015625, -3.94805908203125, -3.828338623046875, -3.7086181640625, -3.588897705078125, -3.46917724609375, -3.349456787109375, -3.229736328125, -3.110015869140625, -2.99029541015625, -2.870574951171875, -2.7508544921875, -2.631134033203125, -2.51141357421875, -2.391693115234375, -2.27197265625, -2.152252197265625, -2.03253173828125, -1.912811279296875, -1.7930908203125, -1.673370361328125, -1.55364990234375, -1.433929443359375, -1.314208984375, -1.194488525390625, -1.07476806640625, -0.955047607421875, -0.8353271484375, -0.715606689453125, -0.59588623046875, -0.476165771484375, -0.3564453125, -0.236724853515625, -0.11700439453125, 0.002716064453125, 0.1224365234375, 0.242156982421875, 0.36187744140625, 0.481597900390625, 0.601318359375, 0.721038818359375, 0.84075927734375, 0.960479736328125, 1.0802001953125, 1.199920654296875, 1.31964111328125, 1.439361572265625, 1.55908203125, 1.678802490234375, 1.79852294921875, 1.918243408203125, 2.0379638671875, 2.157684326171875, 2.27740478515625, 2.397125244140625, 2.516845703125, 2.636566162109375, 2.75628662109375, 2.876007080078125, 2.9957275390625, 3.115447998046875, 3.23516845703125, 3.354888916015625, 3.474609375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 16.0, 14.0, 14.0, 18.0, 31.0, 29.0, 37.0, 59.0, 62.0, 59.0, 74.0, 74.0, 80.0, 63.0, 64.0, 58.0, 52.0, 50.0, 38.0, 22.0, 24.0, 14.0, 16.0, 8.0, 4.0, 9.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.142578125, -2.0877838134765625, -2.032989501953125, -1.9781951904296875, -1.92340087890625, -1.8686065673828125, -1.813812255859375, -1.7590179443359375, -1.7042236328125, -1.6494293212890625, -1.594635009765625, -1.5398406982421875, -1.48504638671875, -1.4302520751953125, -1.375457763671875, -1.3206634521484375, -1.265869140625, -1.2110748291015625, -1.156280517578125, -1.1014862060546875, -1.04669189453125, -0.9918975830078125, -0.937103271484375, -0.8823089599609375, -0.8275146484375, -0.7727203369140625, -0.717926025390625, -0.6631317138671875, -0.60833740234375, -0.5535430908203125, -0.498748779296875, -0.4439544677734375, -0.38916015625, -0.3343658447265625, -0.279571533203125, -0.2247772216796875, -0.16998291015625, -0.1151885986328125, -0.060394287109375, -0.0055999755859375, 0.0491943359375, 0.1039886474609375, 0.158782958984375, 0.2135772705078125, 0.26837158203125, 0.3231658935546875, 0.377960205078125, 0.4327545166015625, 0.487548828125, 0.5423431396484375, 0.597137451171875, 0.6519317626953125, 0.70672607421875, 0.7615203857421875, 0.816314697265625, 0.8711090087890625, 0.9259033203125, 0.9806976318359375, 1.035491943359375, 1.0902862548828125, 1.14508056640625, 1.1998748779296875, 1.254669189453125, 1.3094635009765625, 1.3642578125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 11.0, 8.0, 22.0, 14.0, 28.0, 32.0, 42.0, 57.0, 81.0, 83.0, 137.0, 193.0, 301.0, 405.0, 596.0, 984.0, 1982.0, 5631.0, 25569.0, 206955.0, 673430.0, 108046.0, 15447.0, 4075.0, 1641.0, 911.0, 526.0, 354.0, 260.0, 161.0, 125.0, 100.0, 79.0, 55.0, 53.0, 41.0, 29.0, 20.0, 13.0, 6.0, 7.0, 5.0, 7.0, 9.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.421875, -5.2371826171875, -5.052490234375, -4.8677978515625, -4.68310546875, -4.4984130859375, -4.313720703125, -4.1290283203125, -3.9443359375, -3.7596435546875, -3.574951171875, -3.3902587890625, -3.20556640625, -3.0208740234375, -2.836181640625, -2.6514892578125, -2.466796875, -2.2821044921875, -2.097412109375, -1.9127197265625, -1.72802734375, -1.5433349609375, -1.358642578125, -1.1739501953125, -0.9892578125, -0.8045654296875, -0.619873046875, -0.4351806640625, -0.25048828125, -0.0657958984375, 0.118896484375, 0.3035888671875, 0.48828125, 0.6729736328125, 0.857666015625, 1.0423583984375, 1.22705078125, 1.4117431640625, 1.596435546875, 1.7811279296875, 1.9658203125, 2.1505126953125, 2.335205078125, 2.5198974609375, 2.70458984375, 2.8892822265625, 3.073974609375, 3.2586669921875, 3.443359375, 3.6280517578125, 3.812744140625, 3.9974365234375, 4.18212890625, 4.3668212890625, 4.551513671875, 4.7362060546875, 4.9208984375, 5.1055908203125, 5.290283203125, 5.4749755859375, 5.65966796875, 5.8443603515625, 6.029052734375, 6.2137451171875, 6.3984375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 1.0, 7.0, 2.0, 7.0, 13.0, 5.0, 12.0, 21.0, 31.0, 19.0, 17.0, 19.0, 28.0, 29.0, 47.0, 46.0, 53.0, 37.0, 46.0, 42.0, 34.0, 45.0, 46.0, 35.0, 32.0, 40.0, 34.0, 32.0, 32.0, 27.0, 26.0, 19.0, 19.0, 28.0, 10.0, 11.0, 11.0, 9.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-4.921875, -4.77581787109375, -4.6297607421875, -4.48370361328125, -4.337646484375, -4.19158935546875, -4.0455322265625, -3.89947509765625, -3.75341796875, -3.60736083984375, -3.4613037109375, -3.31524658203125, -3.169189453125, -3.02313232421875, -2.8770751953125, -2.73101806640625, -2.5849609375, -2.43890380859375, -2.2928466796875, -2.14678955078125, -2.000732421875, -1.85467529296875, -1.7086181640625, -1.56256103515625, -1.41650390625, -1.27044677734375, -1.1243896484375, -0.97833251953125, -0.832275390625, -0.68621826171875, -0.5401611328125, -0.39410400390625, -0.248046875, -0.10198974609375, 0.0440673828125, 0.19012451171875, 0.336181640625, 0.48223876953125, 0.6282958984375, 0.77435302734375, 0.92041015625, 1.06646728515625, 1.2125244140625, 1.35858154296875, 1.504638671875, 1.65069580078125, 1.7967529296875, 1.94281005859375, 2.0888671875, 2.23492431640625, 2.3809814453125, 2.52703857421875, 2.673095703125, 2.81915283203125, 2.9652099609375, 3.11126708984375, 3.25732421875, 3.40338134765625, 3.5494384765625, 3.69549560546875, 3.841552734375, 3.98760986328125, 4.1336669921875, 4.27972412109375, 4.42578125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 3.0, 12.0, 10.0, 9.0, 18.0, 27.0, 39.0, 44.0, 80.0, 130.0, 167.0, 313.0, 652.0, 1405.0, 3634.0, 12229.0, 62037.0, 472520.0, 421074.0, 56377.0, 11474.0, 3457.0, 1357.0, 644.0, 335.0, 189.0, 101.0, 62.0, 50.0, 28.0, 23.0, 16.0, 18.0, 8.0, 2.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.279296875, -2.2176513671875, -2.156005859375, -2.0943603515625, -2.03271484375, -1.9710693359375, -1.909423828125, -1.8477783203125, -1.7861328125, -1.7244873046875, -1.662841796875, -1.6011962890625, -1.53955078125, -1.4779052734375, -1.416259765625, -1.3546142578125, -1.29296875, -1.2313232421875, -1.169677734375, -1.1080322265625, -1.04638671875, -0.9847412109375, -0.923095703125, -0.8614501953125, -0.7998046875, -0.7381591796875, -0.676513671875, -0.6148681640625, -0.55322265625, -0.4915771484375, -0.429931640625, -0.3682861328125, -0.306640625, -0.2449951171875, -0.183349609375, -0.1217041015625, -0.06005859375, 0.0015869140625, 0.063232421875, 0.1248779296875, 0.1865234375, 0.2481689453125, 0.309814453125, 0.3714599609375, 0.43310546875, 0.4947509765625, 0.556396484375, 0.6180419921875, 0.6796875, 0.7413330078125, 0.802978515625, 0.8646240234375, 0.92626953125, 0.9879150390625, 1.049560546875, 1.1112060546875, 1.1728515625, 1.2344970703125, 1.296142578125, 1.3577880859375, 1.41943359375, 1.4810791015625, 1.542724609375, 1.6043701171875, 1.666015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 9.0, 9.0, 12.0, 13.0, 30.0, 21.0, 32.0, 29.0, 54.0, 54.0, 89.0, 95.0, 134.0, 102.0, 77.0, 69.0, 35.0, 31.0, 32.0, 14.0, 13.0, 8.0, 9.0, 4.0, 1.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003619194030761719, -0.0003490746021270752, -0.0003362298011779785, -0.00032338500022888184, -0.00031054019927978516, -0.0002976953983306885, -0.0002848505973815918, -0.0002720057964324951, -0.00025916099548339844, -0.00024631619453430176, -0.00023347139358520508, -0.0002206265926361084, -0.00020778179168701172, -0.00019493699073791504, -0.00018209218978881836, -0.00016924738883972168, -0.000156402587890625, -0.00014355778694152832, -0.00013071298599243164, -0.00011786818504333496, -0.00010502338409423828, -9.21785831451416e-05, -7.933378219604492e-05, -6.648898124694824e-05, -5.364418029785156e-05, -4.079937934875488e-05, -2.7954578399658203e-05, -1.5109777450561523e-05, -2.2649765014648438e-06, 1.0579824447631836e-05, 2.3424625396728516e-05, 3.6269426345825195e-05, 4.9114227294921875e-05, 6.195902824401855e-05, 7.480382919311523e-05, 8.764863014221191e-05, 0.0001004934310913086, 0.00011333823204040527, 0.00012618303298950195, 0.00013902783393859863, 0.0001518726348876953, 0.000164717435836792, 0.00017756223678588867, 0.00019040703773498535, 0.00020325183868408203, 0.0002160966396331787, 0.0002289414405822754, 0.00024178624153137207, 0.00025463104248046875, 0.00026747584342956543, 0.0002803206443786621, 0.0002931654453277588, 0.00030601024627685547, 0.00031885504722595215, 0.00033169984817504883, 0.0003445446491241455, 0.0003573894500732422, 0.00037023425102233887, 0.00038307905197143555, 0.0003959238529205322, 0.0004087686538696289, 0.0004216134548187256, 0.00043445825576782227, 0.00044730305671691895, 0.0004601478576660156]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 0.0, 2.0, 5.0, 4.0, 7.0, 7.0, 12.0, 22.0, 21.0, 44.0, 62.0, 101.0, 172.0, 284.0, 562.0, 1133.0, 2713.0, 10442.0, 82826.0, 720715.0, 203158.0, 19145.0, 4042.0, 1485.0, 659.0, 404.0, 189.0, 130.0, 70.0, 41.0, 28.0, 30.0, 17.0, 8.0, 6.0, 4.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.951171875, -2.872833251953125, -2.79449462890625, -2.716156005859375, -2.6378173828125, -2.559478759765625, -2.48114013671875, -2.402801513671875, -2.324462890625, -2.246124267578125, -2.16778564453125, -2.089447021484375, -2.0111083984375, -1.932769775390625, -1.85443115234375, -1.776092529296875, -1.69775390625, -1.619415283203125, -1.54107666015625, -1.462738037109375, -1.3843994140625, -1.306060791015625, -1.22772216796875, -1.149383544921875, -1.071044921875, -0.992706298828125, -0.91436767578125, -0.836029052734375, -0.7576904296875, -0.679351806640625, -0.60101318359375, -0.522674560546875, -0.4443359375, -0.365997314453125, -0.28765869140625, -0.209320068359375, -0.1309814453125, -0.052642822265625, 0.02569580078125, 0.104034423828125, 0.182373046875, 0.260711669921875, 0.33905029296875, 0.417388916015625, 0.4957275390625, 0.574066162109375, 0.65240478515625, 0.730743408203125, 0.80908203125, 0.887420654296875, 0.96575927734375, 1.044097900390625, 1.1224365234375, 1.200775146484375, 1.27911376953125, 1.357452392578125, 1.435791015625, 1.514129638671875, 1.59246826171875, 1.670806884765625, 1.7491455078125, 1.827484130859375, 1.90582275390625, 1.984161376953125, 2.0625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 10.0, 2.0, 10.0, 4.0, 4.0, 16.0, 12.0, 16.0, 27.0, 23.0, 38.0, 37.0, 48.0, 50.0, 69.0, 63.0, 75.0, 73.0, 71.0, 58.0, 51.0, 47.0, 28.0, 31.0, 21.0, 27.0, 20.0, 12.0, 10.0, 12.0, 12.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.587890625, -1.542510986328125, -1.49713134765625, -1.451751708984375, -1.4063720703125, -1.360992431640625, -1.31561279296875, -1.270233154296875, -1.224853515625, -1.179473876953125, -1.13409423828125, -1.088714599609375, -1.0433349609375, -0.997955322265625, -0.95257568359375, -0.907196044921875, -0.86181640625, -0.816436767578125, -0.77105712890625, -0.725677490234375, -0.6802978515625, -0.634918212890625, -0.58953857421875, -0.544158935546875, -0.498779296875, -0.453399658203125, -0.40802001953125, -0.362640380859375, -0.3172607421875, -0.271881103515625, -0.22650146484375, -0.181121826171875, -0.1357421875, -0.090362548828125, -0.04498291015625, 0.000396728515625, 0.0457763671875, 0.091156005859375, 0.13653564453125, 0.181915283203125, 0.227294921875, 0.272674560546875, 0.31805419921875, 0.363433837890625, 0.4088134765625, 0.454193115234375, 0.49957275390625, 0.544952392578125, 0.59033203125, 0.635711669921875, 0.68109130859375, 0.726470947265625, 0.7718505859375, 0.817230224609375, 0.86260986328125, 0.907989501953125, 0.953369140625, 0.998748779296875, 1.04412841796875, 1.089508056640625, 1.1348876953125, 1.180267333984375, 1.22564697265625, 1.271026611328125, 1.31640625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 22.0, 35.0, 76.0, 165.0, 249.0, 227.0, 126.0, 49.0, 24.0, 16.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-106.57037353515625, -104.38743591308594, -102.20449829101562, -100.02156066894531, -97.838623046875, -95.65568542480469, -93.47274780273438, -91.28980255126953, -89.10686492919922, -86.9239273071289, -84.7409896850586, -82.55805206298828, -80.37511444091797, -78.19216918945312, -76.00923156738281, -73.8262939453125, -71.64335632324219, -69.46041870117188, -67.27748107910156, -65.09454345703125, -62.91160202026367, -60.72866439819336, -58.54572677612305, -56.362789154052734, -54.17985534667969, -51.996917724609375, -49.81398010253906, -47.63104248046875, -45.44810104370117, -43.26516342163086, -41.08222579956055, -38.899288177490234, -36.716346740722656, -34.533409118652344, -32.35047149658203, -30.167531967163086, -27.98459243774414, -25.801654815673828, -23.618717193603516, -21.435779571533203, -19.252840042114258, -17.069902420043945, -14.886962890625, -12.704025268554688, -10.521086692810059, -8.33814811706543, -6.155210494995117, -3.9722719192504883, -1.7893333435058594, 0.39360499382019043, 2.5765433311462402, 4.759481430053711, 6.94242000579834, 9.125358581542969, 11.308296203613281, 13.49123477935791, 15.674173355102539, 17.85711097717285, 20.040050506591797, 22.22298812866211, 24.405925750732422, 26.588865280151367, 28.77180290222168, 30.954742431640625, 33.13768005371094]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 5.0, 7.0, 16.0, 17.0, 30.0, 24.0, 31.0, 48.0, 40.0, 59.0, 68.0, 62.0, 49.0, 73.0, 65.0, 62.0, 76.0, 53.0, 48.0, 40.0, 26.0, 26.0, 15.0, 16.0, 13.0, 5.0, 6.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.112730026245117, -18.176864624023438, -17.24100112915039, -16.30513572692871, -15.369270324707031, -14.433404922485352, -13.497540473937988, -12.561676025390625, -11.625810623168945, -10.689945220947266, -9.754080772399902, -8.818216323852539, -7.882350921630859, -6.946485996246338, -6.010621070861816, -5.074756145477295, -4.138891220092773, -3.203026294708252, -2.2671613693237305, -1.331296443939209, -0.3954315185546875, 0.540433406829834, 1.4762983322143555, 2.412163257598877, 3.3480281829833984, 4.28389310836792, 5.219758033752441, 6.155622959136963, 7.091487884521484, 8.027353286743164, 8.963217735290527, 9.89908218383789, 10.834945678710938, 11.770811080932617, 12.70667552947998, 13.642539978027344, 14.578405380249023, 15.514270782470703, 16.45013427734375, 17.38599967956543, 18.32186508178711, 19.25773048400879, 20.19359588623047, 21.129459381103516, 22.065324783325195, 23.001190185546875, 23.937053680419922, 24.8729190826416, 25.80878448486328, 26.74464988708496, 27.68051528930664, 28.616378784179688, 29.552244186401367, 30.488109588623047, 31.423973083496094, 32.359840393066406, 33.29570388793945, 34.2315673828125, 35.16743469238281, 36.10329818725586, 37.039161682128906, 37.97502899169922, 38.910892486572266, 39.84675979614258, 40.782623291015625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 10.0, 19.0, 28.0, 54.0, 98.0, 208.0, 441.0, 952.0, 2520.0, 7383.0, 26585.0, 141290.0, 3091733.0, 835447.0, 64695.0, 15095.0, 4623.0, 1691.0, 663.0, 326.0, 168.0, 110.0, 54.0, 29.0, 21.0, 16.0, 10.0, 5.0, 9.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.447265625, -2.329620361328125, -2.21197509765625, -2.094329833984375, -1.9766845703125, -1.859039306640625, -1.74139404296875, -1.623748779296875, -1.506103515625, -1.388458251953125, -1.27081298828125, -1.153167724609375, -1.0355224609375, -0.917877197265625, -0.80023193359375, -0.682586669921875, -0.56494140625, -0.447296142578125, -0.32965087890625, -0.212005615234375, -0.0943603515625, 0.023284912109375, 0.14093017578125, 0.258575439453125, 0.376220703125, 0.493865966796875, 0.61151123046875, 0.729156494140625, 0.8468017578125, 0.964447021484375, 1.08209228515625, 1.199737548828125, 1.3173828125, 1.435028076171875, 1.55267333984375, 1.670318603515625, 1.7879638671875, 1.905609130859375, 2.02325439453125, 2.140899658203125, 2.258544921875, 2.376190185546875, 2.49383544921875, 2.611480712890625, 2.7291259765625, 2.846771240234375, 2.96441650390625, 3.082061767578125, 3.19970703125, 3.317352294921875, 3.43499755859375, 3.552642822265625, 3.6702880859375, 3.787933349609375, 3.90557861328125, 4.023223876953125, 4.140869140625, 4.258514404296875, 4.37615966796875, 4.493804931640625, 4.6114501953125, 4.729095458984375, 4.84674072265625, 4.964385986328125, 5.08203125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 13.0, 13.0, 22.0, 32.0, 32.0, 52.0, 72.0, 80.0, 78.0, 102.0, 108.0, 92.0, 74.0, 62.0, 53.0, 44.0, 23.0, 21.0, 8.0, 9.0, 4.0, 2.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3046875, -1.23602294921875, -1.1673583984375, -1.09869384765625, -1.030029296875, -0.96136474609375, -0.8927001953125, -0.82403564453125, -0.75537109375, -0.68670654296875, -0.6180419921875, -0.54937744140625, -0.480712890625, -0.41204833984375, -0.3433837890625, -0.27471923828125, -0.2060546875, -0.13739013671875, -0.0687255859375, -6.103515625e-05, 0.068603515625, 0.13726806640625, 0.2059326171875, 0.27459716796875, 0.34326171875, 0.41192626953125, 0.4805908203125, 0.54925537109375, 0.617919921875, 0.68658447265625, 0.7552490234375, 0.82391357421875, 0.892578125, 0.96124267578125, 1.0299072265625, 1.09857177734375, 1.167236328125, 1.23590087890625, 1.3045654296875, 1.37322998046875, 1.44189453125, 1.51055908203125, 1.5792236328125, 1.64788818359375, 1.716552734375, 1.78521728515625, 1.8538818359375, 1.92254638671875, 1.9912109375, 2.05987548828125, 2.1285400390625, 2.19720458984375, 2.265869140625, 2.33453369140625, 2.4031982421875, 2.47186279296875, 2.54052734375, 2.60919189453125, 2.6778564453125, 2.74652099609375, 2.815185546875, 2.88385009765625, 2.9525146484375, 3.02117919921875, 3.08984375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 9.0, 11.0, 12.0, 14.0, 25.0, 36.0, 79.0, 168.0, 405.0, 1192.0, 3649.0, 13443.0, 63534.0, 911125.0, 3059894.0, 111911.0, 20498.0, 5397.0, 1671.0, 617.0, 277.0, 140.0, 58.0, 41.0, 26.0, 10.0, 6.0, 15.0, 8.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.625, -4.48114013671875, -4.3372802734375, -4.19342041015625, -4.049560546875, -3.90570068359375, -3.7618408203125, -3.61798095703125, -3.47412109375, -3.33026123046875, -3.1864013671875, -3.04254150390625, -2.898681640625, -2.75482177734375, -2.6109619140625, -2.46710205078125, -2.3232421875, -2.17938232421875, -2.0355224609375, -1.89166259765625, -1.747802734375, -1.60394287109375, -1.4600830078125, -1.31622314453125, -1.17236328125, -1.02850341796875, -0.8846435546875, -0.74078369140625, -0.596923828125, -0.45306396484375, -0.3092041015625, -0.16534423828125, -0.021484375, 0.12237548828125, 0.2662353515625, 0.41009521484375, 0.553955078125, 0.69781494140625, 0.8416748046875, 0.98553466796875, 1.12939453125, 1.27325439453125, 1.4171142578125, 1.56097412109375, 1.704833984375, 1.84869384765625, 1.9925537109375, 2.13641357421875, 2.2802734375, 2.42413330078125, 2.5679931640625, 2.71185302734375, 2.855712890625, 2.99957275390625, 3.1434326171875, 3.28729248046875, 3.43115234375, 3.57501220703125, 3.7188720703125, 3.86273193359375, 4.006591796875, 4.15045166015625, 4.2943115234375, 4.43817138671875, 4.58203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 2.0, 4.0, 6.0, 11.0, 11.0, 17.0, 23.0, 24.0, 42.0, 41.0, 80.0, 113.0, 181.0, 333.0, 731.0, 1085.0, 589.0, 285.0, 185.0, 85.0, 56.0, 48.0, 33.0, 18.0, 14.0, 10.0, 12.0, 7.0, 6.0, 4.0, 2.0, 3.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6328125, -3.5133056640625, -3.393798828125, -3.2742919921875, -3.15478515625, -3.0352783203125, -2.915771484375, -2.7962646484375, -2.6767578125, -2.5572509765625, -2.437744140625, -2.3182373046875, -2.19873046875, -2.0792236328125, -1.959716796875, -1.8402099609375, -1.720703125, -1.6011962890625, -1.481689453125, -1.3621826171875, -1.24267578125, -1.1231689453125, -1.003662109375, -0.8841552734375, -0.7646484375, -0.6451416015625, -0.525634765625, -0.4061279296875, -0.28662109375, -0.1671142578125, -0.047607421875, 0.0718994140625, 0.19140625, 0.3109130859375, 0.430419921875, 0.5499267578125, 0.66943359375, 0.7889404296875, 0.908447265625, 1.0279541015625, 1.1474609375, 1.2669677734375, 1.386474609375, 1.5059814453125, 1.62548828125, 1.7449951171875, 1.864501953125, 1.9840087890625, 2.103515625, 2.2230224609375, 2.342529296875, 2.4620361328125, 2.58154296875, 2.7010498046875, 2.820556640625, 2.9400634765625, 3.0595703125, 3.1790771484375, 3.298583984375, 3.4180908203125, 3.53759765625, 3.6571044921875, 3.776611328125, 3.8961181640625, 4.015625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 11.0, 13.0, 25.0, 30.0, 57.0, 87.0, 169.0, 181.0, 161.0, 114.0, 69.0, 38.0, 19.0, 8.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.05354690551758, -40.87858963012695, -39.70363235473633, -38.5286750793457, -37.35371398925781, -36.17875671386719, -35.00379943847656, -33.82884216308594, -32.65388488769531, -31.478927612304688, -30.303970336914062, -29.129011154174805, -27.95405387878418, -26.779096603393555, -25.604137420654297, -24.429180145263672, -23.254222869873047, -22.079265594482422, -20.904308319091797, -19.72934913635254, -18.554391860961914, -17.37943458557129, -16.20447540283203, -15.029518127441406, -13.854560852050781, -12.679603576660156, -11.504645347595215, -10.329687118530273, -9.154729843139648, -7.979772090911865, -6.804814338684082, -5.629856109619141, -4.45489501953125, -3.279937267303467, -2.1049795150756836, -0.9300217628479004, 0.2449359893798828, 1.419893741607666, 2.594851493835449, 3.7698097229003906, 4.944766998291016, 6.119724750518799, 7.294682502746582, 8.469640731811523, 9.644598007202148, 10.819555282592773, 11.994513511657715, 13.169471740722656, 14.344429016113281, 15.519386291503906, 16.69434356689453, 17.86930274963379, 19.044260025024414, 20.21921730041504, 21.394176483154297, 22.569133758544922, 23.744091033935547, 24.919048309326172, 26.094005584716797, 27.268964767456055, 28.44392204284668, 29.618879318237305, 30.793838500976562, 31.968795776367188, 33.14375305175781]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 6.0, 6.0, 8.0, 11.0, 12.0, 20.0, 14.0, 25.0, 35.0, 44.0, 46.0, 36.0, 58.0, 30.0, 44.0, 55.0, 57.0, 59.0, 47.0, 48.0, 53.0, 39.0, 35.0, 41.0, 31.0, 21.0, 25.0, 15.0, 18.0, 17.0, 12.0, 7.0, 8.0, 5.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.869686126708984, -18.338943481445312, -17.80820083618164, -17.27745819091797, -16.746715545654297, -16.215970993041992, -15.68522834777832, -15.154485702514648, -14.623743057250977, -14.093000411987305, -13.562257766723633, -13.031514167785645, -12.500771522521973, -11.9700288772583, -11.439285278320312, -10.90854263305664, -10.377799987792969, -9.847057342529297, -9.316314697265625, -8.785571098327637, -8.254828453063965, -7.724085807800293, -7.193342685699463, -6.662599563598633, -6.131856918334961, -5.601114273071289, -5.070371150970459, -4.539628028869629, -4.008885383605957, -3.478142499923706, -2.947399616241455, -2.416656732559204, -1.885915756225586, -1.355172872543335, -0.824429988861084, -0.293687105178833, 0.23705577850341797, 0.767798662185669, 1.29854154586792, 1.829284429550171, 2.360027313232422, 2.890770196914673, 3.421513080596924, 3.952255964279175, 4.482998847961426, 5.013741493225098, 5.544484615325928, 6.075227737426758, 6.60597038269043, 7.136713027954102, 7.667456150054932, 8.198199272155762, 8.728941917419434, 9.259684562683105, 9.790428161621094, 10.321170806884766, 10.851913452148438, 11.38265609741211, 11.913398742675781, 12.44414234161377, 12.974884986877441, 13.505627632141113, 14.036371231079102, 14.567113876342773, 15.097856521606445]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 1.0, 7.0, 17.0, 17.0, 21.0, 36.0, 43.0, 75.0, 86.0, 142.0, 246.0, 345.0, 598.0, 1013.0, 1778.0, 3083.0, 5582.0, 10908.0, 21798.0, 45839.0, 101938.0, 243728.0, 330494.0, 151503.0, 66454.0, 30680.0, 14831.0, 7568.0, 3949.0, 2295.0, 1346.0, 757.0, 490.0, 300.0, 168.0, 128.0, 88.0, 67.0, 35.0, 28.0, 19.0, 23.0, 8.0, 5.0, 5.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5625, -2.483001708984375, -2.40350341796875, -2.324005126953125, -2.2445068359375, -2.165008544921875, -2.08551025390625, -2.006011962890625, -1.926513671875, -1.847015380859375, -1.76751708984375, -1.688018798828125, -1.6085205078125, -1.529022216796875, -1.44952392578125, -1.370025634765625, -1.29052734375, -1.211029052734375, -1.13153076171875, -1.052032470703125, -0.9725341796875, -0.893035888671875, -0.81353759765625, -0.734039306640625, -0.654541015625, -0.575042724609375, -0.49554443359375, -0.416046142578125, -0.3365478515625, -0.257049560546875, -0.17755126953125, -0.098052978515625, -0.0185546875, 0.060943603515625, 0.14044189453125, 0.219940185546875, 0.2994384765625, 0.378936767578125, 0.45843505859375, 0.537933349609375, 0.617431640625, 0.696929931640625, 0.77642822265625, 0.855926513671875, 0.9354248046875, 1.014923095703125, 1.09442138671875, 1.173919677734375, 1.25341796875, 1.332916259765625, 1.41241455078125, 1.491912841796875, 1.5714111328125, 1.650909423828125, 1.73040771484375, 1.809906005859375, 1.889404296875, 1.968902587890625, 2.04840087890625, 2.127899169921875, 2.2073974609375, 2.286895751953125, 2.36639404296875, 2.445892333984375, 2.525390625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 9.0, 9.0, 19.0, 23.0, 25.0, 26.0, 30.0, 34.0, 41.0, 48.0, 59.0, 59.0, 64.0, 67.0, 74.0, 41.0, 63.0, 52.0, 38.0, 43.0, 37.0, 34.0, 28.0, 18.0, 20.0, 7.0, 10.0, 7.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1240234375, -1.07696533203125, -1.0299072265625, -0.98284912109375, -0.935791015625, -0.88873291015625, -0.8416748046875, -0.79461669921875, -0.74755859375, -0.70050048828125, -0.6534423828125, -0.60638427734375, -0.559326171875, -0.51226806640625, -0.4652099609375, -0.41815185546875, -0.37109375, -0.32403564453125, -0.2769775390625, -0.22991943359375, -0.182861328125, -0.13580322265625, -0.0887451171875, -0.04168701171875, 0.00537109375, 0.05242919921875, 0.0994873046875, 0.14654541015625, 0.193603515625, 0.24066162109375, 0.2877197265625, 0.33477783203125, 0.3818359375, 0.42889404296875, 0.4759521484375, 0.52301025390625, 0.570068359375, 0.61712646484375, 0.6641845703125, 0.71124267578125, 0.75830078125, 0.80535888671875, 0.8524169921875, 0.89947509765625, 0.946533203125, 0.99359130859375, 1.0406494140625, 1.08770751953125, 1.134765625, 1.18182373046875, 1.2288818359375, 1.27593994140625, 1.322998046875, 1.37005615234375, 1.4171142578125, 1.46417236328125, 1.51123046875, 1.55828857421875, 1.6053466796875, 1.65240478515625, 1.699462890625, 1.74652099609375, 1.7935791015625, 1.84063720703125, 1.8876953125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 5.0, 2.0, 10.0, 6.0, 11.0, 9.0, 13.0, 26.0, 23.0, 38.0, 62.0, 68.0, 110.0, 172.0, 264.0, 498.0, 867.0, 1781.0, 5889.0, 40680.0, 736795.0, 237359.0, 17139.0, 3616.0, 1349.0, 629.0, 422.0, 237.0, 149.0, 91.0, 72.0, 45.0, 34.0, 23.0, 18.0, 14.0, 8.0, 7.0, 2.0, 4.0, 3.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30859375, -7.06341552734375, -6.8182373046875, -6.57305908203125, -6.327880859375, -6.08270263671875, -5.8375244140625, -5.59234619140625, -5.34716796875, -5.10198974609375, -4.8568115234375, -4.61163330078125, -4.366455078125, -4.12127685546875, -3.8760986328125, -3.63092041015625, -3.3857421875, -3.14056396484375, -2.8953857421875, -2.65020751953125, -2.405029296875, -2.15985107421875, -1.9146728515625, -1.66949462890625, -1.42431640625, -1.17913818359375, -0.9339599609375, -0.68878173828125, -0.443603515625, -0.19842529296875, 0.0467529296875, 0.29193115234375, 0.537109375, 0.78228759765625, 1.0274658203125, 1.27264404296875, 1.517822265625, 1.76300048828125, 2.0081787109375, 2.25335693359375, 2.49853515625, 2.74371337890625, 2.9888916015625, 3.23406982421875, 3.479248046875, 3.72442626953125, 3.9696044921875, 4.21478271484375, 4.4599609375, 4.70513916015625, 4.9503173828125, 5.19549560546875, 5.440673828125, 5.68585205078125, 5.9310302734375, 6.17620849609375, 6.42138671875, 6.66656494140625, 6.9117431640625, 7.15692138671875, 7.402099609375, 7.64727783203125, 7.8924560546875, 8.13763427734375, 8.3828125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 5.0, 6.0, 14.0, 18.0, 16.0, 21.0, 28.0, 33.0, 33.0, 26.0, 35.0, 30.0, 63.0, 49.0, 57.0, 42.0, 53.0, 55.0, 55.0, 49.0, 50.0, 47.0, 43.0, 29.0, 29.0, 22.0, 14.0, 15.0, 11.0, 10.0, 8.0, 6.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0], "bins": [-6.80078125, -6.626708984375, -6.45263671875, -6.278564453125, -6.1044921875, -5.930419921875, -5.75634765625, -5.582275390625, -5.408203125, -5.234130859375, -5.06005859375, -4.885986328125, -4.7119140625, -4.537841796875, -4.36376953125, -4.189697265625, -4.015625, -3.841552734375, -3.66748046875, -3.493408203125, -3.3193359375, -3.145263671875, -2.97119140625, -2.797119140625, -2.623046875, -2.448974609375, -2.27490234375, -2.100830078125, -1.9267578125, -1.752685546875, -1.57861328125, -1.404541015625, -1.23046875, -1.056396484375, -0.88232421875, -0.708251953125, -0.5341796875, -0.360107421875, -0.18603515625, -0.011962890625, 0.162109375, 0.336181640625, 0.51025390625, 0.684326171875, 0.8583984375, 1.032470703125, 1.20654296875, 1.380615234375, 1.5546875, 1.728759765625, 1.90283203125, 2.076904296875, 2.2509765625, 2.425048828125, 2.59912109375, 2.773193359375, 2.947265625, 3.121337890625, 3.29541015625, 3.469482421875, 3.6435546875, 3.817626953125, 3.99169921875, 4.165771484375, 4.33984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 9.0, 2.0, 11.0, 15.0, 14.0, 26.0, 40.0, 46.0, 67.0, 103.0, 180.0, 292.0, 613.0, 1479.0, 4719.0, 19698.0, 156823.0, 778738.0, 68643.0, 11734.0, 3034.0, 1084.0, 477.0, 253.0, 127.0, 94.0, 69.0, 37.0, 33.0, 24.0, 19.0, 8.0, 13.0, 8.0, 5.0, 3.0, 2.0, 2.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.943359375, -2.852325439453125, -2.76129150390625, -2.670257568359375, -2.5792236328125, -2.488189697265625, -2.39715576171875, -2.306121826171875, -2.215087890625, -2.124053955078125, -2.03302001953125, -1.941986083984375, -1.8509521484375, -1.759918212890625, -1.66888427734375, -1.577850341796875, -1.48681640625, -1.395782470703125, -1.30474853515625, -1.213714599609375, -1.1226806640625, -1.031646728515625, -0.94061279296875, -0.849578857421875, -0.758544921875, -0.667510986328125, -0.57647705078125, -0.485443115234375, -0.3944091796875, -0.303375244140625, -0.21234130859375, -0.121307373046875, -0.0302734375, 0.060760498046875, 0.15179443359375, 0.242828369140625, 0.3338623046875, 0.424896240234375, 0.51593017578125, 0.606964111328125, 0.697998046875, 0.789031982421875, 0.88006591796875, 0.971099853515625, 1.0621337890625, 1.153167724609375, 1.24420166015625, 1.335235595703125, 1.42626953125, 1.517303466796875, 1.60833740234375, 1.699371337890625, 1.7904052734375, 1.881439208984375, 1.97247314453125, 2.063507080078125, 2.154541015625, 2.245574951171875, 2.33660888671875, 2.427642822265625, 2.5186767578125, 2.609710693359375, 2.70074462890625, 2.791778564453125, 2.8828125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 7.0, 5.0, 6.0, 8.0, 13.0, 15.0, 6.0, 31.0, 34.0, 22.0, 28.0, 41.0, 60.0, 84.0, 139.0, 119.0, 93.0, 59.0, 48.0, 31.0, 23.0, 24.0, 17.0, 16.0, 11.0, 9.0, 12.0, 3.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003898143768310547, -0.00037755072116851807, -0.00036528706550598145, -0.0003530234098434448, -0.0003407597541809082, -0.0003284960985183716, -0.00031623244285583496, -0.00030396878719329834, -0.0002917051315307617, -0.0002794414758682251, -0.0002671778202056885, -0.00025491416454315186, -0.00024265050888061523, -0.0002303868532180786, -0.000218123197555542, -0.00020585954189300537, -0.00019359588623046875, -0.00018133223056793213, -0.0001690685749053955, -0.0001568049192428589, -0.00014454126358032227, -0.00013227760791778564, -0.00012001395225524902, -0.0001077502965927124, -9.548664093017578e-05, -8.322298526763916e-05, -7.095932960510254e-05, -5.869567394256592e-05, -4.64320182800293e-05, -3.4168362617492676e-05, -2.1904706954956055e-05, -9.641051292419434e-06, 2.6226043701171875e-06, 1.4886260032653809e-05, 2.714991569519043e-05, 3.941357135772705e-05, 5.167722702026367e-05, 6.394088268280029e-05, 7.620453834533691e-05, 8.846819400787354e-05, 0.00010073184967041016, 0.00011299550533294678, 0.0001252591609954834, 0.00013752281665802002, 0.00014978647232055664, 0.00016205012798309326, 0.00017431378364562988, 0.0001865774393081665, 0.00019884109497070312, 0.00021110475063323975, 0.00022336840629577637, 0.000235632061958313, 0.0002478957176208496, 0.00026015937328338623, 0.00027242302894592285, 0.00028468668460845947, 0.0002969503402709961, 0.0003092139959335327, 0.00032147765159606934, 0.00033374130725860596, 0.0003460049629211426, 0.0003582686185836792, 0.0003705322742462158, 0.00038279592990875244, 0.00039505958557128906]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 7.0, 4.0, 9.0, 7.0, 20.0, 30.0, 33.0, 66.0, 78.0, 116.0, 198.0, 314.0, 532.0, 999.0, 2264.0, 6353.0, 31036.0, 363829.0, 587868.0, 41781.0, 7665.0, 2570.0, 1180.0, 618.0, 336.0, 211.0, 143.0, 86.0, 62.0, 37.0, 25.0, 23.0, 10.0, 14.0, 9.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.857421875, -2.771026611328125, -2.68463134765625, -2.598236083984375, -2.5118408203125, -2.425445556640625, -2.33905029296875, -2.252655029296875, -2.166259765625, -2.079864501953125, -1.99346923828125, -1.907073974609375, -1.8206787109375, -1.734283447265625, -1.64788818359375, -1.561492919921875, -1.47509765625, -1.388702392578125, -1.30230712890625, -1.215911865234375, -1.1295166015625, -1.043121337890625, -0.95672607421875, -0.870330810546875, -0.783935546875, -0.697540283203125, -0.61114501953125, -0.524749755859375, -0.4383544921875, -0.351959228515625, -0.26556396484375, -0.179168701171875, -0.0927734375, -0.006378173828125, 0.08001708984375, 0.166412353515625, 0.2528076171875, 0.339202880859375, 0.42559814453125, 0.511993408203125, 0.598388671875, 0.684783935546875, 0.77117919921875, 0.857574462890625, 0.9439697265625, 1.030364990234375, 1.11676025390625, 1.203155517578125, 1.28955078125, 1.375946044921875, 1.46234130859375, 1.548736572265625, 1.6351318359375, 1.721527099609375, 1.80792236328125, 1.894317626953125, 1.980712890625, 2.067108154296875, 2.15350341796875, 2.239898681640625, 2.3262939453125, 2.412689208984375, 2.49908447265625, 2.585479736328125, 2.671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 8.0, 8.0, 6.0, 6.0, 12.0, 8.0, 21.0, 21.0, 16.0, 34.0, 41.0, 61.0, 67.0, 62.0, 95.0, 84.0, 62.0, 67.0, 59.0, 52.0, 45.0, 34.0, 19.0, 24.0, 11.0, 20.0, 10.0, 10.0, 4.0, 5.0, 4.0, 5.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.80078125, -1.7453460693359375, -1.689910888671875, -1.6344757080078125, -1.57904052734375, -1.5236053466796875, -1.468170166015625, -1.4127349853515625, -1.3572998046875, -1.3018646240234375, -1.246429443359375, -1.1909942626953125, -1.13555908203125, -1.0801239013671875, -1.024688720703125, -0.9692535400390625, -0.913818359375, -0.8583831787109375, -0.802947998046875, -0.7475128173828125, -0.69207763671875, -0.6366424560546875, -0.581207275390625, -0.5257720947265625, -0.4703369140625, -0.4149017333984375, -0.359466552734375, -0.3040313720703125, -0.24859619140625, -0.1931610107421875, -0.137725830078125, -0.0822906494140625, -0.02685546875, 0.0285797119140625, 0.084014892578125, 0.1394500732421875, 0.19488525390625, 0.2503204345703125, 0.305755615234375, 0.3611907958984375, 0.4166259765625, 0.4720611572265625, 0.527496337890625, 0.5829315185546875, 0.63836669921875, 0.6938018798828125, 0.749237060546875, 0.8046722412109375, 0.860107421875, 0.9155426025390625, 0.970977783203125, 1.0264129638671875, 1.08184814453125, 1.1372833251953125, 1.192718505859375, 1.2481536865234375, 1.3035888671875, 1.3590240478515625, 1.414459228515625, 1.4698944091796875, 1.52532958984375, 1.5807647705078125, 1.636199951171875, 1.6916351318359375, 1.7470703125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 4.0, 4.0, 10.0, 23.0, 47.0, 95.0, 168.0, 197.0, 173.0, 120.0, 78.0, 31.0, 19.0, 10.0, 6.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.984535217285156, -36.55978775024414, -35.135040283203125, -33.710296630859375, -32.28554916381836, -30.860801696777344, -29.436054229736328, -28.011306762695312, -26.58656120300293, -25.161813735961914, -23.73706817626953, -22.312320709228516, -20.8875732421875, -19.462827682495117, -18.0380802154541, -16.61333465576172, -15.188587188720703, -13.763840675354004, -12.339094161987305, -10.914346694946289, -9.48960018157959, -8.06485366821289, -6.640106201171875, -5.215359687805176, -3.7906131744384766, -2.3658664226531982, -0.9411196708679199, 0.4836273193359375, 1.9083738327026367, 3.333120346069336, 4.757867813110352, 6.182614326477051, 7.607357025146484, 9.032103538513184, 10.456850051879883, 11.881597518920898, 13.306344032287598, 14.731090545654297, 16.155838012695312, 17.580585479736328, 19.00533103942871, 20.430078506469727, 21.85482406616211, 23.279571533203125, 24.70431900024414, 26.129064559936523, 27.55381202697754, 28.978557586669922, 30.403305053710938, 31.828052520751953, 33.25279998779297, 34.67754364013672, 36.102291107177734, 37.52703857421875, 38.951786041259766, 40.37653350830078, 41.80127716064453, 43.22602462768555, 44.65077209472656, 46.07551574707031, 47.50026321411133, 48.925010681152344, 50.34975814819336, 51.774505615234375, 53.19925308227539]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 6.0, 12.0, 14.0, 9.0, 15.0, 9.0, 25.0, 25.0, 27.0, 29.0, 44.0, 33.0, 42.0, 65.0, 61.0, 61.0, 45.0, 54.0, 55.0, 52.0, 37.0, 38.0, 35.0, 29.0, 23.0, 18.0, 15.0, 32.0, 14.0, 12.0, 10.0, 9.0, 11.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-23.62863540649414, -22.978681564331055, -22.32872772216797, -21.67877197265625, -21.028818130493164, -20.378864288330078, -19.72890853881836, -19.078954696655273, -18.429000854492188, -17.7790470123291, -17.129093170166016, -16.479137420654297, -15.829183578491211, -15.179229736328125, -14.529274940490723, -13.87932014465332, -13.229366302490234, -12.579412460327148, -11.929457664489746, -11.279502868652344, -10.629549026489258, -9.979595184326172, -9.32964038848877, -8.679685592651367, -8.029731750488281, -7.379777431488037, -6.729823112487793, -6.079868793487549, -5.429914474487305, -4.7799601554870605, -4.130005836486816, -3.4800515174865723, -2.830097198486328, -2.180142879486084, -1.5301885604858398, -0.8802342414855957, -0.23027992248535156, 0.4196743965148926, 1.0696287155151367, 1.7195830345153809, 2.369537353515625, 3.019491672515869, 3.6694459915161133, 4.319400310516357, 4.969354629516602, 5.619308948516846, 6.26926326751709, 6.919217586517334, 7.569171905517578, 8.219125747680664, 8.869080543518066, 9.519035339355469, 10.168989181518555, 10.81894302368164, 11.468897819519043, 12.118852615356445, 12.768806457519531, 13.418760299682617, 14.06871509552002, 14.718669891357422, 15.368623733520508, 16.018577575683594, 16.668533325195312, 17.3184871673584, 17.968441009521484]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 8.0, 10.0, 11.0, 19.0, 12.0, 18.0, 26.0, 36.0, 46.0, 65.0, 84.0, 98.0, 165.0, 266.0, 689.0, 3937.0, 115805.0, 4045137.0, 24821.0, 1830.0, 468.0, 209.0, 133.0, 81.0, 68.0, 53.0, 36.0, 42.0, 24.0, 12.0, 20.0, 13.0, 14.0, 13.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.54296875, -7.24505615234375, -6.9471435546875, -6.64923095703125, -6.351318359375, -6.05340576171875, -5.7554931640625, -5.45758056640625, -5.15966796875, -4.86175537109375, -4.5638427734375, -4.26593017578125, -3.968017578125, -3.67010498046875, -3.3721923828125, -3.07427978515625, -2.7763671875, -2.47845458984375, -2.1805419921875, -1.88262939453125, -1.584716796875, -1.28680419921875, -0.9888916015625, -0.69097900390625, -0.39306640625, -0.09515380859375, 0.2027587890625, 0.50067138671875, 0.798583984375, 1.09649658203125, 1.3944091796875, 1.69232177734375, 1.990234375, 2.28814697265625, 2.5860595703125, 2.88397216796875, 3.181884765625, 3.47979736328125, 3.7777099609375, 4.07562255859375, 4.37353515625, 4.67144775390625, 4.9693603515625, 5.26727294921875, 5.565185546875, 5.86309814453125, 6.1610107421875, 6.45892333984375, 6.7568359375, 7.05474853515625, 7.3526611328125, 7.65057373046875, 7.948486328125, 8.24639892578125, 8.5443115234375, 8.84222412109375, 9.14013671875, 9.43804931640625, 9.7359619140625, 10.03387451171875, 10.331787109375, 10.62969970703125, 10.9276123046875, 11.22552490234375, 11.5234375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 10.0, 16.0, 21.0, 30.0, 32.0, 36.0, 56.0, 66.0, 70.0, 85.0, 92.0, 79.0, 88.0, 64.0, 58.0, 51.0, 46.0, 35.0, 21.0, 16.0, 14.0, 8.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.87890625, -1.817962646484375, -1.75701904296875, -1.696075439453125, -1.6351318359375, -1.574188232421875, -1.51324462890625, -1.452301025390625, -1.391357421875, -1.330413818359375, -1.26947021484375, -1.208526611328125, -1.1475830078125, -1.086639404296875, -1.02569580078125, -0.964752197265625, -0.90380859375, -0.842864990234375, -0.78192138671875, -0.720977783203125, -0.6600341796875, -0.599090576171875, -0.53814697265625, -0.477203369140625, -0.416259765625, -0.355316162109375, -0.29437255859375, -0.233428955078125, -0.1724853515625, -0.111541748046875, -0.05059814453125, 0.010345458984375, 0.0712890625, 0.132232666015625, 0.19317626953125, 0.254119873046875, 0.3150634765625, 0.376007080078125, 0.43695068359375, 0.497894287109375, 0.558837890625, 0.619781494140625, 0.68072509765625, 0.741668701171875, 0.8026123046875, 0.863555908203125, 0.92449951171875, 0.985443115234375, 1.04638671875, 1.107330322265625, 1.16827392578125, 1.229217529296875, 1.2901611328125, 1.351104736328125, 1.41204833984375, 1.472991943359375, 1.533935546875, 1.594879150390625, 1.65582275390625, 1.716766357421875, 1.7777099609375, 1.838653564453125, 1.89959716796875, 1.960540771484375, 2.021484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 7.0, 8.0, 14.0, 19.0, 30.0, 37.0, 71.0, 128.0, 231.0, 421.0, 963.0, 2496.0, 6415.0, 19470.0, 85813.0, 1499115.0, 2435201.0, 109409.0, 22786.0, 7083.0, 2580.0, 1057.0, 455.0, 219.0, 107.0, 68.0, 23.0, 15.0, 18.0, 6.0, 4.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.782379150390625, -3.65655517578125, -3.530731201171875, -3.4049072265625, -3.279083251953125, -3.15325927734375, -3.027435302734375, -2.901611328125, -2.775787353515625, -2.64996337890625, -2.524139404296875, -2.3983154296875, -2.272491455078125, -2.14666748046875, -2.020843505859375, -1.89501953125, -1.769195556640625, -1.64337158203125, -1.517547607421875, -1.3917236328125, -1.265899658203125, -1.14007568359375, -1.014251708984375, -0.888427734375, -0.762603759765625, -0.63677978515625, -0.510955810546875, -0.3851318359375, -0.259307861328125, -0.13348388671875, -0.007659912109375, 0.1181640625, 0.243988037109375, 0.36981201171875, 0.495635986328125, 0.6214599609375, 0.747283935546875, 0.87310791015625, 0.998931884765625, 1.124755859375, 1.250579833984375, 1.37640380859375, 1.502227783203125, 1.6280517578125, 1.753875732421875, 1.87969970703125, 2.005523681640625, 2.13134765625, 2.257171630859375, 2.38299560546875, 2.508819580078125, 2.6346435546875, 2.760467529296875, 2.88629150390625, 3.012115478515625, 3.137939453125, 3.263763427734375, 3.38958740234375, 3.515411376953125, 3.6412353515625, 3.767059326171875, 3.89288330078125, 4.018707275390625, 4.14453125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 1.0, 4.0, 15.0, 8.0, 7.0, 13.0, 28.0, 39.0, 37.0, 65.0, 106.0, 180.0, 346.0, 704.0, 1064.0, 631.0, 300.0, 171.0, 105.0, 69.0, 50.0, 30.0, 21.0, 16.0, 18.0, 7.0, 10.0, 5.0, 1.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.44921875, -4.339202880859375, -4.22918701171875, -4.119171142578125, -4.0091552734375, -3.899139404296875, -3.78912353515625, -3.679107666015625, -3.569091796875, -3.459075927734375, -3.34906005859375, -3.239044189453125, -3.1290283203125, -3.019012451171875, -2.90899658203125, -2.798980712890625, -2.68896484375, -2.578948974609375, -2.46893310546875, -2.358917236328125, -2.2489013671875, -2.138885498046875, -2.02886962890625, -1.918853759765625, -1.808837890625, -1.698822021484375, -1.58880615234375, -1.478790283203125, -1.3687744140625, -1.258758544921875, -1.14874267578125, -1.038726806640625, -0.9287109375, -0.818695068359375, -0.70867919921875, -0.598663330078125, -0.4886474609375, -0.378631591796875, -0.26861572265625, -0.158599853515625, -0.048583984375, 0.061431884765625, 0.17144775390625, 0.281463623046875, 0.3914794921875, 0.501495361328125, 0.61151123046875, 0.721527099609375, 0.83154296875, 0.941558837890625, 1.05157470703125, 1.161590576171875, 1.2716064453125, 1.381622314453125, 1.49163818359375, 1.601654052734375, 1.711669921875, 1.821685791015625, 1.93170166015625, 2.041717529296875, 2.1517333984375, 2.261749267578125, 2.37176513671875, 2.481781005859375, 2.591796875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 5.0, 3.0, 14.0, 33.0, 62.0, 105.0, 173.0, 203.0, 169.0, 94.0, 59.0, 31.0, 19.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.61330795288086, -36.37720489501953, -35.14110565185547, -33.90500259399414, -32.66890335083008, -31.43280029296875, -30.196699142456055, -28.96059799194336, -27.724496841430664, -26.48839569091797, -25.252294540405273, -24.016193389892578, -22.78009033203125, -21.543991088867188, -20.30788803100586, -19.071786880493164, -17.83568572998047, -16.599584579467773, -15.363483428955078, -14.127381324768066, -12.891280174255371, -11.655179023742676, -10.419076919555664, -9.182975769042969, -7.946874618530273, -6.710773468017578, -5.474671840667725, -4.238570213317871, -3.002469062805176, -1.7663679122924805, -0.530266284942627, 0.7058353424072266, 1.9419326782226562, 3.1780340671539307, 4.414135456085205, 5.650237083435059, 6.886338233947754, 8.12243938446045, 9.358541488647461, 10.594642639160156, 11.830743789672852, 13.066844940185547, 14.302946090698242, 15.539048194885254, 16.775150299072266, 18.011249542236328, 19.247352600097656, 20.48345375061035, 21.719554901123047, 22.955656051635742, 24.191757202148438, 25.427858352661133, 26.663959503173828, 27.900062561035156, 29.13616371154785, 30.372264862060547, 31.608366012573242, 32.84446716308594, 34.080570220947266, 35.31666946411133, 36.552772521972656, 37.78887176513672, 39.02497482299805, 40.261077880859375, 41.49717712402344]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 5.0, 3.0, 4.0, 3.0, 15.0, 12.0, 16.0, 14.0, 15.0, 15.0, 16.0, 18.0, 31.0, 32.0, 32.0, 30.0, 43.0, 36.0, 50.0, 50.0, 41.0, 56.0, 38.0, 46.0, 37.0, 41.0, 33.0, 46.0, 29.0, 27.0, 26.0, 21.0, 18.0, 18.0, 14.0, 14.0, 14.0, 9.0, 5.0, 5.0, 4.0, 5.0, 4.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.32772159576416, -12.853902816772461, -12.380084037780762, -11.906265258789062, -11.43244743347168, -10.95862865447998, -10.484809875488281, -10.010991096496582, -9.537172317504883, -9.063353538513184, -8.589534759521484, -8.115716934204102, -7.641898155212402, -7.168079376220703, -6.694260597229004, -6.220441818237305, -5.746623992919922, -5.272805213928223, -4.798986911773682, -4.325168132781982, -3.8513495922088623, -3.377531051635742, -2.903712272644043, -2.429893732070923, -1.9560751914978027, -1.4822566509246826, -1.008437991142273, -0.5346193313598633, -0.060800790786743164, 0.41301774978637695, 0.8868365287780762, 1.3606550693511963, 1.83447265625, 2.30829119682312, 2.7821097373962402, 3.2559285163879395, 3.7297470569610596, 4.20356559753418, 4.677384376525879, 5.151203155517578, 5.625021457672119, 6.098840236663818, 6.572658538818359, 7.046477317810059, 7.520296096801758, 7.994114398956299, 8.467933654785156, 8.941751480102539, 9.415570259094238, 9.889389038085938, 10.363207817077637, 10.837026596069336, 11.310844421386719, 11.784663200378418, 12.258481979370117, 12.732300758361816, 13.206119537353516, 13.679938316345215, 14.153757095336914, 14.627574920654297, 15.101393699645996, 15.575212478637695, 16.049030303955078, 16.522850036621094, 16.996667861938477]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 9.0, 13.0, 22.0, 21.0, 30.0, 41.0, 63.0, 92.0, 138.0, 211.0, 352.0, 583.0, 926.0, 1595.0, 2833.0, 5261.0, 9863.0, 19293.0, 39702.0, 86029.0, 201748.0, 338135.0, 186943.0, 79315.0, 36309.0, 17959.0, 9447.0, 4895.0, 2789.0, 1501.0, 930.0, 529.0, 327.0, 218.0, 139.0, 99.0, 58.0, 36.0, 24.0, 21.0, 15.0, 14.0, 7.0, 3.0, 2.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.318359375, -2.246917724609375, -2.17547607421875, -2.104034423828125, -2.0325927734375, -1.961151123046875, -1.88970947265625, -1.818267822265625, -1.746826171875, -1.675384521484375, -1.60394287109375, -1.532501220703125, -1.4610595703125, -1.389617919921875, -1.31817626953125, -1.246734619140625, -1.17529296875, -1.103851318359375, -1.03240966796875, -0.960968017578125, -0.8895263671875, -0.818084716796875, -0.74664306640625, -0.675201416015625, -0.603759765625, -0.532318115234375, -0.46087646484375, -0.389434814453125, -0.3179931640625, -0.246551513671875, -0.17510986328125, -0.103668212890625, -0.0322265625, 0.039215087890625, 0.11065673828125, 0.182098388671875, 0.2535400390625, 0.324981689453125, 0.39642333984375, 0.467864990234375, 0.539306640625, 0.610748291015625, 0.68218994140625, 0.753631591796875, 0.8250732421875, 0.896514892578125, 0.96795654296875, 1.039398193359375, 1.11083984375, 1.182281494140625, 1.25372314453125, 1.325164794921875, 1.3966064453125, 1.468048095703125, 1.53948974609375, 1.610931396484375, 1.682373046875, 1.753814697265625, 1.82525634765625, 1.896697998046875, 1.9681396484375, 2.039581298828125, 2.11102294921875, 2.182464599609375, 2.25390625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 8.0, 4.0, 14.0, 19.0, 14.0, 14.0, 36.0, 51.0, 49.0, 57.0, 48.0, 65.0, 67.0, 71.0, 78.0, 67.0, 71.0, 48.0, 51.0, 46.0, 27.0, 34.0, 14.0, 18.0, 14.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.68359375, -1.624908447265625, -1.56622314453125, -1.507537841796875, -1.4488525390625, -1.390167236328125, -1.33148193359375, -1.272796630859375, -1.214111328125, -1.155426025390625, -1.09674072265625, -1.038055419921875, -0.9793701171875, -0.920684814453125, -0.86199951171875, -0.803314208984375, -0.74462890625, -0.685943603515625, -0.62725830078125, -0.568572998046875, -0.5098876953125, -0.451202392578125, -0.39251708984375, -0.333831787109375, -0.275146484375, -0.216461181640625, -0.15777587890625, -0.099090576171875, -0.0404052734375, 0.018280029296875, 0.07696533203125, 0.135650634765625, 0.1943359375, 0.253021240234375, 0.31170654296875, 0.370391845703125, 0.4290771484375, 0.487762451171875, 0.54644775390625, 0.605133056640625, 0.663818359375, 0.722503662109375, 0.78118896484375, 0.839874267578125, 0.8985595703125, 0.957244873046875, 1.01593017578125, 1.074615478515625, 1.13330078125, 1.191986083984375, 1.25067138671875, 1.309356689453125, 1.3680419921875, 1.426727294921875, 1.48541259765625, 1.544097900390625, 1.602783203125, 1.661468505859375, 1.72015380859375, 1.778839111328125, 1.8375244140625, 1.896209716796875, 1.95489501953125, 2.013580322265625, 2.072265625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 9.0, 15.0, 16.0, 15.0, 28.0, 37.0, 39.0, 60.0, 124.0, 182.0, 277.0, 529.0, 933.0, 2159.0, 6042.0, 22861.0, 134559.0, 712187.0, 135110.0, 22882.0, 6044.0, 2170.0, 963.0, 493.0, 288.0, 159.0, 104.0, 69.0, 66.0, 33.0, 27.0, 19.0, 8.0, 15.0, 9.0, 8.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.28125, -5.10223388671875, -4.9232177734375, -4.74420166015625, -4.565185546875, -4.38616943359375, -4.2071533203125, -4.02813720703125, -3.84912109375, -3.67010498046875, -3.4910888671875, -3.31207275390625, -3.133056640625, -2.95404052734375, -2.7750244140625, -2.59600830078125, -2.4169921875, -2.23797607421875, -2.0589599609375, -1.87994384765625, -1.700927734375, -1.52191162109375, -1.3428955078125, -1.16387939453125, -0.98486328125, -0.80584716796875, -0.6268310546875, -0.44781494140625, -0.268798828125, -0.08978271484375, 0.0892333984375, 0.26824951171875, 0.447265625, 0.62628173828125, 0.8052978515625, 0.98431396484375, 1.163330078125, 1.34234619140625, 1.5213623046875, 1.70037841796875, 1.87939453125, 2.05841064453125, 2.2374267578125, 2.41644287109375, 2.595458984375, 2.77447509765625, 2.9534912109375, 3.13250732421875, 3.3115234375, 3.49053955078125, 3.6695556640625, 3.84857177734375, 4.027587890625, 4.20660400390625, 4.3856201171875, 4.56463623046875, 4.74365234375, 4.92266845703125, 5.1016845703125, 5.28070068359375, 5.459716796875, 5.63873291015625, 5.8177490234375, 5.99676513671875, 6.17578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 2.0, 11.0, 12.0, 17.0, 23.0, 31.0, 41.0, 60.0, 70.0, 88.0, 92.0, 95.0, 82.0, 85.0, 71.0, 54.0, 36.0, 46.0, 27.0, 17.0, 14.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.828125, -9.517822265625, -9.20751953125, -8.897216796875, -8.5869140625, -8.276611328125, -7.96630859375, -7.656005859375, -7.345703125, -7.035400390625, -6.72509765625, -6.414794921875, -6.1044921875, -5.794189453125, -5.48388671875, -5.173583984375, -4.86328125, -4.552978515625, -4.24267578125, -3.932373046875, -3.6220703125, -3.311767578125, -3.00146484375, -2.691162109375, -2.380859375, -2.070556640625, -1.76025390625, -1.449951171875, -1.1396484375, -0.829345703125, -0.51904296875, -0.208740234375, 0.1015625, 0.411865234375, 0.72216796875, 1.032470703125, 1.3427734375, 1.653076171875, 1.96337890625, 2.273681640625, 2.583984375, 2.894287109375, 3.20458984375, 3.514892578125, 3.8251953125, 4.135498046875, 4.44580078125, 4.756103515625, 5.06640625, 5.376708984375, 5.68701171875, 5.997314453125, 6.3076171875, 6.617919921875, 6.92822265625, 7.238525390625, 7.548828125, 7.859130859375, 8.16943359375, 8.479736328125, 8.7900390625, 9.100341796875, 9.41064453125, 9.720947265625, 10.03125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 10.0, 15.0, 19.0, 43.0, 86.0, 216.0, 697.0, 3228.0, 46293.0, 953096.0, 40905.0, 2885.0, 615.0, 213.0, 98.0, 47.0, 35.0, 17.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.828125, -4.63092041015625, -4.4337158203125, -4.23651123046875, -4.039306640625, -3.84210205078125, -3.6448974609375, -3.44769287109375, -3.25048828125, -3.05328369140625, -2.8560791015625, -2.65887451171875, -2.461669921875, -2.26446533203125, -2.0672607421875, -1.87005615234375, -1.6728515625, -1.47564697265625, -1.2784423828125, -1.08123779296875, -0.884033203125, -0.68682861328125, -0.4896240234375, -0.29241943359375, -0.09521484375, 0.10198974609375, 0.2991943359375, 0.49639892578125, 0.693603515625, 0.89080810546875, 1.0880126953125, 1.28521728515625, 1.482421875, 1.67962646484375, 1.8768310546875, 2.07403564453125, 2.271240234375, 2.46844482421875, 2.6656494140625, 2.86285400390625, 3.06005859375, 3.25726318359375, 3.4544677734375, 3.65167236328125, 3.848876953125, 4.04608154296875, 4.2432861328125, 4.44049072265625, 4.6376953125, 4.83489990234375, 5.0321044921875, 5.22930908203125, 5.426513671875, 5.62371826171875, 5.8209228515625, 6.01812744140625, 6.21533203125, 6.41253662109375, 6.6097412109375, 6.80694580078125, 7.004150390625, 7.20135498046875, 7.3985595703125, 7.59576416015625, 7.79296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 6.0, 7.0, 10.0, 8.0, 14.0, 16.0, 24.0, 35.0, 42.0, 44.0, 61.0, 80.0, 117.0, 102.0, 108.0, 58.0, 38.0, 56.0, 36.0, 26.0, 28.0, 15.0, 14.0, 7.0, 8.0, 7.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00039577484130859375, -0.00038354843854904175, -0.00037132203578948975, -0.00035909563302993774, -0.00034686923027038574, -0.00033464282751083374, -0.00032241642475128174, -0.00031019002199172974, -0.00029796361923217773, -0.00028573721647262573, -0.00027351081371307373, -0.00026128441095352173, -0.0002490580081939697, -0.00023683160543441772, -0.00022460520267486572, -0.00021237879991531372, -0.00020015239715576172, -0.00018792599439620972, -0.00017569959163665771, -0.0001634731888771057, -0.0001512467861175537, -0.0001390203833580017, -0.0001267939805984497, -0.0001145675778388977, -0.0001023411750793457, -9.01147723197937e-05, -7.78883695602417e-05, -6.56619668006897e-05, -5.3435564041137695e-05, -4.120916128158569e-05, -2.898275852203369e-05, -1.675635576248169e-05, -4.5299530029296875e-06, 7.696449756622314e-06, 1.9922852516174316e-05, 3.214925527572632e-05, 4.437565803527832e-05, 5.660206079483032e-05, 6.882846355438232e-05, 8.105486631393433e-05, 9.328126907348633e-05, 0.00010550767183303833, 0.00011773407459259033, 0.00012996047735214233, 0.00014218688011169434, 0.00015441328287124634, 0.00016663968563079834, 0.00017886608839035034, 0.00019109249114990234, 0.00020331889390945435, 0.00021554529666900635, 0.00022777169942855835, 0.00023999810218811035, 0.00025222450494766235, 0.00026445090770721436, 0.00027667731046676636, 0.00028890371322631836, 0.00030113011598587036, 0.00031335651874542236, 0.00032558292150497437, 0.00033780932426452637, 0.00035003572702407837, 0.00036226212978363037, 0.0003744885325431824, 0.0003867149353027344]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 9.0, 9.0, 18.0, 21.0, 32.0, 71.0, 152.0, 361.0, 985.0, 3197.0, 21415.0, 761729.0, 246767.0, 10452.0, 2098.0, 680.0, 291.0, 108.0, 65.0, 41.0, 16.0, 13.0, 7.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.68359375, -5.54095458984375, -5.3983154296875, -5.25567626953125, -5.113037109375, -4.97039794921875, -4.8277587890625, -4.68511962890625, -4.54248046875, -4.39984130859375, -4.2572021484375, -4.11456298828125, -3.971923828125, -3.82928466796875, -3.6866455078125, -3.54400634765625, -3.4013671875, -3.25872802734375, -3.1160888671875, -2.97344970703125, -2.830810546875, -2.68817138671875, -2.5455322265625, -2.40289306640625, -2.26025390625, -2.11761474609375, -1.9749755859375, -1.83233642578125, -1.689697265625, -1.54705810546875, -1.4044189453125, -1.26177978515625, -1.119140625, -0.97650146484375, -0.8338623046875, -0.69122314453125, -0.548583984375, -0.40594482421875, -0.2633056640625, -0.12066650390625, 0.02197265625, 0.16461181640625, 0.3072509765625, 0.44989013671875, 0.592529296875, 0.73516845703125, 0.8778076171875, 1.02044677734375, 1.1630859375, 1.30572509765625, 1.4483642578125, 1.59100341796875, 1.733642578125, 1.87628173828125, 2.0189208984375, 2.16156005859375, 2.30419921875, 2.44683837890625, 2.5894775390625, 2.73211669921875, 2.874755859375, 3.01739501953125, 3.1600341796875, 3.30267333984375, 3.4453125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 13.0, 12.0, 14.0, 31.0, 57.0, 53.0, 80.0, 112.0, 117.0, 143.0, 113.0, 65.0, 62.0, 47.0, 30.0, 18.0, 10.0, 3.0, 4.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.087890625, -1.987884521484375, -1.88787841796875, -1.787872314453125, -1.6878662109375, -1.587860107421875, -1.48785400390625, -1.387847900390625, -1.287841796875, -1.187835693359375, -1.08782958984375, -0.987823486328125, -0.8878173828125, -0.787811279296875, -0.68780517578125, -0.587799072265625, -0.48779296875, -0.387786865234375, -0.28778076171875, -0.187774658203125, -0.0877685546875, 0.012237548828125, 0.11224365234375, 0.212249755859375, 0.312255859375, 0.412261962890625, 0.51226806640625, 0.612274169921875, 0.7122802734375, 0.812286376953125, 0.91229248046875, 1.012298583984375, 1.1123046875, 1.212310791015625, 1.31231689453125, 1.412322998046875, 1.5123291015625, 1.612335205078125, 1.71234130859375, 1.812347412109375, 1.912353515625, 2.012359619140625, 2.11236572265625, 2.212371826171875, 2.3123779296875, 2.412384033203125, 2.51239013671875, 2.612396240234375, 2.71240234375, 2.812408447265625, 2.91241455078125, 3.012420654296875, 3.1124267578125, 3.212432861328125, 3.31243896484375, 3.412445068359375, 3.512451171875, 3.612457275390625, 3.71246337890625, 3.812469482421875, 3.9124755859375, 4.012481689453125, 4.11248779296875, 4.212493896484375, 4.3125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 9.0, 14.0, 29.0, 47.0, 125.0, 164.0, 190.0, 174.0, 99.0, 68.0, 37.0, 17.0, 10.0, 8.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.28925323486328, -53.89160919189453, -52.49396514892578, -51.0963249206543, -49.69868087768555, -48.3010368347168, -46.90339660644531, -45.50575256347656, -44.10810852050781, -42.71046447753906, -41.31282043457031, -39.91518020629883, -38.51753616333008, -37.11989212036133, -35.722251892089844, -34.324607849121094, -32.926963806152344, -31.529319763183594, -30.131677627563477, -28.73403549194336, -27.33639144897461, -25.93874740600586, -24.541105270385742, -23.143463134765625, -21.745819091796875, -20.348175048828125, -18.950532913208008, -17.55289077758789, -16.15524673461914, -14.757603645324707, -13.359960556030273, -11.96231746673584, -10.56467056274414, -9.167027473449707, -7.769384384155273, -6.37174129486084, -4.974098205566406, -3.5764551162719727, -2.178812026977539, -0.7811689376831055, 0.6164741516113281, 2.0141172409057617, 3.4117603302001953, 4.809403419494629, 6.2070465087890625, 7.604689598083496, 9.00233268737793, 10.399975776672363, 11.797618865966797, 13.19526195526123, 14.592905044555664, 15.990548133850098, 17.38819122314453, 18.78583526611328, 20.1834774017334, 21.581119537353516, 22.978763580322266, 24.376407623291016, 25.774049758911133, 27.17169189453125, 28.5693359375, 29.96697998046875, 31.364622116088867, 32.762264251708984, 34.159908294677734]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 18.0, 19.0, 41.0, 55.0, 54.0, 82.0, 97.0, 115.0, 133.0, 89.0, 66.0, 70.0, 61.0, 41.0, 22.0, 15.0, 10.0, 12.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.957256317138672, -22.386268615722656, -20.81528091430664, -19.244291305541992, -17.673303604125977, -16.10231590270996, -14.531327247619629, -12.960338592529297, -11.389350891113281, -9.818363189697266, -8.247374534606934, -6.67638635635376, -5.105398178100586, -3.534409999847412, -1.9634218215942383, -0.39243316650390625, 1.1785545349121094, 2.749542713165283, 4.320530891418457, 5.891519069671631, 7.462507247924805, 9.03349494934082, 10.604483604431152, 12.175472259521484, 13.7464599609375, 15.317447662353516, 16.88843536376953, 18.45942497253418, 20.030412673950195, 21.60140037536621, 23.17238998413086, 24.743377685546875, 26.314369201660156, 27.885356903076172, 29.456344604492188, 31.027334213256836, 32.59832000732422, 34.1693115234375, 35.740299224853516, 37.31128692626953, 38.88227462768555, 40.45326232910156, 42.02425003051758, 43.595237731933594, 45.166229248046875, 46.73721694946289, 48.308204650878906, 49.87919235229492, 51.45018005371094, 53.02116775512695, 54.59215545654297, 56.163143157958984, 57.734130859375, 59.30512237548828, 60.8761100769043, 62.44709777832031, 64.01808166503906, 65.58907318115234, 67.1600570678711, 68.73104858398438, 70.30203247070312, 71.8730239868164, 73.44400787353516, 75.01499938964844, 76.58599090576172]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 14.0, 36.0, 83.0, 202.0, 428.0, 905.0, 2563.0, 10956.0, 90508.0, 2741617.0, 1288727.0, 49412.0, 6634.0, 1403.0, 405.0, 148.0, 74.0, 41.0, 28.0, 19.0, 17.0, 16.0, 9.0, 14.0, 5.0, 7.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26171875, -2.12774658203125, -1.9937744140625, -1.85980224609375, -1.725830078125, -1.59185791015625, -1.4578857421875, -1.32391357421875, -1.18994140625, -1.05596923828125, -0.9219970703125, -0.78802490234375, -0.654052734375, -0.52008056640625, -0.3861083984375, -0.25213623046875, -0.1181640625, 0.01580810546875, 0.1497802734375, 0.28375244140625, 0.417724609375, 0.55169677734375, 0.6856689453125, 0.81964111328125, 0.95361328125, 1.08758544921875, 1.2215576171875, 1.35552978515625, 1.489501953125, 1.62347412109375, 1.7574462890625, 1.89141845703125, 2.025390625, 2.15936279296875, 2.2933349609375, 2.42730712890625, 2.561279296875, 2.69525146484375, 2.8292236328125, 2.96319580078125, 3.09716796875, 3.23114013671875, 3.3651123046875, 3.49908447265625, 3.633056640625, 3.76702880859375, 3.9010009765625, 4.03497314453125, 4.1689453125, 4.30291748046875, 4.4368896484375, 4.57086181640625, 4.704833984375, 4.83880615234375, 4.9727783203125, 5.10675048828125, 5.24072265625, 5.37469482421875, 5.5086669921875, 5.64263916015625, 5.776611328125, 5.91058349609375, 6.0445556640625, 6.17852783203125, 6.3125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 11.0, 24.0, 49.0, 122.0, 191.0, 228.0, 186.0, 107.0, 59.0, 30.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.578125, -1.4132080078125, -1.248291015625, -1.0833740234375, -0.91845703125, -0.7535400390625, -0.588623046875, -0.4237060546875, -0.2587890625, -0.0938720703125, 0.071044921875, 0.2359619140625, 0.40087890625, 0.5657958984375, 0.730712890625, 0.8956298828125, 1.060546875, 1.2254638671875, 1.390380859375, 1.5552978515625, 1.72021484375, 1.8851318359375, 2.050048828125, 2.2149658203125, 2.3798828125, 2.5447998046875, 2.709716796875, 2.8746337890625, 3.03955078125, 3.2044677734375, 3.369384765625, 3.5343017578125, 3.69921875, 3.8641357421875, 4.029052734375, 4.1939697265625, 4.35888671875, 4.5238037109375, 4.688720703125, 4.8536376953125, 5.0185546875, 5.1834716796875, 5.348388671875, 5.5133056640625, 5.67822265625, 5.8431396484375, 6.008056640625, 6.1729736328125, 6.337890625, 6.5028076171875, 6.667724609375, 6.8326416015625, 6.99755859375, 7.1624755859375, 7.327392578125, 7.4923095703125, 7.6572265625, 7.8221435546875, 7.987060546875, 8.1519775390625, 8.31689453125, 8.4818115234375, 8.646728515625, 8.8116455078125, 8.9765625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 4.0, 7.0, 10.0, 13.0, 8.0, 20.0, 40.0, 61.0, 76.0, 151.0, 273.0, 535.0, 1129.0, 2704.0, 7292.0, 24422.0, 117045.0, 1715388.0, 2154533.0, 132468.0, 26125.0, 7246.0, 2619.0, 1061.0, 480.0, 250.0, 150.0, 58.0, 43.0, 20.0, 13.0, 8.0, 9.0, 10.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.83203125, -3.70855712890625, -3.5850830078125, -3.46160888671875, -3.338134765625, -3.21466064453125, -3.0911865234375, -2.96771240234375, -2.84423828125, -2.72076416015625, -2.5972900390625, -2.47381591796875, -2.350341796875, -2.22686767578125, -2.1033935546875, -1.97991943359375, -1.8564453125, -1.73297119140625, -1.6094970703125, -1.48602294921875, -1.362548828125, -1.23907470703125, -1.1156005859375, -0.99212646484375, -0.86865234375, -0.74517822265625, -0.6217041015625, -0.49822998046875, -0.374755859375, -0.25128173828125, -0.1278076171875, -0.00433349609375, 0.119140625, 0.24261474609375, 0.3660888671875, 0.48956298828125, 0.613037109375, 0.73651123046875, 0.8599853515625, 0.98345947265625, 1.10693359375, 1.23040771484375, 1.3538818359375, 1.47735595703125, 1.600830078125, 1.72430419921875, 1.8477783203125, 1.97125244140625, 2.0947265625, 2.21820068359375, 2.3416748046875, 2.46514892578125, 2.588623046875, 2.71209716796875, 2.8355712890625, 2.95904541015625, 3.08251953125, 3.20599365234375, 3.3294677734375, 3.45294189453125, 3.576416015625, 3.69989013671875, 3.8233642578125, 3.94683837890625, 4.0703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 7.0, 3.0, 4.0, 11.0, 5.0, 18.0, 22.0, 28.0, 36.0, 42.0, 65.0, 86.0, 111.0, 195.0, 286.0, 529.0, 649.0, 626.0, 472.0, 316.0, 161.0, 100.0, 72.0, 51.0, 45.0, 31.0, 19.0, 20.0, 10.0, 15.0, 7.0, 7.0, 2.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.1875, -4.07080078125, -3.9541015625, -3.83740234375, -3.720703125, -3.60400390625, -3.4873046875, -3.37060546875, -3.25390625, -3.13720703125, -3.0205078125, -2.90380859375, -2.787109375, -2.67041015625, -2.5537109375, -2.43701171875, -2.3203125, -2.20361328125, -2.0869140625, -1.97021484375, -1.853515625, -1.73681640625, -1.6201171875, -1.50341796875, -1.38671875, -1.27001953125, -1.1533203125, -1.03662109375, -0.919921875, -0.80322265625, -0.6865234375, -0.56982421875, -0.453125, -0.33642578125, -0.2197265625, -0.10302734375, 0.013671875, 0.13037109375, 0.2470703125, 0.36376953125, 0.48046875, 0.59716796875, 0.7138671875, 0.83056640625, 0.947265625, 1.06396484375, 1.1806640625, 1.29736328125, 1.4140625, 1.53076171875, 1.6474609375, 1.76416015625, 1.880859375, 1.99755859375, 2.1142578125, 2.23095703125, 2.34765625, 2.46435546875, 2.5810546875, 2.69775390625, 2.814453125, 2.93115234375, 3.0478515625, 3.16455078125, 3.28125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 10.0, 29.0, 58.0, 119.0, 191.0, 218.0, 169.0, 99.0, 33.0, 26.0, 19.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.176084518432617, -28.619718551635742, -27.063350677490234, -25.50698471069336, -23.950618743896484, -22.39425277709961, -20.837886810302734, -19.281518936157227, -17.72515296936035, -16.168787002563477, -14.612420082092285, -13.056053161621094, -11.499687194824219, -9.943321228027344, -8.386954307556152, -6.830587387084961, -5.274221420288086, -3.7178549766540527, -2.1614885330200195, -0.6051220893859863, 0.9512443542480469, 2.50761079788208, 4.063977241516113, 5.620344161987305, 7.17671012878418, 8.733076095581055, 10.289443016052246, 11.845809936523438, 13.402175903320312, 14.958541870117188, 16.514907836914062, 18.07127571105957, 19.627639770507812, 21.184005737304688, 22.740371704101562, 24.29673957824707, 25.853105545043945, 27.40947151184082, 28.965839385986328, 30.522205352783203, 32.07857131958008, 33.63493728637695, 35.19130325317383, 36.7476692199707, 38.304039001464844, 39.86040496826172, 41.416770935058594, 42.97313690185547, 44.529502868652344, 46.08586883544922, 47.642234802246094, 49.19860076904297, 50.754966735839844, 52.311336517333984, 53.86770248413086, 55.424068450927734, 56.98043441772461, 58.536800384521484, 60.09316635131836, 61.649532318115234, 63.205902099609375, 64.76226806640625, 66.31863403320312, 67.875, 69.43136596679688]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 18.0, 15.0, 9.0, 31.0, 62.0, 85.0, 73.0, 81.0, 98.0, 120.0, 98.0, 82.0, 62.0, 51.0, 33.0, 32.0, 26.0, 13.0, 9.0, 5.0, 7.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.40704345703125, -58.18239212036133, -56.95773696899414, -55.73308563232422, -54.50843048095703, -53.28377914428711, -52.05912780761719, -50.83447265625, -49.60982131958008, -48.385169982910156, -47.16051483154297, -45.93586349487305, -44.711212158203125, -43.48655700683594, -42.261905670166016, -41.037254333496094, -39.812599182128906, -38.587947845458984, -37.3632926940918, -36.138641357421875, -34.91398620605469, -33.689334869384766, -32.464683532714844, -31.24003028869629, -30.015377044677734, -28.79072380065918, -27.566070556640625, -26.341419219970703, -25.11676597595215, -23.892112731933594, -22.667461395263672, -21.442808151245117, -20.218154907226562, -18.993501663208008, -17.768848419189453, -16.54419708251953, -15.319543838500977, -14.094890594482422, -12.870238304138184, -11.645586013793945, -10.42093276977539, -9.196279525756836, -7.971627235412598, -6.746974468231201, -5.522321701049805, -4.297668933868408, -3.0730161666870117, -1.8483638763427734, -0.6237106323242188, 0.6009421348571777, 1.8255949020385742, 3.0502476692199707, 4.274900436401367, 5.499553203582764, 6.72420597076416, 7.948858261108398, 9.173511505126953, 10.398164749145508, 11.622817039489746, 12.847469329833984, 14.072122573852539, 15.296775817871094, 16.521427154541016, 17.74608039855957, 18.970733642578125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 8.0, 2.0, 5.0, 9.0, 8.0, 7.0, 9.0, 17.0, 17.0, 28.0, 46.0, 63.0, 90.0, 151.0, 204.0, 309.0, 515.0, 907.0, 1552.0, 2668.0, 4886.0, 8990.0, 17493.0, 34446.0, 67147.0, 132680.0, 267296.0, 253364.0, 124332.0, 63291.0, 32009.0, 16725.0, 8484.0, 4651.0, 2456.0, 1440.0, 829.0, 521.0, 291.0, 187.0, 129.0, 89.0, 69.0, 42.0, 27.0, 22.0, 16.0, 10.0, 11.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.171875, -2.099365234375, -2.02685546875, -1.954345703125, -1.8818359375, -1.809326171875, -1.73681640625, -1.664306640625, -1.591796875, -1.519287109375, -1.44677734375, -1.374267578125, -1.3017578125, -1.229248046875, -1.15673828125, -1.084228515625, -1.01171875, -0.939208984375, -0.86669921875, -0.794189453125, -0.7216796875, -0.649169921875, -0.57666015625, -0.504150390625, -0.431640625, -0.359130859375, -0.28662109375, -0.214111328125, -0.1416015625, -0.069091796875, 0.00341796875, 0.075927734375, 0.1484375, 0.220947265625, 0.29345703125, 0.365966796875, 0.4384765625, 0.510986328125, 0.58349609375, 0.656005859375, 0.728515625, 0.801025390625, 0.87353515625, 0.946044921875, 1.0185546875, 1.091064453125, 1.16357421875, 1.236083984375, 1.30859375, 1.381103515625, 1.45361328125, 1.526123046875, 1.5986328125, 1.671142578125, 1.74365234375, 1.816162109375, 1.888671875, 1.961181640625, 2.03369140625, 2.106201171875, 2.1787109375, 2.251220703125, 2.32373046875, 2.396240234375, 2.46875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 0.0, 9.0, 10.0, 17.0, 21.0, 41.0, 29.0, 47.0, 64.0, 59.0, 89.0, 82.0, 79.0, 77.0, 71.0, 63.0, 56.0, 43.0, 41.0, 26.0, 22.0, 17.0, 14.0, 10.0, 9.0, 5.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2392578125, -1.1761322021484375, -1.113006591796875, -1.0498809814453125, -0.98675537109375, -0.9236297607421875, -0.860504150390625, -0.7973785400390625, -0.7342529296875, -0.6711273193359375, -0.608001708984375, -0.5448760986328125, -0.48175048828125, -0.4186248779296875, -0.355499267578125, -0.2923736572265625, -0.229248046875, -0.1661224365234375, -0.102996826171875, -0.0398712158203125, 0.02325439453125, 0.0863800048828125, 0.149505615234375, 0.2126312255859375, 0.2757568359375, 0.3388824462890625, 0.402008056640625, 0.4651336669921875, 0.52825927734375, 0.5913848876953125, 0.654510498046875, 0.7176361083984375, 0.78076171875, 0.8438873291015625, 0.907012939453125, 0.9701385498046875, 1.03326416015625, 1.0963897705078125, 1.159515380859375, 1.2226409912109375, 1.2857666015625, 1.3488922119140625, 1.412017822265625, 1.4751434326171875, 1.53826904296875, 1.6013946533203125, 1.664520263671875, 1.7276458740234375, 1.790771484375, 1.8538970947265625, 1.917022705078125, 1.9801483154296875, 2.04327392578125, 2.1063995361328125, 2.169525146484375, 2.2326507568359375, 2.2957763671875, 2.3589019775390625, 2.422027587890625, 2.4851531982421875, 2.54827880859375, 2.6114044189453125, 2.674530029296875, 2.7376556396484375, 2.80078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 3.0, 12.0, 17.0, 12.0, 21.0, 28.0, 64.0, 76.0, 124.0, 198.0, 324.0, 561.0, 1118.0, 2509.0, 7675.0, 57183.0, 818396.0, 140742.0, 13009.0, 3276.0, 1379.0, 733.0, 404.0, 226.0, 155.0, 102.0, 56.0, 43.0, 26.0, 12.0, 15.0, 10.0, 11.0, 5.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.453125, -9.154541015625, -8.85595703125, -8.557373046875, -8.2587890625, -7.960205078125, -7.66162109375, -7.363037109375, -7.064453125, -6.765869140625, -6.46728515625, -6.168701171875, -5.8701171875, -5.571533203125, -5.27294921875, -4.974365234375, -4.67578125, -4.377197265625, -4.07861328125, -3.780029296875, -3.4814453125, -3.182861328125, -2.88427734375, -2.585693359375, -2.287109375, -1.988525390625, -1.68994140625, -1.391357421875, -1.0927734375, -0.794189453125, -0.49560546875, -0.197021484375, 0.1015625, 0.400146484375, 0.69873046875, 0.997314453125, 1.2958984375, 1.594482421875, 1.89306640625, 2.191650390625, 2.490234375, 2.788818359375, 3.08740234375, 3.385986328125, 3.6845703125, 3.983154296875, 4.28173828125, 4.580322265625, 4.87890625, 5.177490234375, 5.47607421875, 5.774658203125, 6.0732421875, 6.371826171875, 6.67041015625, 6.968994140625, 7.267578125, 7.566162109375, 7.86474609375, 8.163330078125, 8.4619140625, 8.760498046875, 9.05908203125, 9.357666015625, 9.65625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 15.0, 5.0, 7.0, 17.0, 17.0, 20.0, 33.0, 28.0, 30.0, 35.0, 33.0, 50.0, 53.0, 57.0, 63.0, 48.0, 62.0, 45.0, 56.0, 48.0, 30.0, 29.0, 24.0, 37.0, 16.0, 33.0, 26.0, 16.0, 13.0, 7.0, 7.0, 5.0, 7.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.9921875, -5.78424072265625, -5.5762939453125, -5.36834716796875, -5.160400390625, -4.95245361328125, -4.7445068359375, -4.53656005859375, -4.32861328125, -4.12066650390625, -3.9127197265625, -3.70477294921875, -3.496826171875, -3.28887939453125, -3.0809326171875, -2.87298583984375, -2.6650390625, -2.45709228515625, -2.2491455078125, -2.04119873046875, -1.833251953125, -1.62530517578125, -1.4173583984375, -1.20941162109375, -1.00146484375, -0.79351806640625, -0.5855712890625, -0.37762451171875, -0.169677734375, 0.03826904296875, 0.2462158203125, 0.45416259765625, 0.662109375, 0.87005615234375, 1.0780029296875, 1.28594970703125, 1.493896484375, 1.70184326171875, 1.9097900390625, 2.11773681640625, 2.32568359375, 2.53363037109375, 2.7415771484375, 2.94952392578125, 3.157470703125, 3.36541748046875, 3.5733642578125, 3.78131103515625, 3.9892578125, 4.19720458984375, 4.4051513671875, 4.61309814453125, 4.821044921875, 5.02899169921875, 5.2369384765625, 5.44488525390625, 5.65283203125, 5.86077880859375, 6.0687255859375, 6.27667236328125, 6.484619140625, 6.69256591796875, 6.9005126953125, 7.10845947265625, 7.31640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 9.0, 6.0, 15.0, 25.0, 31.0, 61.0, 95.0, 169.0, 329.0, 778.0, 2400.0, 10309.0, 77471.0, 801129.0, 135358.0, 15317.0, 3211.0, 992.0, 386.0, 159.0, 94.0, 71.0, 48.0, 24.0, 12.0, 18.0, 7.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-3.6484375, -3.545989990234375, -3.44354248046875, -3.341094970703125, -3.2386474609375, -3.136199951171875, -3.03375244140625, -2.931304931640625, -2.828857421875, -2.726409912109375, -2.62396240234375, -2.521514892578125, -2.4190673828125, -2.316619873046875, -2.21417236328125, -2.111724853515625, -2.00927734375, -1.906829833984375, -1.80438232421875, -1.701934814453125, -1.5994873046875, -1.497039794921875, -1.39459228515625, -1.292144775390625, -1.189697265625, -1.087249755859375, -0.98480224609375, -0.882354736328125, -0.7799072265625, -0.677459716796875, -0.57501220703125, -0.472564697265625, -0.3701171875, -0.267669677734375, -0.16522216796875, -0.062774658203125, 0.0396728515625, 0.142120361328125, 0.24456787109375, 0.347015380859375, 0.449462890625, 0.551910400390625, 0.65435791015625, 0.756805419921875, 0.8592529296875, 0.961700439453125, 1.06414794921875, 1.166595458984375, 1.26904296875, 1.371490478515625, 1.47393798828125, 1.576385498046875, 1.6788330078125, 1.781280517578125, 1.88372802734375, 1.986175537109375, 2.088623046875, 2.191070556640625, 2.29351806640625, 2.395965576171875, 2.4984130859375, 2.600860595703125, 2.70330810546875, 2.805755615234375, 2.908203125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 0.0, 5.0, 5.0, 10.0, 9.0, 10.0, 17.0, 17.0, 34.0, 34.0, 48.0, 73.0, 116.0, 195.0, 131.0, 75.0, 61.0, 39.0, 30.0, 24.0, 10.0, 15.0, 13.0, 7.0, 4.0, 4.0, 8.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005507469177246094, -0.0005264952778816223, -0.0005022436380386353, -0.0004779919981956482, -0.00045374035835266113, -0.00042948871850967407, -0.000405237078666687, -0.00038098543882369995, -0.0003567337989807129, -0.00033248215913772583, -0.00030823051929473877, -0.0002839788794517517, -0.00025972723960876465, -0.0002354755997657776, -0.00021122395992279053, -0.00018697232007980347, -0.0001627206802368164, -0.00013846904039382935, -0.00011421740055084229, -8.996576070785522e-05, -6.571412086486816e-05, -4.1462481021881104e-05, -1.7210841178894043e-05, 7.040798664093018e-06, 3.129243850708008e-05, 5.554407835006714e-05, 7.97957181930542e-05, 0.00010404735803604126, 0.00012829899787902832, 0.00015255063772201538, 0.00017680227756500244, 0.0002010539174079895, 0.00022530555725097656, 0.0002495571970939636, 0.0002738088369369507, 0.00029806047677993774, 0.0003223121166229248, 0.00034656375646591187, 0.0003708153963088989, 0.000395067036151886, 0.00041931867599487305, 0.0004435703158378601, 0.00046782195568084717, 0.0004920735955238342, 0.0005163252353668213, 0.0005405768752098083, 0.0005648285150527954, 0.0005890801548957825, 0.0006133317947387695, 0.0006375834345817566, 0.0006618350744247437, 0.0006860867142677307, 0.0007103383541107178, 0.0007345899939537048, 0.0007588416337966919, 0.000783093273639679, 0.000807344913482666, 0.0008315965533256531, 0.0008558481931686401, 0.0008800998330116272, 0.0009043514728546143, 0.0009286031126976013, 0.0009528547525405884, 0.0009771063923835754, 0.0010013580322265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 9.0, 17.0, 10.0, 16.0, 27.0, 29.0, 63.0, 72.0, 98.0, 151.0, 277.0, 450.0, 792.0, 1504.0, 3631.0, 11446.0, 56941.0, 604594.0, 315233.0, 38350.0, 8615.0, 2926.0, 1436.0, 721.0, 414.0, 237.0, 151.0, 111.0, 75.0, 40.0, 23.0, 26.0, 25.0, 13.0, 9.0, 4.0, 7.0, 8.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.01171875, -1.944427490234375, -1.87713623046875, -1.809844970703125, -1.7425537109375, -1.675262451171875, -1.60797119140625, -1.540679931640625, -1.473388671875, -1.406097412109375, -1.33880615234375, -1.271514892578125, -1.2042236328125, -1.136932373046875, -1.06964111328125, -1.002349853515625, -0.93505859375, -0.867767333984375, -0.80047607421875, -0.733184814453125, -0.6658935546875, -0.598602294921875, -0.53131103515625, -0.464019775390625, -0.396728515625, -0.329437255859375, -0.26214599609375, -0.194854736328125, -0.1275634765625, -0.060272216796875, 0.00701904296875, 0.074310302734375, 0.1416015625, 0.208892822265625, 0.27618408203125, 0.343475341796875, 0.4107666015625, 0.478057861328125, 0.54534912109375, 0.612640380859375, 0.679931640625, 0.747222900390625, 0.81451416015625, 0.881805419921875, 0.9490966796875, 1.016387939453125, 1.08367919921875, 1.150970458984375, 1.21826171875, 1.285552978515625, 1.35284423828125, 1.420135498046875, 1.4874267578125, 1.554718017578125, 1.62200927734375, 1.689300537109375, 1.756591796875, 1.823883056640625, 1.89117431640625, 1.958465576171875, 2.0257568359375, 2.093048095703125, 2.16033935546875, 2.227630615234375, 2.294921875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 2.0, 2.0, 3.0, 6.0, 10.0, 4.0, 5.0, 11.0, 7.0, 11.0, 25.0, 22.0, 21.0, 31.0, 38.0, 38.0, 48.0, 64.0, 64.0, 87.0, 83.0, 68.0, 54.0, 47.0, 47.0, 34.0, 30.0, 33.0, 20.0, 14.0, 22.0, 12.0, 5.0, 7.0, 7.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.794921875, -1.7417755126953125, -1.688629150390625, -1.6354827880859375, -1.58233642578125, -1.5291900634765625, -1.476043701171875, -1.4228973388671875, -1.3697509765625, -1.3166046142578125, -1.263458251953125, -1.2103118896484375, -1.15716552734375, -1.1040191650390625, -1.050872802734375, -0.9977264404296875, -0.944580078125, -0.8914337158203125, -0.838287353515625, -0.7851409912109375, -0.73199462890625, -0.6788482666015625, -0.625701904296875, -0.5725555419921875, -0.5194091796875, -0.4662628173828125, -0.413116455078125, -0.3599700927734375, -0.30682373046875, -0.2536773681640625, -0.200531005859375, -0.1473846435546875, -0.09423828125, -0.0410919189453125, 0.012054443359375, 0.0652008056640625, 0.11834716796875, 0.1714935302734375, 0.224639892578125, 0.2777862548828125, 0.3309326171875, 0.3840789794921875, 0.437225341796875, 0.4903717041015625, 0.54351806640625, 0.5966644287109375, 0.649810791015625, 0.7029571533203125, 0.756103515625, 0.8092498779296875, 0.862396240234375, 0.9155426025390625, 0.96868896484375, 1.0218353271484375, 1.074981689453125, 1.1281280517578125, 1.1812744140625, 1.2344207763671875, 1.287567138671875, 1.3407135009765625, 1.39385986328125, 1.4470062255859375, 1.500152587890625, 1.5532989501953125, 1.6064453125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 10.0, 12.0, 19.0, 34.0, 54.0, 104.0, 156.0, 215.0, 116.0, 102.0, 67.0, 39.0, 23.0, 14.0, 9.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.8177604675293, -38.551513671875, -37.28527069091797, -36.01902389526367, -34.752777099609375, -33.48653030395508, -32.22028350830078, -30.95404052734375, -29.687793731689453, -28.421546936035156, -27.155302047729492, -25.889057159423828, -24.62281036376953, -23.356563568115234, -22.09031867980957, -20.824073791503906, -19.55782699584961, -18.291580200195312, -17.02533531188965, -15.759089469909668, -14.492843627929688, -13.226597785949707, -11.960351943969727, -10.694106101989746, -9.427860260009766, -8.161614418029785, -6.895368576049805, -5.629122734069824, -4.362876892089844, -3.0966310501098633, -1.8303852081298828, -0.5641393661499023, 0.7021064758300781, 1.9683523178100586, 3.234598159790039, 4.5008440017700195, 5.76708984375, 7.0333356857299805, 8.299581527709961, 9.565827369689941, 10.832073211669922, 12.098319053649902, 13.364564895629883, 14.630810737609863, 15.897056579589844, 17.16330337524414, 18.429548263549805, 19.69579315185547, 20.962039947509766, 22.228286743164062, 23.494531631469727, 24.76077651977539, 26.027023315429688, 27.293270111083984, 28.55951499938965, 29.825759887695312, 31.09200668334961, 32.358253479003906, 33.62449645996094, 34.890743255615234, 36.15699005126953, 37.42323684692383, 38.689483642578125, 39.955726623535156, 41.22197341918945]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 6.0, 3.0, 0.0, 4.0, 5.0, 8.0, 4.0, 9.0, 10.0, 12.0, 18.0, 33.0, 26.0, 27.0, 31.0, 19.0, 36.0, 45.0, 45.0, 54.0, 64.0, 79.0, 75.0, 51.0, 38.0, 32.0, 31.0, 28.0, 35.0, 20.0, 25.0, 19.0, 17.0, 21.0, 16.0, 8.0, 15.0, 10.0, 9.0, 7.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-24.91098403930664, -24.229276657104492, -23.54756736755371, -22.865859985351562, -22.184152603149414, -21.502445220947266, -20.820735931396484, -20.139028549194336, -19.457321166992188, -18.77561378479004, -18.093904495239258, -17.41219711303711, -16.73048973083496, -16.048782348632812, -15.367073059082031, -14.685365676879883, -14.003656387329102, -13.321948051452637, -12.640240669250488, -11.958532333374023, -11.276824951171875, -10.59511661529541, -9.913408279418945, -9.231700897216797, -8.549992561340332, -7.868284702301025, -7.186576843261719, -6.504868507385254, -5.823160648345947, -5.141452789306641, -4.459744453430176, -3.778036594390869, -3.0963287353515625, -2.414620876312256, -1.7329127788543701, -1.0512046813964844, -0.36949682235717773, 0.3122110366821289, 0.9939193725585938, 1.6756272315979004, 2.357335090637207, 3.0390429496765137, 3.7207510471343994, 4.402459144592285, 5.084167003631592, 5.765874862670898, 6.447583198547363, 7.12929105758667, 7.810998916625977, 8.492707252502441, 9.17441463470459, 9.856122970581055, 10.537830352783203, 11.219538688659668, 11.901247024536133, 12.582954406738281, 13.264662742614746, 13.946371078491211, 14.62807846069336, 15.309786796569824, 15.991495132446289, 16.673202514648438, 17.35491180419922, 18.036619186401367, 18.718326568603516]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 8.0, 13.0, 20.0, 27.0, 36.0, 59.0, 112.0, 187.0, 344.0, 738.0, 1382.0, 3240.0, 8173.0, 25567.0, 110115.0, 1360104.0, 2449023.0, 181455.0, 35077.0, 10896.0, 4155.0, 1739.0, 784.0, 402.0, 248.0, 142.0, 95.0, 42.0, 33.0, 18.0, 11.0, 11.0, 5.0, 7.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.6875, -2.598297119140625, -2.50909423828125, -2.419891357421875, -2.3306884765625, -2.241485595703125, -2.15228271484375, -2.063079833984375, -1.973876953125, -1.884674072265625, -1.79547119140625, -1.706268310546875, -1.6170654296875, -1.527862548828125, -1.43865966796875, -1.349456787109375, -1.26025390625, -1.171051025390625, -1.08184814453125, -0.992645263671875, -0.9034423828125, -0.814239501953125, -0.72503662109375, -0.635833740234375, -0.546630859375, -0.457427978515625, -0.36822509765625, -0.279022216796875, -0.1898193359375, -0.100616455078125, -0.01141357421875, 0.077789306640625, 0.1669921875, 0.256195068359375, 0.34539794921875, 0.434600830078125, 0.5238037109375, 0.613006591796875, 0.70220947265625, 0.791412353515625, 0.880615234375, 0.969818115234375, 1.05902099609375, 1.148223876953125, 1.2374267578125, 1.326629638671875, 1.41583251953125, 1.505035400390625, 1.59423828125, 1.683441162109375, 1.77264404296875, 1.861846923828125, 1.9510498046875, 2.040252685546875, 2.12945556640625, 2.218658447265625, 2.307861328125, 2.397064208984375, 2.48626708984375, 2.575469970703125, 2.6646728515625, 2.753875732421875, 2.84307861328125, 2.932281494140625, 3.021484375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 2.0, 2.0, 9.0, 8.0, 8.0, 11.0, 16.0, 12.0, 26.0, 17.0, 20.0, 29.0, 33.0, 35.0, 36.0, 30.0, 63.0, 55.0, 50.0, 49.0, 38.0, 54.0, 52.0, 39.0, 39.0, 43.0, 32.0, 24.0, 21.0, 22.0, 21.0, 23.0, 18.0, 18.0, 9.0, 7.0, 8.0, 9.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.3623046875, -1.32452392578125, -1.2867431640625, -1.24896240234375, -1.211181640625, -1.17340087890625, -1.1356201171875, -1.09783935546875, -1.06005859375, -1.02227783203125, -0.9844970703125, -0.94671630859375, -0.908935546875, -0.87115478515625, -0.8333740234375, -0.79559326171875, -0.7578125, -0.72003173828125, -0.6822509765625, -0.64447021484375, -0.606689453125, -0.56890869140625, -0.5311279296875, -0.49334716796875, -0.45556640625, -0.41778564453125, -0.3800048828125, -0.34222412109375, -0.304443359375, -0.26666259765625, -0.2288818359375, -0.19110107421875, -0.1533203125, -0.11553955078125, -0.0777587890625, -0.03997802734375, -0.002197265625, 0.03558349609375, 0.0733642578125, 0.11114501953125, 0.14892578125, 0.18670654296875, 0.2244873046875, 0.26226806640625, 0.300048828125, 0.33782958984375, 0.3756103515625, 0.41339111328125, 0.451171875, 0.48895263671875, 0.5267333984375, 0.56451416015625, 0.602294921875, 0.64007568359375, 0.6778564453125, 0.71563720703125, 0.75341796875, 0.79119873046875, 0.8289794921875, 0.86676025390625, 0.904541015625, 0.94232177734375, 0.9801025390625, 1.01788330078125, 1.0556640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 9.0, 5.0, 6.0, 12.0, 24.0, 30.0, 48.0, 68.0, 111.0, 159.0, 324.0, 509.0, 914.0, 1872.0, 4030.0, 10436.0, 35257.0, 198550.0, 3127794.0, 713243.0, 71070.0, 17906.0, 6097.0, 2658.0, 1320.0, 707.0, 417.0, 237.0, 167.0, 94.0, 49.0, 49.0, 27.0, 23.0, 13.0, 11.0, 9.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.36328125, -4.22998046875, -4.0966796875, -3.96337890625, -3.830078125, -3.69677734375, -3.5634765625, -3.43017578125, -3.296875, -3.16357421875, -3.0302734375, -2.89697265625, -2.763671875, -2.63037109375, -2.4970703125, -2.36376953125, -2.23046875, -2.09716796875, -1.9638671875, -1.83056640625, -1.697265625, -1.56396484375, -1.4306640625, -1.29736328125, -1.1640625, -1.03076171875, -0.8974609375, -0.76416015625, -0.630859375, -0.49755859375, -0.3642578125, -0.23095703125, -0.09765625, 0.03564453125, 0.1689453125, 0.30224609375, 0.435546875, 0.56884765625, 0.7021484375, 0.83544921875, 0.96875, 1.10205078125, 1.2353515625, 1.36865234375, 1.501953125, 1.63525390625, 1.7685546875, 1.90185546875, 2.03515625, 2.16845703125, 2.3017578125, 2.43505859375, 2.568359375, 2.70166015625, 2.8349609375, 2.96826171875, 3.1015625, 3.23486328125, 3.3681640625, 3.50146484375, 3.634765625, 3.76806640625, 3.9013671875, 4.03466796875, 4.16796875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 3.0, 11.0, 13.0, 19.0, 38.0, 36.0, 72.0, 117.0, 174.0, 368.0, 843.0, 1070.0, 583.0, 277.0, 156.0, 83.0, 68.0, 37.0, 37.0, 15.0, 6.0, 8.0, 5.0, 7.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.828125, -4.65142822265625, -4.4747314453125, -4.29803466796875, -4.121337890625, -3.94464111328125, -3.7679443359375, -3.59124755859375, -3.41455078125, -3.23785400390625, -3.0611572265625, -2.88446044921875, -2.707763671875, -2.53106689453125, -2.3543701171875, -2.17767333984375, -2.0009765625, -1.82427978515625, -1.6475830078125, -1.47088623046875, -1.294189453125, -1.11749267578125, -0.9407958984375, -0.76409912109375, -0.58740234375, -0.41070556640625, -0.2340087890625, -0.05731201171875, 0.119384765625, 0.29608154296875, 0.4727783203125, 0.64947509765625, 0.826171875, 1.00286865234375, 1.1795654296875, 1.35626220703125, 1.532958984375, 1.70965576171875, 1.8863525390625, 2.06304931640625, 2.23974609375, 2.41644287109375, 2.5931396484375, 2.76983642578125, 2.946533203125, 3.12322998046875, 3.2999267578125, 3.47662353515625, 3.6533203125, 3.83001708984375, 4.0067138671875, 4.18341064453125, 4.360107421875, 4.53680419921875, 4.7135009765625, 4.89019775390625, 5.06689453125, 5.24359130859375, 5.4202880859375, 5.59698486328125, 5.773681640625, 5.95037841796875, 6.1270751953125, 6.30377197265625, 6.48046875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 13.0, 30.0, 61.0, 149.0, 238.0, 231.0, 140.0, 80.0, 20.0, 12.0, 4.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.4642448425293, -61.53456497192383, -59.60488510131836, -57.67520523071289, -55.74552536010742, -53.81584930419922, -51.88616943359375, -49.95648956298828, -48.02680969238281, -46.097129821777344, -44.167449951171875, -42.237770080566406, -40.30809020996094, -38.37841033935547, -36.44873046875, -34.5190544128418, -32.58937072753906, -30.659690856933594, -28.730010986328125, -26.800331115722656, -24.87065315246582, -22.94097328186035, -21.011293411254883, -19.081615447998047, -17.151935577392578, -15.22225570678711, -13.292576789855957, -11.362896919250488, -9.433218002319336, -7.503538131713867, -5.573858261108398, -3.644179344177246, -1.7145004272460938, 0.21517908573150635, 2.1448585987091064, 4.074538230895996, 6.004217624664307, 7.933897018432617, 9.863576889038086, 11.793255805969238, 13.722935676574707, 15.652615547180176, 17.582294464111328, 19.511974334716797, 21.441654205322266, 23.371334075927734, 25.301013946533203, 27.23069190979004, 29.160371780395508, 31.090051651000977, 33.01972961425781, 34.94940948486328, 36.87908935546875, 38.80876922607422, 40.73844909667969, 42.668128967285156, 44.597808837890625, 46.527488708496094, 48.45716857910156, 50.38684844970703, 52.3165283203125, 54.24620819091797, 56.17588806152344, 58.10556411743164, 60.03524398803711]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 2.0, 10.0, 3.0, 7.0, 7.0, 10.0, 9.0, 12.0, 13.0, 22.0, 18.0, 16.0, 32.0, 33.0, 35.0, 34.0, 42.0, 36.0, 51.0, 48.0, 50.0, 44.0, 56.0, 46.0, 61.0, 33.0, 31.0, 31.0, 27.0, 31.0, 29.0, 20.0, 16.0, 19.0, 15.0, 11.0, 7.0, 7.0, 6.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.495256423950195, -19.847238540649414, -19.19921875, -18.55120086669922, -17.903182983398438, -17.255165100097656, -16.607147216796875, -15.959127426147461, -15.31110954284668, -14.663091659545898, -14.0150728225708, -13.367053985595703, -12.719036102294922, -12.07101821899414, -11.422999382019043, -10.774980545043945, -10.126962661743164, -9.478944778442383, -8.830925941467285, -8.182907104492188, -7.534889221191406, -6.886870861053467, -6.238852500915527, -5.590834140777588, -4.942815780639648, -4.294797420501709, -3.6467790603637695, -2.99876070022583, -2.3507423400878906, -1.7027239799499512, -1.0547056198120117, -0.40668725967407227, 0.24132919311523438, 0.8893475532531738, 1.5373659133911133, 2.1853842735290527, 2.833402633666992, 3.4814209938049316, 4.129439353942871, 4.7774577140808105, 5.42547607421875, 6.0734944343566895, 6.721512794494629, 7.369531154632568, 8.017549514770508, 8.665567398071289, 9.313586235046387, 9.961605072021484, 10.609622955322266, 11.257640838623047, 11.905659675598145, 12.553678512573242, 13.201696395874023, 13.849714279174805, 14.497733116149902, 15.145751953125, 15.793769836425781, 16.441787719726562, 17.089805603027344, 17.737825393676758, 18.38584327697754, 19.03386116027832, 19.681880950927734, 20.329898834228516, 20.977916717529297]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 10.0, 6.0, 9.0, 11.0, 23.0, 33.0, 63.0, 73.0, 95.0, 140.0, 202.0, 291.0, 449.0, 630.0, 998.0, 1438.0, 2317.0, 3583.0, 5820.0, 9613.0, 16837.0, 30694.0, 58959.0, 124264.0, 257275.0, 265974.0, 130507.0, 61716.0, 32126.0, 17558.0, 9977.0, 6131.0, 3784.0, 2382.0, 1514.0, 988.0, 689.0, 411.0, 288.0, 240.0, 125.0, 98.0, 70.0, 52.0, 22.0, 29.0, 10.0, 9.0, 8.0, 4.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.1015625, -2.033843994140625, -1.96612548828125, -1.898406982421875, -1.8306884765625, -1.762969970703125, -1.69525146484375, -1.627532958984375, -1.559814453125, -1.492095947265625, -1.42437744140625, -1.356658935546875, -1.2889404296875, -1.221221923828125, -1.15350341796875, -1.085784912109375, -1.01806640625, -0.950347900390625, -0.88262939453125, -0.814910888671875, -0.7471923828125, -0.679473876953125, -0.61175537109375, -0.544036865234375, -0.476318359375, -0.408599853515625, -0.34088134765625, -0.273162841796875, -0.2054443359375, -0.137725830078125, -0.07000732421875, -0.002288818359375, 0.0654296875, 0.133148193359375, 0.20086669921875, 0.268585205078125, 0.3363037109375, 0.404022216796875, 0.47174072265625, 0.539459228515625, 0.607177734375, 0.674896240234375, 0.74261474609375, 0.810333251953125, 0.8780517578125, 0.945770263671875, 1.01348876953125, 1.081207275390625, 1.14892578125, 1.216644287109375, 1.28436279296875, 1.352081298828125, 1.4197998046875, 1.487518310546875, 1.55523681640625, 1.622955322265625, 1.690673828125, 1.758392333984375, 1.82611083984375, 1.893829345703125, 1.9615478515625, 2.029266357421875, 2.09698486328125, 2.164703369140625, 2.232421875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 12.0, 5.0, 12.0, 19.0, 14.0, 29.0, 38.0, 30.0, 41.0, 40.0, 37.0, 45.0, 55.0, 40.0, 43.0, 44.0, 64.0, 39.0, 41.0, 47.0, 27.0, 41.0, 39.0, 34.0, 31.0, 27.0, 15.0, 17.0, 13.0, 4.0, 7.0, 13.0, 6.0, 4.0, 4.0, 6.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.32379150390625, -1.2774658203125, -1.23114013671875, -1.184814453125, -1.13848876953125, -1.0921630859375, -1.04583740234375, -0.99951171875, -0.95318603515625, -0.9068603515625, -0.86053466796875, -0.814208984375, -0.76788330078125, -0.7215576171875, -0.67523193359375, -0.62890625, -0.58258056640625, -0.5362548828125, -0.48992919921875, -0.443603515625, -0.39727783203125, -0.3509521484375, -0.30462646484375, -0.25830078125, -0.21197509765625, -0.1656494140625, -0.11932373046875, -0.072998046875, -0.02667236328125, 0.0196533203125, 0.06597900390625, 0.1123046875, 0.15863037109375, 0.2049560546875, 0.25128173828125, 0.297607421875, 0.34393310546875, 0.3902587890625, 0.43658447265625, 0.48291015625, 0.52923583984375, 0.5755615234375, 0.62188720703125, 0.668212890625, 0.71453857421875, 0.7608642578125, 0.80718994140625, 0.853515625, 0.89984130859375, 0.9461669921875, 0.99249267578125, 1.038818359375, 1.08514404296875, 1.1314697265625, 1.17779541015625, 1.22412109375, 1.27044677734375, 1.3167724609375, 1.36309814453125, 1.409423828125, 1.45574951171875, 1.5020751953125, 1.54840087890625, 1.5947265625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 9.0, 9.0, 22.0, 33.0, 45.0, 72.0, 112.0, 173.0, 360.0, 671.0, 1563.0, 5792.0, 62851.0, 914679.0, 53893.0, 5252.0, 1580.0, 620.0, 317.0, 193.0, 104.0, 73.0, 40.0, 35.0, 17.0, 13.0, 7.0, 5.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5234375, -10.1259765625, -9.728515625, -9.3310546875, -8.93359375, -8.5361328125, -8.138671875, -7.7412109375, -7.34375, -6.9462890625, -6.548828125, -6.1513671875, -5.75390625, -5.3564453125, -4.958984375, -4.5615234375, -4.1640625, -3.7666015625, -3.369140625, -2.9716796875, -2.57421875, -2.1767578125, -1.779296875, -1.3818359375, -0.984375, -0.5869140625, -0.189453125, 0.2080078125, 0.60546875, 1.0029296875, 1.400390625, 1.7978515625, 2.1953125, 2.5927734375, 2.990234375, 3.3876953125, 3.78515625, 4.1826171875, 4.580078125, 4.9775390625, 5.375, 5.7724609375, 6.169921875, 6.5673828125, 6.96484375, 7.3623046875, 7.759765625, 8.1572265625, 8.5546875, 8.9521484375, 9.349609375, 9.7470703125, 10.14453125, 10.5419921875, 10.939453125, 11.3369140625, 11.734375, 12.1318359375, 12.529296875, 12.9267578125, 13.32421875, 13.7216796875, 14.119140625, 14.5166015625, 14.9140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 6.0, 5.0, 7.0, 19.0, 11.0, 24.0, 24.0, 30.0, 41.0, 52.0, 37.0, 41.0, 59.0, 59.0, 76.0, 50.0, 69.0, 62.0, 53.0, 47.0, 40.0, 43.0, 30.0, 23.0, 19.0, 12.0, 13.0, 11.0, 6.0, 6.0, 2.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5390625, -7.288330078125, -7.03759765625, -6.786865234375, -6.5361328125, -6.285400390625, -6.03466796875, -5.783935546875, -5.533203125, -5.282470703125, -5.03173828125, -4.781005859375, -4.5302734375, -4.279541015625, -4.02880859375, -3.778076171875, -3.52734375, -3.276611328125, -3.02587890625, -2.775146484375, -2.5244140625, -2.273681640625, -2.02294921875, -1.772216796875, -1.521484375, -1.270751953125, -1.02001953125, -0.769287109375, -0.5185546875, -0.267822265625, -0.01708984375, 0.233642578125, 0.484375, 0.735107421875, 0.98583984375, 1.236572265625, 1.4873046875, 1.738037109375, 1.98876953125, 2.239501953125, 2.490234375, 2.740966796875, 2.99169921875, 3.242431640625, 3.4931640625, 3.743896484375, 3.99462890625, 4.245361328125, 4.49609375, 4.746826171875, 4.99755859375, 5.248291015625, 5.4990234375, 5.749755859375, 6.00048828125, 6.251220703125, 6.501953125, 6.752685546875, 7.00341796875, 7.254150390625, 7.5048828125, 7.755615234375, 8.00634765625, 8.257080078125, 8.5078125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 5.0, 9.0, 18.0, 26.0, 26.0, 48.0, 63.0, 116.0, 196.0, 345.0, 720.0, 2066.0, 7382.0, 38355.0, 443391.0, 506033.0, 38573.0, 7610.0, 2034.0, 707.0, 324.0, 183.0, 101.0, 61.0, 55.0, 27.0, 23.0, 19.0, 12.0, 7.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.0357666015625, -1.954345703125, -1.8729248046875, -1.79150390625, -1.7100830078125, -1.628662109375, -1.5472412109375, -1.4658203125, -1.3843994140625, -1.302978515625, -1.2215576171875, -1.14013671875, -1.0587158203125, -0.977294921875, -0.8958740234375, -0.814453125, -0.7330322265625, -0.651611328125, -0.5701904296875, -0.48876953125, -0.4073486328125, -0.325927734375, -0.2445068359375, -0.1630859375, -0.0816650390625, -0.000244140625, 0.0811767578125, 0.16259765625, 0.2440185546875, 0.325439453125, 0.4068603515625, 0.48828125, 0.5697021484375, 0.651123046875, 0.7325439453125, 0.81396484375, 0.8953857421875, 0.976806640625, 1.0582275390625, 1.1396484375, 1.2210693359375, 1.302490234375, 1.3839111328125, 1.46533203125, 1.5467529296875, 1.628173828125, 1.7095947265625, 1.791015625, 1.8724365234375, 1.953857421875, 2.0352783203125, 2.11669921875, 2.1981201171875, 2.279541015625, 2.3609619140625, 2.4423828125, 2.5238037109375, 2.605224609375, 2.6866455078125, 2.76806640625, 2.8494873046875, 2.930908203125, 3.0123291015625, 3.09375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 9.0, 11.0, 5.0, 16.0, 16.0, 21.0, 26.0, 31.0, 51.0, 76.0, 95.0, 133.0, 135.0, 96.0, 68.0, 36.0, 33.0, 31.0, 26.0, 22.0, 9.0, 10.0, 6.0, 1.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005865097045898438, -0.0005697011947631836, -0.0005528926849365234, -0.0005360841751098633, -0.0005192756652832031, -0.000502467155456543, -0.0004856586456298828, -0.00046885013580322266, -0.0004520416259765625, -0.00043523311614990234, -0.0004184246063232422, -0.00040161609649658203, -0.0003848075866699219, -0.0003679990768432617, -0.00035119056701660156, -0.0003343820571899414, -0.00031757354736328125, -0.0003007650375366211, -0.00028395652770996094, -0.0002671480178833008, -0.0002503395080566406, -0.00023353099822998047, -0.0002167224884033203, -0.00019991397857666016, -0.00018310546875, -0.00016629695892333984, -0.0001494884490966797, -0.00013267993927001953, -0.00011587142944335938, -9.906291961669922e-05, -8.225440979003906e-05, -6.54458999633789e-05, -4.863739013671875e-05, -3.1828880310058594e-05, -1.5020370483398438e-05, 1.7881393432617188e-06, 1.8596649169921875e-05, 3.540515899658203e-05, 5.221366882324219e-05, 6.902217864990234e-05, 8.58306884765625e-05, 0.00010263919830322266, 0.00011944770812988281, 0.00013625621795654297, 0.00015306472778320312, 0.00016987323760986328, 0.00018668174743652344, 0.0002034902572631836, 0.00022029876708984375, 0.0002371072769165039, 0.00025391578674316406, 0.0002707242965698242, 0.0002875328063964844, 0.00030434131622314453, 0.0003211498260498047, 0.00033795833587646484, 0.000354766845703125, 0.00037157535552978516, 0.0003883838653564453, 0.00040519237518310547, 0.0004220008850097656, 0.0004388093948364258, 0.00045561790466308594, 0.0004724264144897461, 0.0004892349243164062]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 3.0, 5.0, 4.0, 14.0, 21.0, 41.0, 70.0, 113.0, 219.0, 462.0, 862.0, 2000.0, 5930.0, 30061.0, 579680.0, 393079.0, 26675.0, 5615.0, 1972.0, 814.0, 394.0, 226.0, 112.0, 66.0, 43.0, 14.0, 15.0, 14.0, 8.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41015625, -2.33477783203125, -2.2593994140625, -2.18402099609375, -2.108642578125, -2.03326416015625, -1.9578857421875, -1.88250732421875, -1.80712890625, -1.73175048828125, -1.6563720703125, -1.58099365234375, -1.505615234375, -1.43023681640625, -1.3548583984375, -1.27947998046875, -1.2041015625, -1.12872314453125, -1.0533447265625, -0.97796630859375, -0.902587890625, -0.82720947265625, -0.7518310546875, -0.67645263671875, -0.60107421875, -0.52569580078125, -0.4503173828125, -0.37493896484375, -0.299560546875, -0.22418212890625, -0.1488037109375, -0.07342529296875, 0.001953125, 0.07733154296875, 0.1527099609375, 0.22808837890625, 0.303466796875, 0.37884521484375, 0.4542236328125, 0.52960205078125, 0.60498046875, 0.68035888671875, 0.7557373046875, 0.83111572265625, 0.906494140625, 0.98187255859375, 1.0572509765625, 1.13262939453125, 1.2080078125, 1.28338623046875, 1.3587646484375, 1.43414306640625, 1.509521484375, 1.58489990234375, 1.6602783203125, 1.73565673828125, 1.81103515625, 1.88641357421875, 1.9617919921875, 2.03717041015625, 2.112548828125, 2.18792724609375, 2.2633056640625, 2.33868408203125, 2.4140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 3.0, 9.0, 6.0, 6.0, 6.0, 14.0, 13.0, 21.0, 17.0, 17.0, 31.0, 40.0, 54.0, 64.0, 74.0, 83.0, 96.0, 73.0, 61.0, 64.0, 47.0, 55.0, 30.0, 21.0, 17.0, 22.0, 17.0, 15.0, 8.0, 9.0, 6.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.8798828125, -1.8346405029296875, -1.789398193359375, -1.7441558837890625, -1.69891357421875, -1.6536712646484375, -1.608428955078125, -1.5631866455078125, -1.5179443359375, -1.4727020263671875, -1.427459716796875, -1.3822174072265625, -1.33697509765625, -1.2917327880859375, -1.246490478515625, -1.2012481689453125, -1.156005859375, -1.1107635498046875, -1.065521240234375, -1.0202789306640625, -0.97503662109375, -0.9297943115234375, -0.884552001953125, -0.8393096923828125, -0.7940673828125, -0.7488250732421875, -0.703582763671875, -0.6583404541015625, -0.61309814453125, -0.5678558349609375, -0.522613525390625, -0.4773712158203125, -0.43212890625, -0.3868865966796875, -0.341644287109375, -0.2964019775390625, -0.25115966796875, -0.2059173583984375, -0.160675048828125, -0.1154327392578125, -0.0701904296875, -0.0249481201171875, 0.020294189453125, 0.0655364990234375, 0.11077880859375, 0.1560211181640625, 0.201263427734375, 0.2465057373046875, 0.291748046875, 0.3369903564453125, 0.382232666015625, 0.4274749755859375, 0.47271728515625, 0.5179595947265625, 0.563201904296875, 0.6084442138671875, 0.6536865234375, 0.6989288330078125, 0.744171142578125, 0.7894134521484375, 0.83465576171875, 0.8798980712890625, 0.925140380859375, 0.9703826904296875, 1.015625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 6.0, 13.0, 20.0, 33.0, 71.0, 84.0, 141.0, 205.0, 156.0, 103.0, 64.0, 32.0, 23.0, 18.0, 6.0, 7.0, 2.0, 3.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.67342758178711, -42.45110321044922, -41.22877502441406, -40.006446838378906, -38.784122467041016, -37.561798095703125, -36.33946990966797, -35.11714172363281, -33.89481735229492, -32.67249298095703, -31.450164794921875, -30.22783851623535, -29.005512237548828, -27.783185958862305, -26.56085968017578, -25.338533401489258, -24.116207122802734, -22.89388084411621, -21.671554565429688, -20.449228286743164, -19.22690200805664, -18.004575729370117, -16.782249450683594, -15.55992317199707, -14.337596893310547, -13.115270614624023, -11.8929443359375, -10.670618057250977, -9.448291778564453, -8.22596549987793, -7.003639221191406, -5.781312942504883, -4.558990478515625, -3.3366641998291016, -2.114337921142578, -0.8920116424560547, 0.33031463623046875, 1.5526409149169922, 2.7749671936035156, 3.997293472290039, 5.2196197509765625, 6.441946029663086, 7.664272308349609, 8.886598587036133, 10.108924865722656, 11.33125114440918, 12.553577423095703, 13.775903701782227, 14.99822998046875, 16.220556259155273, 17.442882537841797, 18.66520881652832, 19.887535095214844, 21.109861373901367, 22.33218765258789, 23.554513931274414, 24.776840209960938, 25.99916648864746, 27.221492767333984, 28.443819046020508, 29.66614532470703, 30.888471603393555, 32.11079788208008, 33.33312225341797, 34.555450439453125]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 5.0, 9.0, 7.0, 9.0, 9.0, 10.0, 14.0, 6.0, 24.0, 22.0, 19.0, 19.0, 15.0, 16.0, 37.0, 20.0, 36.0, 38.0, 41.0, 52.0, 60.0, 75.0, 70.0, 51.0, 40.0, 36.0, 32.0, 32.0, 26.0, 16.0, 19.0, 27.0, 20.0, 12.0, 11.0, 11.0, 9.0, 9.0, 8.0, 6.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-26.3154239654541, -25.593761444091797, -24.872098922729492, -24.150436401367188, -23.42877197265625, -22.707109451293945, -21.98544692993164, -21.263784408569336, -20.54212188720703, -19.820459365844727, -19.098796844482422, -18.377134323120117, -17.655471801757812, -16.933807373046875, -16.21214485168457, -15.490482330322266, -14.768819808959961, -14.047157287597656, -13.325494766235352, -12.60383129119873, -11.882168769836426, -11.160506248474121, -10.4388427734375, -9.717180252075195, -8.99551773071289, -8.273855209350586, -7.552192211151123, -6.83052921295166, -6.1088666915893555, -5.387204170227051, -4.665541172027588, -3.943878173828125, -3.222217559814453, -2.5005548000335693, -1.7788920402526855, -1.0572292804718018, -0.33556652069091797, 0.3860962390899658, 1.1077589988708496, 1.8294219970703125, 2.551084518432617, 3.272747278213501, 3.9944100379943848, 4.716073036193848, 5.437735557556152, 6.159398078918457, 6.88106107711792, 7.602724075317383, 8.324386596679688, 9.046049118041992, 9.767711639404297, 10.489375114440918, 11.211037635803223, 11.932700157165527, 12.654363632202148, 13.376026153564453, 14.097688674926758, 14.819351196289062, 15.541013717651367, 16.262676239013672, 16.98434066772461, 17.706003189086914, 18.42766571044922, 19.149328231811523, 19.870990753173828]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 6.0, 15.0, 19.0, 19.0, 38.0, 36.0, 60.0, 96.0, 168.0, 232.0, 444.0, 768.0, 1721.0, 4162.0, 13266.0, 56788.0, 736408.0, 3088648.0, 246390.0, 31173.0, 8168.0, 2877.0, 1221.0, 619.0, 324.0, 197.0, 122.0, 80.0, 63.0, 57.0, 15.0, 18.0, 15.0, 10.0, 8.0, 3.0, 10.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.923828125, -2.830474853515625, -2.73712158203125, -2.643768310546875, -2.5504150390625, -2.457061767578125, -2.36370849609375, -2.270355224609375, -2.177001953125, -2.083648681640625, -1.99029541015625, -1.896942138671875, -1.8035888671875, -1.710235595703125, -1.61688232421875, -1.523529052734375, -1.43017578125, -1.336822509765625, -1.24346923828125, -1.150115966796875, -1.0567626953125, -0.963409423828125, -0.87005615234375, -0.776702880859375, -0.683349609375, -0.589996337890625, -0.49664306640625, -0.403289794921875, -0.3099365234375, -0.216583251953125, -0.12322998046875, -0.029876708984375, 0.0634765625, 0.156829833984375, 0.25018310546875, 0.343536376953125, 0.4368896484375, 0.530242919921875, 0.62359619140625, 0.716949462890625, 0.810302734375, 0.903656005859375, 0.99700927734375, 1.090362548828125, 1.1837158203125, 1.277069091796875, 1.37042236328125, 1.463775634765625, 1.55712890625, 1.650482177734375, 1.74383544921875, 1.837188720703125, 1.9305419921875, 2.023895263671875, 2.11724853515625, 2.210601806640625, 2.303955078125, 2.397308349609375, 2.49066162109375, 2.584014892578125, 2.6773681640625, 2.770721435546875, 2.86407470703125, 2.957427978515625, 3.05078125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 12.0, 7.0, 21.0, 11.0, 27.0, 31.0, 30.0, 26.0, 43.0, 57.0, 44.0, 55.0, 74.0, 63.0, 53.0, 65.0, 59.0, 44.0, 60.0, 38.0, 37.0, 37.0, 29.0, 19.0, 11.0, 9.0, 9.0, 10.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44921875, -1.395233154296875, -1.34124755859375, -1.287261962890625, -1.2332763671875, -1.179290771484375, -1.12530517578125, -1.071319580078125, -1.017333984375, -0.963348388671875, -0.90936279296875, -0.855377197265625, -0.8013916015625, -0.747406005859375, -0.69342041015625, -0.639434814453125, -0.58544921875, -0.531463623046875, -0.47747802734375, -0.423492431640625, -0.3695068359375, -0.315521240234375, -0.26153564453125, -0.207550048828125, -0.153564453125, -0.099578857421875, -0.04559326171875, 0.008392333984375, 0.0623779296875, 0.116363525390625, 0.17034912109375, 0.224334716796875, 0.2783203125, 0.332305908203125, 0.38629150390625, 0.440277099609375, 0.4942626953125, 0.548248291015625, 0.60223388671875, 0.656219482421875, 0.710205078125, 0.764190673828125, 0.81817626953125, 0.872161865234375, 0.9261474609375, 0.980133056640625, 1.03411865234375, 1.088104248046875, 1.14208984375, 1.196075439453125, 1.25006103515625, 1.304046630859375, 1.3580322265625, 1.412017822265625, 1.46600341796875, 1.519989013671875, 1.573974609375, 1.627960205078125, 1.68194580078125, 1.735931396484375, 1.7899169921875, 1.843902587890625, 1.89788818359375, 1.951873779296875, 2.005859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 7.0, 4.0, 18.0, 17.0, 27.0, 38.0, 66.0, 98.0, 167.0, 326.0, 720.0, 1713.0, 4832.0, 17188.0, 102098.0, 3228524.0, 777423.0, 45540.0, 10066.0, 3120.0, 1181.0, 544.0, 240.0, 135.0, 61.0, 41.0, 33.0, 16.0, 11.0, 9.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.3671875, -4.21014404296875, -4.0531005859375, -3.89605712890625, -3.739013671875, -3.58197021484375, -3.4249267578125, -3.26788330078125, -3.11083984375, -2.95379638671875, -2.7967529296875, -2.63970947265625, -2.482666015625, -2.32562255859375, -2.1685791015625, -2.01153564453125, -1.8544921875, -1.69744873046875, -1.5404052734375, -1.38336181640625, -1.226318359375, -1.06927490234375, -0.9122314453125, -0.75518798828125, -0.59814453125, -0.44110107421875, -0.2840576171875, -0.12701416015625, 0.030029296875, 0.18707275390625, 0.3441162109375, 0.50115966796875, 0.658203125, 0.81524658203125, 0.9722900390625, 1.12933349609375, 1.286376953125, 1.44342041015625, 1.6004638671875, 1.75750732421875, 1.91455078125, 2.07159423828125, 2.2286376953125, 2.38568115234375, 2.542724609375, 2.69976806640625, 2.8568115234375, 3.01385498046875, 3.1708984375, 3.32794189453125, 3.4849853515625, 3.64202880859375, 3.799072265625, 3.95611572265625, 4.1131591796875, 4.27020263671875, 4.42724609375, 4.58428955078125, 4.7413330078125, 4.89837646484375, 5.055419921875, 5.21246337890625, 5.3695068359375, 5.52655029296875, 5.68359375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 5.0, 9.0, 20.0, 17.0, 30.0, 30.0, 38.0, 78.0, 134.0, 279.0, 475.0, 915.0, 889.0, 525.0, 234.0, 146.0, 79.0, 55.0, 22.0, 21.0, 19.0, 9.0, 5.0, 9.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.140625, -4.99407958984375, -4.8475341796875, -4.70098876953125, -4.554443359375, -4.40789794921875, -4.2613525390625, -4.11480712890625, -3.96826171875, -3.82171630859375, -3.6751708984375, -3.52862548828125, -3.382080078125, -3.23553466796875, -3.0889892578125, -2.94244384765625, -2.7958984375, -2.64935302734375, -2.5028076171875, -2.35626220703125, -2.209716796875, -2.06317138671875, -1.9166259765625, -1.77008056640625, -1.62353515625, -1.47698974609375, -1.3304443359375, -1.18389892578125, -1.037353515625, -0.89080810546875, -0.7442626953125, -0.59771728515625, -0.451171875, -0.30462646484375, -0.1580810546875, -0.01153564453125, 0.135009765625, 0.28155517578125, 0.4281005859375, 0.57464599609375, 0.72119140625, 0.86773681640625, 1.0142822265625, 1.16082763671875, 1.307373046875, 1.45391845703125, 1.6004638671875, 1.74700927734375, 1.8935546875, 2.04010009765625, 2.1866455078125, 2.33319091796875, 2.479736328125, 2.62628173828125, 2.7728271484375, 2.91937255859375, 3.06591796875, 3.21246337890625, 3.3590087890625, 3.50555419921875, 3.652099609375, 3.79864501953125, 3.9451904296875, 4.09173583984375, 4.23828125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 10.0, 18.0, 41.0, 121.0, 281.0, 296.0, 157.0, 45.0, 14.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.36859893798828, -62.23651885986328, -60.10443878173828, -57.97235870361328, -55.84027862548828, -53.70819854736328, -51.57612228393555, -49.44404220581055, -47.31196212768555, -45.17988204956055, -43.04780197143555, -40.91572189331055, -38.78364562988281, -36.65156555175781, -34.51948547363281, -32.38740539550781, -30.255325317382812, -28.123245239257812, -25.991165161132812, -23.859086990356445, -21.727006912231445, -19.594926834106445, -17.462848663330078, -15.330768585205078, -13.198688507080078, -11.066608428955078, -8.934529304504395, -6.802449703216553, -4.670370101928711, -2.538290023803711, -0.40621089935302734, 1.7258682250976562, 3.8579559326171875, 5.990035533905029, 8.122115135192871, 10.254194259643555, 12.386274337768555, 14.518354415893555, 16.650432586669922, 18.782512664794922, 20.914592742919922, 23.046672821044922, 25.178752899169922, 27.31083106994629, 29.44291114807129, 31.57499122619629, 33.707069396972656, 35.839149475097656, 37.971229553222656, 40.103309631347656, 42.235389709472656, 44.367469787597656, 46.499549865722656, 48.631629943847656, 50.76370620727539, 52.89578628540039, 55.02786636352539, 57.15994644165039, 59.29202651977539, 61.42410659790039, 63.556182861328125, 65.68826293945312, 67.82034301757812, 69.95242309570312, 72.08450317382812]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 5.0, 4.0, 2.0, 8.0, 13.0, 15.0, 16.0, 19.0, 21.0, 26.0, 23.0, 26.0, 37.0, 39.0, 36.0, 41.0, 41.0, 38.0, 45.0, 32.0, 37.0, 52.0, 41.0, 47.0, 43.0, 31.0, 35.0, 33.0, 24.0, 28.0, 21.0, 22.0, 20.0, 12.0, 13.0, 14.0, 9.0, 7.0, 6.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.232139587402344, -13.773418426513672, -13.314697265625, -12.855976104736328, -12.397254943847656, -11.938533782958984, -11.479812622070312, -11.02109146118164, -10.562370300292969, -10.103649139404297, -9.644927978515625, -9.186206817626953, -8.727485656738281, -8.26876449584961, -7.8100433349609375, -7.351322174072266, -6.892601490020752, -6.43388032913208, -5.975159168243408, -5.516438007354736, -5.0577168464660645, -4.598996162414551, -4.140275001525879, -3.681553602218628, -3.222832441329956, -2.764111280441284, -2.3053901195526123, -1.84666907787323, -1.387947916984558, -0.9292268753051758, -0.4705057144165039, -0.011784553527832031, 0.44693660736083984, 0.9056577682495117, 1.3643789291381836, 1.823099970817566, 2.2818212509155273, 2.74054217338562, 3.199263334274292, 3.657984495162964, 4.116705894470215, 4.575427055358887, 5.034148216247559, 5.4928693771362305, 5.951590538024902, 6.410311698913574, 6.869032859802246, 7.327754020690918, 7.786474704742432, 8.245195388793945, 8.703916549682617, 9.162637710571289, 9.621358871459961, 10.080080032348633, 10.538801193237305, 10.997522354125977, 11.456243515014648, 11.91496467590332, 12.373685836791992, 12.832406997680664, 13.291128158569336, 13.749849319458008, 14.20857048034668, 14.667291641235352, 15.126012802124023]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 6.0, 8.0, 11.0, 28.0, 37.0, 62.0, 81.0, 155.0, 277.0, 482.0, 847.0, 1610.0, 3162.0, 7017.0, 16483.0, 44684.0, 132434.0, 325286.0, 317753.0, 126026.0, 42774.0, 16022.0, 6829.0, 3002.0, 1560.0, 840.0, 429.0, 278.0, 160.0, 79.0, 52.0, 22.0, 26.0, 9.0, 14.0, 4.0, 2.0, 2.0, 3.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515625, -2.44158935546875, -2.3675537109375, -2.29351806640625, -2.219482421875, -2.14544677734375, -2.0714111328125, -1.99737548828125, -1.92333984375, -1.84930419921875, -1.7752685546875, -1.70123291015625, -1.627197265625, -1.55316162109375, -1.4791259765625, -1.40509033203125, -1.3310546875, -1.25701904296875, -1.1829833984375, -1.10894775390625, -1.034912109375, -0.96087646484375, -0.8868408203125, -0.81280517578125, -0.73876953125, -0.66473388671875, -0.5906982421875, -0.51666259765625, -0.442626953125, -0.36859130859375, -0.2945556640625, -0.22052001953125, -0.146484375, -0.07244873046875, 0.0015869140625, 0.07562255859375, 0.149658203125, 0.22369384765625, 0.2977294921875, 0.37176513671875, 0.44580078125, 0.51983642578125, 0.5938720703125, 0.66790771484375, 0.741943359375, 0.81597900390625, 0.8900146484375, 0.96405029296875, 1.0380859375, 1.11212158203125, 1.1861572265625, 1.26019287109375, 1.334228515625, 1.40826416015625, 1.4822998046875, 1.55633544921875, 1.63037109375, 1.70440673828125, 1.7784423828125, 1.85247802734375, 1.926513671875, 2.00054931640625, 2.0745849609375, 2.14862060546875, 2.22265625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 9.0, 11.0, 10.0, 16.0, 19.0, 30.0, 39.0, 29.0, 36.0, 40.0, 47.0, 62.0, 61.0, 68.0, 71.0, 70.0, 67.0, 53.0, 47.0, 32.0, 51.0, 24.0, 15.0, 22.0, 20.0, 11.0, 9.0, 10.0, 5.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6064453125, -1.5473785400390625, -1.488311767578125, -1.4292449951171875, -1.37017822265625, -1.3111114501953125, -1.252044677734375, -1.1929779052734375, -1.1339111328125, -1.0748443603515625, -1.015777587890625, -0.9567108154296875, -0.89764404296875, -0.8385772705078125, -0.779510498046875, -0.7204437255859375, -0.661376953125, -0.6023101806640625, -0.543243408203125, -0.4841766357421875, -0.42510986328125, -0.3660430908203125, -0.306976318359375, -0.2479095458984375, -0.1888427734375, -0.1297760009765625, -0.070709228515625, -0.0116424560546875, 0.04742431640625, 0.1064910888671875, 0.165557861328125, 0.2246246337890625, 0.28369140625, 0.3427581787109375, 0.401824951171875, 0.4608917236328125, 0.51995849609375, 0.5790252685546875, 0.638092041015625, 0.6971588134765625, 0.7562255859375, 0.8152923583984375, 0.874359130859375, 0.9334259033203125, 0.99249267578125, 1.0515594482421875, 1.110626220703125, 1.1696929931640625, 1.228759765625, 1.2878265380859375, 1.346893310546875, 1.4059600830078125, 1.46502685546875, 1.5240936279296875, 1.583160400390625, 1.6422271728515625, 1.7012939453125, 1.7603607177734375, 1.819427490234375, 1.8784942626953125, 1.93756103515625, 1.9966278076171875, 2.055694580078125, 2.1147613525390625, 2.173828125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 10.0, 5.0, 7.0, 4.0, 8.0, 15.0, 17.0, 24.0, 41.0, 35.0, 65.0, 91.0, 123.0, 245.0, 464.0, 939.0, 2259.0, 6461.0, 25389.0, 149307.0, 666360.0, 159033.0, 26420.0, 6738.0, 2384.0, 935.0, 484.0, 245.0, 145.0, 93.0, 55.0, 40.0, 27.0, 23.0, 12.0, 14.0, 8.0, 5.0, 8.0, 3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-4.44921875, -4.31646728515625, -4.1837158203125, -4.05096435546875, -3.918212890625, -3.78546142578125, -3.6527099609375, -3.51995849609375, -3.38720703125, -3.25445556640625, -3.1217041015625, -2.98895263671875, -2.856201171875, -2.72344970703125, -2.5906982421875, -2.45794677734375, -2.3251953125, -2.19244384765625, -2.0596923828125, -1.92694091796875, -1.794189453125, -1.66143798828125, -1.5286865234375, -1.39593505859375, -1.26318359375, -1.13043212890625, -0.9976806640625, -0.86492919921875, -0.732177734375, -0.59942626953125, -0.4666748046875, -0.33392333984375, -0.201171875, -0.06842041015625, 0.0643310546875, 0.19708251953125, 0.329833984375, 0.46258544921875, 0.5953369140625, 0.72808837890625, 0.86083984375, 0.99359130859375, 1.1263427734375, 1.25909423828125, 1.391845703125, 1.52459716796875, 1.6573486328125, 1.79010009765625, 1.9228515625, 2.05560302734375, 2.1883544921875, 2.32110595703125, 2.453857421875, 2.58660888671875, 2.7193603515625, 2.85211181640625, 2.98486328125, 3.11761474609375, 3.2503662109375, 3.38311767578125, 3.515869140625, 3.64862060546875, 3.7813720703125, 3.91412353515625, 4.046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 8.0, 8.0, 6.0, 10.0, 16.0, 11.0, 11.0, 23.0, 25.0, 40.0, 43.0, 46.0, 35.0, 49.0, 54.0, 59.0, 34.0, 53.0, 46.0, 47.0, 47.0, 45.0, 38.0, 45.0, 33.0, 32.0, 21.0, 18.0, 15.0, 15.0, 9.0, 18.0, 6.0, 9.0, 9.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3046875, -5.12481689453125, -4.9449462890625, -4.76507568359375, -4.585205078125, -4.40533447265625, -4.2254638671875, -4.04559326171875, -3.86572265625, -3.68585205078125, -3.5059814453125, -3.32611083984375, -3.146240234375, -2.96636962890625, -2.7864990234375, -2.60662841796875, -2.4267578125, -2.24688720703125, -2.0670166015625, -1.88714599609375, -1.707275390625, -1.52740478515625, -1.3475341796875, -1.16766357421875, -0.98779296875, -0.80792236328125, -0.6280517578125, -0.44818115234375, -0.268310546875, -0.08843994140625, 0.0914306640625, 0.27130126953125, 0.451171875, 0.63104248046875, 0.8109130859375, 0.99078369140625, 1.170654296875, 1.35052490234375, 1.5303955078125, 1.71026611328125, 1.89013671875, 2.07000732421875, 2.2498779296875, 2.42974853515625, 2.609619140625, 2.78948974609375, 2.9693603515625, 3.14923095703125, 3.3291015625, 3.50897216796875, 3.6888427734375, 3.86871337890625, 4.048583984375, 4.22845458984375, 4.4083251953125, 4.58819580078125, 4.76806640625, 4.94793701171875, 5.1278076171875, 5.30767822265625, 5.487548828125, 5.66741943359375, 5.8472900390625, 6.02716064453125, 6.20703125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 12.0, 11.0, 25.0, 39.0, 43.0, 74.0, 93.0, 152.0, 228.0, 344.0, 521.0, 955.0, 1614.0, 3000.0, 6375.0, 17497.0, 65236.0, 344082.0, 506201.0, 69536.0, 18518.0, 6686.0, 3085.0, 1648.0, 936.0, 561.0, 365.0, 255.0, 145.0, 94.0, 71.0, 57.0, 27.0, 22.0, 12.0, 7.0, 11.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.130859375, -1.0944061279296875, -1.057952880859375, -1.0214996337890625, -0.98504638671875, -0.9485931396484375, -0.912139892578125, -0.8756866455078125, -0.8392333984375, -0.8027801513671875, -0.766326904296875, -0.7298736572265625, -0.69342041015625, -0.6569671630859375, -0.620513916015625, -0.5840606689453125, -0.547607421875, -0.5111541748046875, -0.474700927734375, -0.4382476806640625, -0.40179443359375, -0.3653411865234375, -0.328887939453125, -0.2924346923828125, -0.2559814453125, -0.2195281982421875, -0.183074951171875, -0.1466217041015625, -0.11016845703125, -0.0737152099609375, -0.037261962890625, -0.0008087158203125, 0.03564453125, 0.0720977783203125, 0.108551025390625, 0.1450042724609375, 0.18145751953125, 0.2179107666015625, 0.254364013671875, 0.2908172607421875, 0.3272705078125, 0.3637237548828125, 0.400177001953125, 0.4366302490234375, 0.47308349609375, 0.5095367431640625, 0.545989990234375, 0.5824432373046875, 0.618896484375, 0.6553497314453125, 0.691802978515625, 0.7282562255859375, 0.76470947265625, 0.8011627197265625, 0.837615966796875, 0.8740692138671875, 0.9105224609375, 0.9469757080078125, 0.983428955078125, 1.0198822021484375, 1.05633544921875, 1.0927886962890625, 1.129241943359375, 1.1656951904296875, 1.2021484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 10.0, 12.0, 23.0, 56.0, 128.0, 256.0, 224.0, 158.0, 59.0, 28.0, 15.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006465911865234375, -0.0006243810057640076, -0.0006021708250045776, -0.0005799606442451477, -0.0005577504634857178, -0.0005355402827262878, -0.0005133301019668579, -0.000491119921207428, -0.00046890974044799805, -0.0004466995596885681, -0.0004244893789291382, -0.00040227919816970825, -0.0003800690174102783, -0.0003578588366508484, -0.00033564865589141846, -0.0003134384751319885, -0.0002912282943725586, -0.00026901811361312866, -0.00024680793285369873, -0.0002245977520942688, -0.00020238757133483887, -0.00018017739057540894, -0.000157967209815979, -0.00013575702905654907, -0.00011354684829711914, -9.133666753768921e-05, -6.912648677825928e-05, -4.6916306018829346e-05, -2.4706125259399414e-05, -2.4959444999694824e-06, 1.971423625946045e-05, 4.192441701889038e-05, 6.413459777832031e-05, 8.634477853775024e-05, 0.00010855495929718018, 0.0001307651400566101, 0.00015297532081604004, 0.00017518550157546997, 0.0001973956823348999, 0.00021960586309432983, 0.00024181604385375977, 0.0002640262246131897, 0.00028623640537261963, 0.00030844658613204956, 0.0003306567668914795, 0.0003528669476509094, 0.00037507712841033936, 0.0003972873091697693, 0.0004194974899291992, 0.00044170767068862915, 0.0004639178514480591, 0.000486128032207489, 0.0005083382129669189, 0.0005305483937263489, 0.0005527585744857788, 0.0005749687552452087, 0.0005971789360046387, 0.0006193891167640686, 0.0006415992975234985, 0.0006638094782829285, 0.0006860196590423584, 0.0007082298398017883, 0.0007304400205612183, 0.0007526502013206482, 0.0007748603820800781]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 5.0, 2.0, 3.0, 8.0, 13.0, 10.0, 20.0, 37.0, 43.0, 82.0, 116.0, 199.0, 376.0, 679.0, 1332.0, 2950.0, 7163.0, 20885.0, 79165.0, 519086.0, 317865.0, 68002.0, 18632.0, 6477.0, 2692.0, 1247.0, 628.0, 307.0, 189.0, 100.0, 93.0, 45.0, 32.0, 28.0, 13.0, 9.0, 5.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1923828125, -1.155059814453125, -1.11773681640625, -1.080413818359375, -1.0430908203125, -1.005767822265625, -0.96844482421875, -0.931121826171875, -0.893798828125, -0.856475830078125, -0.81915283203125, -0.781829833984375, -0.7445068359375, -0.707183837890625, -0.66986083984375, -0.632537841796875, -0.59521484375, -0.557891845703125, -0.52056884765625, -0.483245849609375, -0.4459228515625, -0.408599853515625, -0.37127685546875, -0.333953857421875, -0.296630859375, -0.259307861328125, -0.22198486328125, -0.184661865234375, -0.1473388671875, -0.110015869140625, -0.07269287109375, -0.035369873046875, 0.001953125, 0.039276123046875, 0.07659912109375, 0.113922119140625, 0.1512451171875, 0.188568115234375, 0.22589111328125, 0.263214111328125, 0.300537109375, 0.337860107421875, 0.37518310546875, 0.412506103515625, 0.4498291015625, 0.487152099609375, 0.52447509765625, 0.561798095703125, 0.59912109375, 0.636444091796875, 0.67376708984375, 0.711090087890625, 0.7484130859375, 0.785736083984375, 0.82305908203125, 0.860382080078125, 0.897705078125, 0.935028076171875, 0.97235107421875, 1.009674072265625, 1.0469970703125, 1.084320068359375, 1.12164306640625, 1.158966064453125, 1.1962890625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 0.0, 1.0, 6.0, 7.0, 7.0, 8.0, 12.0, 19.0, 22.0, 29.0, 39.0, 66.0, 61.0, 98.0, 104.0, 88.0, 92.0, 75.0, 66.0, 48.0, 38.0, 26.0, 16.0, 14.0, 12.0, 8.0, 6.0, 2.0, 8.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.638671875, -1.5968780517578125, -1.555084228515625, -1.5132904052734375, -1.47149658203125, -1.4297027587890625, -1.387908935546875, -1.3461151123046875, -1.3043212890625, -1.2625274658203125, -1.220733642578125, -1.1789398193359375, -1.13714599609375, -1.0953521728515625, -1.053558349609375, -1.0117645263671875, -0.969970703125, -0.9281768798828125, -0.886383056640625, -0.8445892333984375, -0.80279541015625, -0.7610015869140625, -0.719207763671875, -0.6774139404296875, -0.6356201171875, -0.5938262939453125, -0.552032470703125, -0.5102386474609375, -0.46844482421875, -0.4266510009765625, -0.384857177734375, -0.3430633544921875, -0.30126953125, -0.2594757080078125, -0.217681884765625, -0.1758880615234375, -0.13409423828125, -0.0923004150390625, -0.050506591796875, -0.0087127685546875, 0.0330810546875, 0.0748748779296875, 0.116668701171875, 0.1584625244140625, 0.20025634765625, 0.2420501708984375, 0.283843994140625, 0.3256378173828125, 0.367431640625, 0.4092254638671875, 0.451019287109375, 0.4928131103515625, 0.53460693359375, 0.5764007568359375, 0.618194580078125, 0.6599884033203125, 0.7017822265625, 0.7435760498046875, 0.785369873046875, 0.8271636962890625, 0.86895751953125, 0.9107513427734375, 0.952545166015625, 0.9943389892578125, 1.0361328125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 20.0, 28.0, 91.0, 196.0, 344.0, 187.0, 77.0, 27.0, 13.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.93738555908203, -60.37105941772461, -58.80473327636719, -57.23841094970703, -55.67208480834961, -54.10575866699219, -52.539432525634766, -50.973106384277344, -49.40678024291992, -47.8404541015625, -46.27412796020508, -44.707801818847656, -43.1414794921875, -41.57515335083008, -40.008827209472656, -38.442501068115234, -36.87617492675781, -35.30984878540039, -33.74352264404297, -32.17720031738281, -30.610872268676758, -29.04454803466797, -27.478221893310547, -25.911895751953125, -24.34557342529297, -22.779247283935547, -21.212923049926758, -19.646596908569336, -18.080270767211914, -16.513946533203125, -14.947620391845703, -13.381294250488281, -11.81496810913086, -10.248642921447754, -8.682316780090332, -7.115991592407227, -5.549665927886963, -3.983340263366699, -2.4170150756835938, -0.8506889343261719, 0.7156362533569336, 2.2819619178771973, 3.848287343978882, 5.414612770080566, 6.98093843460083, 8.547264099121094, 10.1135892868042, 11.679915428161621, 13.246240615844727, 14.812565803527832, 16.378890991210938, 17.94521713256836, 19.51154327392578, 21.077869415283203, 22.644193649291992, 24.210519790649414, 25.776844024658203, 27.343170166015625, 28.909494400024414, 30.475820541381836, 32.042144775390625, 33.60847091674805, 35.17479705810547, 36.74112319946289, 38.30744934082031]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 6.0, 7.0, 8.0, 10.0, 11.0, 12.0, 18.0, 25.0, 26.0, 37.0, 45.0, 36.0, 49.0, 53.0, 80.0, 97.0, 88.0, 85.0, 52.0, 39.0, 36.0, 33.0, 22.0, 31.0, 20.0, 20.0, 15.0, 13.0, 8.0, 10.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.187742233276367, -18.34599494934082, -17.504247665405273, -16.662500381469727, -15.82075309753418, -14.979005813598633, -14.137258529663086, -13.295511245727539, -12.453763961791992, -11.612016677856445, -10.770269393920898, -9.928522109985352, -9.086774826049805, -8.245027542114258, -7.403280258178711, -6.561532974243164, -5.719785690307617, -4.87803840637207, -4.036291122436523, -3.1945438385009766, -2.3527965545654297, -1.5110492706298828, -0.6693019866943359, 0.17244529724121094, 1.0141925811767578, 1.8559398651123047, 2.6976871490478516, 3.5394344329833984, 4.381181716918945, 5.222929000854492, 6.064676284790039, 6.906423568725586, 7.7481689453125, 8.589916229248047, 9.431663513183594, 10.27341079711914, 11.115158081054688, 11.956905364990234, 12.798652648925781, 13.640399932861328, 14.482147216796875, 15.323894500732422, 16.16564178466797, 17.007389068603516, 17.849136352539062, 18.69088363647461, 19.532630920410156, 20.374378204345703, 21.21612548828125, 22.057872772216797, 22.899620056152344, 23.74136734008789, 24.583114624023438, 25.424861907958984, 26.26660919189453, 27.108356475830078, 27.950103759765625, 28.791851043701172, 29.63359832763672, 30.475345611572266, 31.317092895507812, 32.15884017944336, 33.000587463378906, 33.84233474731445, 34.68408203125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 8.0, 6.0, 12.0, 19.0, 18.0, 42.0, 44.0, 83.0, 101.0, 169.0, 218.0, 315.0, 504.0, 899.0, 1464.0, 2359.0, 4649.0, 9910.0, 24718.0, 77978.0, 319244.0, 1351320.0, 1766108.0, 472550.0, 107408.0, 30761.0, 11419.0, 5220.0, 2620.0, 1461.0, 886.0, 584.0, 369.0, 242.0, 168.0, 118.0, 87.0, 46.0, 59.0, 22.0, 27.0, 16.0, 13.0, 8.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.4267578125, -1.38494873046875, -1.3431396484375, -1.30133056640625, -1.259521484375, -1.21771240234375, -1.1759033203125, -1.13409423828125, -1.09228515625, -1.05047607421875, -1.0086669921875, -0.96685791015625, -0.925048828125, -0.88323974609375, -0.8414306640625, -0.79962158203125, -0.7578125, -0.71600341796875, -0.6741943359375, -0.63238525390625, -0.590576171875, -0.54876708984375, -0.5069580078125, -0.46514892578125, -0.42333984375, -0.38153076171875, -0.3397216796875, -0.29791259765625, -0.256103515625, -0.21429443359375, -0.1724853515625, -0.13067626953125, -0.0888671875, -0.04705810546875, -0.0052490234375, 0.03656005859375, 0.078369140625, 0.12017822265625, 0.1619873046875, 0.20379638671875, 0.24560546875, 0.28741455078125, 0.3292236328125, 0.37103271484375, 0.412841796875, 0.45465087890625, 0.4964599609375, 0.53826904296875, 0.580078125, 0.62188720703125, 0.6636962890625, 0.70550537109375, 0.747314453125, 0.78912353515625, 0.8309326171875, 0.87274169921875, 0.91455078125, 0.95635986328125, 0.9981689453125, 1.03997802734375, 1.081787109375, 1.12359619140625, 1.1654052734375, 1.20721435546875, 1.2490234375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 10.0, 8.0, 5.0, 14.0, 21.0, 29.0, 22.0, 29.0, 33.0, 50.0, 43.0, 38.0, 53.0, 52.0, 49.0, 69.0, 61.0, 54.0, 40.0, 37.0, 43.0, 31.0, 32.0, 44.0, 21.0, 24.0, 13.0, 22.0, 12.0, 3.0, 6.0, 9.0, 6.0, 0.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2666015625, -1.2168731689453125, -1.167144775390625, -1.1174163818359375, -1.06768798828125, -1.0179595947265625, -0.968231201171875, -0.9185028076171875, -0.8687744140625, -0.8190460205078125, -0.769317626953125, -0.7195892333984375, -0.66986083984375, -0.6201324462890625, -0.570404052734375, -0.5206756591796875, -0.470947265625, -0.4212188720703125, -0.371490478515625, -0.3217620849609375, -0.27203369140625, -0.2223052978515625, -0.172576904296875, -0.1228485107421875, -0.0731201171875, -0.0233917236328125, 0.026336669921875, 0.0760650634765625, 0.12579345703125, 0.1755218505859375, 0.225250244140625, 0.2749786376953125, 0.32470703125, 0.3744354248046875, 0.424163818359375, 0.4738922119140625, 0.52362060546875, 0.5733489990234375, 0.623077392578125, 0.6728057861328125, 0.7225341796875, 0.7722625732421875, 0.821990966796875, 0.8717193603515625, 0.92144775390625, 0.9711761474609375, 1.020904541015625, 1.0706329345703125, 1.120361328125, 1.1700897216796875, 1.219818115234375, 1.2695465087890625, 1.31927490234375, 1.3690032958984375, 1.418731689453125, 1.4684600830078125, 1.5181884765625, 1.5679168701171875, 1.617645263671875, 1.6673736572265625, 1.71710205078125, 1.7668304443359375, 1.816558837890625, 1.8662872314453125, 1.916015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 9.0, 7.0, 18.0, 48.0, 69.0, 144.0, 400.0, 1566.0, 10428.0, 630114.0, 3524817.0, 23333.0, 2340.0, 568.0, 226.0, 87.0, 47.0, 16.0, 13.0, 7.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.28515625, -6.04473876953125, -5.8043212890625, -5.56390380859375, -5.323486328125, -5.08306884765625, -4.8426513671875, -4.60223388671875, -4.36181640625, -4.12139892578125, -3.8809814453125, -3.64056396484375, -3.400146484375, -3.15972900390625, -2.9193115234375, -2.67889404296875, -2.4384765625, -2.19805908203125, -1.9576416015625, -1.71722412109375, -1.476806640625, -1.23638916015625, -0.9959716796875, -0.75555419921875, -0.51513671875, -0.27471923828125, -0.0343017578125, 0.20611572265625, 0.446533203125, 0.68695068359375, 0.9273681640625, 1.16778564453125, 1.408203125, 1.64862060546875, 1.8890380859375, 2.12945556640625, 2.369873046875, 2.61029052734375, 2.8507080078125, 3.09112548828125, 3.33154296875, 3.57196044921875, 3.8123779296875, 4.05279541015625, 4.293212890625, 4.53363037109375, 4.7740478515625, 5.01446533203125, 5.2548828125, 5.49530029296875, 5.7357177734375, 5.97613525390625, 6.216552734375, 6.45697021484375, 6.6973876953125, 6.93780517578125, 7.17822265625, 7.41864013671875, 7.6590576171875, 7.89947509765625, 8.139892578125, 8.38031005859375, 8.6207275390625, 8.86114501953125, 9.1015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 10.0, 11.0, 15.0, 38.0, 63.0, 84.0, 175.0, 357.0, 826.0, 1047.0, 724.0, 356.0, 152.0, 82.0, 32.0, 35.0, 23.0, 14.0, 10.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.2237548828125, -5.076416015625, -4.9290771484375, -4.78173828125, -4.6343994140625, -4.487060546875, -4.3397216796875, -4.1923828125, -4.0450439453125, -3.897705078125, -3.7503662109375, -3.60302734375, -3.4556884765625, -3.308349609375, -3.1610107421875, -3.013671875, -2.8663330078125, -2.718994140625, -2.5716552734375, -2.42431640625, -2.2769775390625, -2.129638671875, -1.9822998046875, -1.8349609375, -1.6876220703125, -1.540283203125, -1.3929443359375, -1.24560546875, -1.0982666015625, -0.950927734375, -0.8035888671875, -0.65625, -0.5089111328125, -0.361572265625, -0.2142333984375, -0.06689453125, 0.0804443359375, 0.227783203125, 0.3751220703125, 0.5224609375, 0.6697998046875, 0.817138671875, 0.9644775390625, 1.11181640625, 1.2591552734375, 1.406494140625, 1.5538330078125, 1.701171875, 1.8485107421875, 1.995849609375, 2.1431884765625, 2.29052734375, 2.4378662109375, 2.585205078125, 2.7325439453125, 2.8798828125, 3.0272216796875, 3.174560546875, 3.3218994140625, 3.46923828125, 3.6165771484375, 3.763916015625, 3.9112548828125, 4.05859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 1.0, 5.0, 11.0, 34.0, 48.0, 117.0, 165.0, 220.0, 179.0, 100.0, 64.0, 31.0, 18.0, 1.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.15801239013672, -34.08146286010742, -33.00490951538086, -31.928359985351562, -30.851810455322266, -29.775259017944336, -28.698707580566406, -27.62215805053711, -26.54560661315918, -25.46905517578125, -24.392505645751953, -23.315954208374023, -22.239402770996094, -21.162853240966797, -20.086301803588867, -19.009750366210938, -17.93320083618164, -16.85664939880371, -15.780099868774414, -14.703548431396484, -13.626997947692871, -12.550447463989258, -11.473896026611328, -10.397345542907715, -9.320795059204102, -8.244244575500488, -7.167693614959717, -6.091142654418945, -5.014592170715332, -3.9380416870117188, -2.8614907264709473, -1.7849397659301758, -0.7083930969238281, 0.36815762519836426, 1.4447083473205566, 2.521259069442749, 3.5978097915649414, 4.674360275268555, 5.750911235809326, 6.827462196350098, 7.904012680053711, 8.980563163757324, 10.057113647460938, 11.133665084838867, 12.21021556854248, 13.286766052246094, 14.363317489624023, 15.439867973327637, 16.51641845703125, 17.59296989440918, 18.669519424438477, 19.746070861816406, 20.822620391845703, 21.899171829223633, 22.975723266601562, 24.05227279663086, 25.12882423400879, 26.20537567138672, 27.281925201416016, 28.358476638793945, 29.435028076171875, 30.511577606201172, 31.5881290435791, 32.66468048095703, 33.74123001098633]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 13.0, 12.0, 12.0, 12.0, 13.0, 17.0, 21.0, 25.0, 19.0, 30.0, 43.0, 47.0, 34.0, 42.0, 63.0, 55.0, 45.0, 64.0, 56.0, 50.0, 51.0, 31.0, 32.0, 36.0, 23.0, 21.0, 22.0, 16.0, 16.0, 20.0, 6.0, 12.0, 4.0, 6.0, 7.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.210481643676758, -13.767874717712402, -13.325267791748047, -12.882659912109375, -12.44005298614502, -11.997446060180664, -11.554838180541992, -11.112231254577637, -10.669624328613281, -10.227017402648926, -9.78441047668457, -9.341802597045898, -8.899195671081543, -8.456588745117188, -8.013980865478516, -7.57137393951416, -7.128767013549805, -6.686160087585449, -6.2435526847839355, -5.800945281982422, -5.358338356018066, -4.915731430053711, -4.473124027252197, -4.030516624450684, -3.587909698486328, -3.1453025341033936, -2.702695369720459, -2.2600882053375244, -1.8174810409545898, -1.3748738765716553, -0.9322667121887207, -0.48965954780578613, -0.04705238342285156, 0.395554780960083, 0.8381619453430176, 1.2807691097259521, 1.7233762741088867, 2.1659834384918213, 2.608590602874756, 3.0511977672576904, 3.493804931640625, 3.9364120960235596, 4.379019260406494, 4.821626663208008, 5.264233589172363, 5.706840515136719, 6.149447917938232, 6.592055320739746, 7.034662246704102, 7.477269172668457, 7.919876575469971, 8.362483978271484, 8.80509090423584, 9.247697830200195, 9.690305709838867, 10.132912635803223, 10.575519561767578, 11.018126487731934, 11.460733413696289, 11.903341293334961, 12.345948219299316, 12.788555145263672, 13.231163024902344, 13.6737699508667, 14.116376876831055]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 15.0, 25.0, 35.0, 48.0, 88.0, 148.0, 255.0, 419.0, 757.0, 1368.0, 2460.0, 4650.0, 9407.0, 20036.0, 45955.0, 114638.0, 271053.0, 317387.0, 151068.0, 59733.0, 25139.0, 11614.0, 5588.0, 3022.0, 1557.0, 873.0, 502.0, 290.0, 161.0, 100.0, 55.0, 35.0, 34.0, 14.0, 7.0, 5.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6552734375, -1.598480224609375, -1.54168701171875, -1.484893798828125, -1.4281005859375, -1.371307373046875, -1.31451416015625, -1.257720947265625, -1.200927734375, -1.144134521484375, -1.08734130859375, -1.030548095703125, -0.9737548828125, -0.916961669921875, -0.86016845703125, -0.803375244140625, -0.74658203125, -0.689788818359375, -0.63299560546875, -0.576202392578125, -0.5194091796875, -0.462615966796875, -0.40582275390625, -0.349029541015625, -0.292236328125, -0.235443115234375, -0.17864990234375, -0.121856689453125, -0.0650634765625, -0.008270263671875, 0.04852294921875, 0.105316162109375, 0.162109375, 0.218902587890625, 0.27569580078125, 0.332489013671875, 0.3892822265625, 0.446075439453125, 0.50286865234375, 0.559661865234375, 0.616455078125, 0.673248291015625, 0.73004150390625, 0.786834716796875, 0.8436279296875, 0.900421142578125, 0.95721435546875, 1.014007568359375, 1.07080078125, 1.127593994140625, 1.18438720703125, 1.241180419921875, 1.2979736328125, 1.354766845703125, 1.41156005859375, 1.468353271484375, 1.525146484375, 1.581939697265625, 1.63873291015625, 1.695526123046875, 1.7523193359375, 1.809112548828125, 1.86590576171875, 1.922698974609375, 1.9794921875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 3.0, 2.0, 3.0, 2.0, 12.0, 13.0, 15.0, 16.0, 18.0, 25.0, 31.0, 35.0, 31.0, 37.0, 46.0, 44.0, 56.0, 58.0, 52.0, 63.0, 60.0, 38.0, 46.0, 35.0, 40.0, 27.0, 36.0, 26.0, 26.0, 25.0, 23.0, 16.0, 16.0, 7.0, 6.0, 6.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.419921875, -1.36785888671875, -1.3157958984375, -1.26373291015625, -1.211669921875, -1.15960693359375, -1.1075439453125, -1.05548095703125, -1.00341796875, -0.95135498046875, -0.8992919921875, -0.84722900390625, -0.795166015625, -0.74310302734375, -0.6910400390625, -0.63897705078125, -0.5869140625, -0.53485107421875, -0.4827880859375, -0.43072509765625, -0.378662109375, -0.32659912109375, -0.2745361328125, -0.22247314453125, -0.17041015625, -0.11834716796875, -0.0662841796875, -0.01422119140625, 0.037841796875, 0.08990478515625, 0.1419677734375, 0.19403076171875, 0.24609375, 0.29815673828125, 0.3502197265625, 0.40228271484375, 0.454345703125, 0.50640869140625, 0.5584716796875, 0.61053466796875, 0.66259765625, 0.71466064453125, 0.7667236328125, 0.81878662109375, 0.870849609375, 0.92291259765625, 0.9749755859375, 1.02703857421875, 1.0791015625, 1.13116455078125, 1.1832275390625, 1.23529052734375, 1.287353515625, 1.33941650390625, 1.3914794921875, 1.44354248046875, 1.49560546875, 1.54766845703125, 1.5997314453125, 1.65179443359375, 1.703857421875, 1.75592041015625, 1.8079833984375, 1.86004638671875, 1.912109375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 3.0, 5.0, 14.0, 19.0, 28.0, 52.0, 81.0, 124.0, 196.0, 357.0, 778.0, 2328.0, 11402.0, 144018.0, 831095.0, 49557.0, 5737.0, 1481.0, 570.0, 253.0, 160.0, 89.0, 82.0, 42.0, 27.0, 24.0, 7.0, 7.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3359375, -5.1331787109375, -4.930419921875, -4.7276611328125, -4.52490234375, -4.3221435546875, -4.119384765625, -3.9166259765625, -3.7138671875, -3.5111083984375, -3.308349609375, -3.1055908203125, -2.90283203125, -2.7000732421875, -2.497314453125, -2.2945556640625, -2.091796875, -1.8890380859375, -1.686279296875, -1.4835205078125, -1.28076171875, -1.0780029296875, -0.875244140625, -0.6724853515625, -0.4697265625, -0.2669677734375, -0.064208984375, 0.1385498046875, 0.34130859375, 0.5440673828125, 0.746826171875, 0.9495849609375, 1.15234375, 1.3551025390625, 1.557861328125, 1.7606201171875, 1.96337890625, 2.1661376953125, 2.368896484375, 2.5716552734375, 2.7744140625, 2.9771728515625, 3.179931640625, 3.3826904296875, 3.58544921875, 3.7882080078125, 3.990966796875, 4.1937255859375, 4.396484375, 4.5992431640625, 4.802001953125, 5.0047607421875, 5.20751953125, 5.4102783203125, 5.613037109375, 5.8157958984375, 6.0185546875, 6.2213134765625, 6.424072265625, 6.6268310546875, 6.82958984375, 7.0323486328125, 7.235107421875, 7.4378662109375, 7.640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 9.0, 8.0, 15.0, 9.0, 25.0, 16.0, 36.0, 36.0, 37.0, 47.0, 42.0, 53.0, 69.0, 76.0, 82.0, 61.0, 72.0, 54.0, 59.0, 41.0, 41.0, 18.0, 19.0, 18.0, 14.0, 10.0, 11.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.81640625, -6.57305908203125, -6.3297119140625, -6.08636474609375, -5.843017578125, -5.59967041015625, -5.3563232421875, -5.11297607421875, -4.86962890625, -4.62628173828125, -4.3829345703125, -4.13958740234375, -3.896240234375, -3.65289306640625, -3.4095458984375, -3.16619873046875, -2.9228515625, -2.67950439453125, -2.4361572265625, -2.19281005859375, -1.949462890625, -1.70611572265625, -1.4627685546875, -1.21942138671875, -0.97607421875, -0.73272705078125, -0.4893798828125, -0.24603271484375, -0.002685546875, 0.24066162109375, 0.4840087890625, 0.72735595703125, 0.970703125, 1.21405029296875, 1.4573974609375, 1.70074462890625, 1.944091796875, 2.18743896484375, 2.4307861328125, 2.67413330078125, 2.91748046875, 3.16082763671875, 3.4041748046875, 3.64752197265625, 3.890869140625, 4.13421630859375, 4.3775634765625, 4.62091064453125, 4.8642578125, 5.10760498046875, 5.3509521484375, 5.59429931640625, 5.837646484375, 6.08099365234375, 6.3243408203125, 6.56768798828125, 6.81103515625, 7.05438232421875, 7.2977294921875, 7.54107666015625, 7.784423828125, 8.02777099609375, 8.2711181640625, 8.51446533203125, 8.7578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 7.0, 10.0, 10.0, 16.0, 18.0, 32.0, 48.0, 55.0, 89.0, 114.0, 229.0, 365.0, 668.0, 1236.0, 2589.0, 6101.0, 17402.0, 64899.0, 649301.0, 241469.0, 42044.0, 12585.0, 4787.0, 2068.0, 955.0, 560.0, 316.0, 204.0, 113.0, 67.0, 59.0, 33.0, 30.0, 8.0, 15.0, 15.0, 9.0, 5.0, 8.0, 3.0, 0.0, 1.0, 2.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0947265625, -1.0614013671875, -1.028076171875, -0.9947509765625, -0.96142578125, -0.9281005859375, -0.894775390625, -0.8614501953125, -0.828125, -0.7947998046875, -0.761474609375, -0.7281494140625, -0.69482421875, -0.6614990234375, -0.628173828125, -0.5948486328125, -0.5615234375, -0.5281982421875, -0.494873046875, -0.4615478515625, -0.42822265625, -0.3948974609375, -0.361572265625, -0.3282470703125, -0.294921875, -0.2615966796875, -0.228271484375, -0.1949462890625, -0.16162109375, -0.1282958984375, -0.094970703125, -0.0616455078125, -0.0283203125, 0.0050048828125, 0.038330078125, 0.0716552734375, 0.10498046875, 0.1383056640625, 0.171630859375, 0.2049560546875, 0.23828125, 0.2716064453125, 0.304931640625, 0.3382568359375, 0.37158203125, 0.4049072265625, 0.438232421875, 0.4715576171875, 0.5048828125, 0.5382080078125, 0.571533203125, 0.6048583984375, 0.63818359375, 0.6715087890625, 0.704833984375, 0.7381591796875, 0.771484375, 0.8048095703125, 0.838134765625, 0.8714599609375, 0.90478515625, 0.9381103515625, 0.971435546875, 1.0047607421875, 1.0380859375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 3.0, 9.0, 6.0, 7.0, 11.0, 19.0, 18.0, 32.0, 52.0, 83.0, 163.0, 179.0, 153.0, 81.0, 55.0, 32.0, 28.0, 21.0, 11.0, 5.0, 9.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003819465637207031, -0.0003694407641887665, -0.00035693496465682983, -0.0003444291651248932, -0.00033192336559295654, -0.0003194175660610199, -0.00030691176652908325, -0.0002944059669971466, -0.00028190016746520996, -0.0002693943679332733, -0.00025688856840133667, -0.0002443827688694, -0.00023187696933746338, -0.00021937116980552673, -0.0002068653702735901, -0.00019435957074165344, -0.0001818537712097168, -0.00016934797167778015, -0.0001568421721458435, -0.00014433637261390686, -0.00013183057308197021, -0.00011932477355003357, -0.00010681897401809692, -9.431317448616028e-05, -8.180737495422363e-05, -6.930157542228699e-05, -5.679577589035034e-05, -4.4289976358413696e-05, -3.178417682647705e-05, -1.9278377294540405e-05, -6.77257776260376e-06, 5.733221769332886e-06, 1.823902130126953e-05, 3.074482083320618e-05, 4.325062036514282e-05, 5.575641989707947e-05, 6.826221942901611e-05, 8.076801896095276e-05, 9.32738184928894e-05, 0.00010577961802482605, 0.0001182854175567627, 0.00013079121708869934, 0.00014329701662063599, 0.00015580281615257263, 0.00016830861568450928, 0.00018081441521644592, 0.00019332021474838257, 0.00020582601428031921, 0.00021833181381225586, 0.0002308376133441925, 0.00024334341287612915, 0.0002558492124080658, 0.00026835501194000244, 0.0002808608114719391, 0.00029336661100387573, 0.0003058724105358124, 0.000318378210067749, 0.00033088400959968567, 0.0003433898091316223, 0.00035589560866355896, 0.0003684014081954956, 0.00038090720772743225, 0.0003934130072593689, 0.00040591880679130554, 0.0004184246063232422]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 3.0, 9.0, 9.0, 17.0, 18.0, 17.0, 22.0, 38.0, 48.0, 73.0, 99.0, 152.0, 286.0, 439.0, 687.0, 1379.0, 2646.0, 5924.0, 15234.0, 44145.0, 173070.0, 639764.0, 111210.0, 31990.0, 11600.0, 4651.0, 2276.0, 1046.0, 576.0, 380.0, 240.0, 151.0, 94.0, 71.0, 50.0, 37.0, 25.0, 18.0, 9.0, 15.0, 8.0, 5.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.8642578125, -0.8375473022460938, -0.8108367919921875, -0.7841262817382812, -0.757415771484375, -0.7307052612304688, -0.7039947509765625, -0.6772842407226562, -0.65057373046875, -0.6238632202148438, -0.5971527099609375, -0.5704421997070312, -0.543731689453125, -0.5170211791992188, -0.4903106689453125, -0.46360015869140625, -0.4368896484375, -0.41017913818359375, -0.3834686279296875, -0.35675811767578125, -0.330047607421875, -0.30333709716796875, -0.2766265869140625, -0.24991607666015625, -0.22320556640625, -0.19649505615234375, -0.1697845458984375, -0.14307403564453125, -0.116363525390625, -0.08965301513671875, -0.0629425048828125, -0.03623199462890625, -0.009521484375, 0.01718902587890625, 0.0438995361328125, 0.07061004638671875, 0.097320556640625, 0.12403106689453125, 0.1507415771484375, 0.17745208740234375, 0.20416259765625, 0.23087310791015625, 0.2575836181640625, 0.28429412841796875, 0.311004638671875, 0.33771514892578125, 0.3644256591796875, 0.39113616943359375, 0.4178466796875, 0.44455718994140625, 0.4712677001953125, 0.49797821044921875, 0.524688720703125, 0.5513992309570312, 0.5781097412109375, 0.6048202514648438, 0.63153076171875, 0.6582412719726562, 0.6849517822265625, 0.7116622924804688, 0.738372802734375, 0.7650833129882812, 0.7917938232421875, 0.8185043334960938, 0.84521484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 0.0, 3.0, 1.0, 1.0, 5.0, 1.0, 5.0, 2.0, 7.0, 9.0, 10.0, 14.0, 15.0, 8.0, 14.0, 23.0, 34.0, 32.0, 60.0, 65.0, 61.0, 107.0, 87.0, 90.0, 70.0, 61.0, 26.0, 32.0, 28.0, 22.0, 20.0, 12.0, 12.0, 14.0, 8.0, 1.0, 5.0, 9.0, 7.0, 8.0, 5.0, 1.0, 5.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9423828125, -0.9130706787109375, -0.883758544921875, -0.8544464111328125, -0.82513427734375, -0.7958221435546875, -0.766510009765625, -0.7371978759765625, -0.7078857421875, -0.6785736083984375, -0.649261474609375, -0.6199493408203125, -0.59063720703125, -0.5613250732421875, -0.532012939453125, -0.5027008056640625, -0.473388671875, -0.4440765380859375, -0.414764404296875, -0.3854522705078125, -0.35614013671875, -0.3268280029296875, -0.297515869140625, -0.2682037353515625, -0.2388916015625, -0.2095794677734375, -0.180267333984375, -0.1509552001953125, -0.12164306640625, -0.0923309326171875, -0.063018798828125, -0.0337066650390625, -0.00439453125, 0.0249176025390625, 0.054229736328125, 0.0835418701171875, 0.11285400390625, 0.1421661376953125, 0.171478271484375, 0.2007904052734375, 0.2301025390625, 0.2594146728515625, 0.288726806640625, 0.3180389404296875, 0.34735107421875, 0.3766632080078125, 0.405975341796875, 0.4352874755859375, 0.464599609375, 0.4939117431640625, 0.523223876953125, 0.5525360107421875, 0.58184814453125, 0.6111602783203125, 0.640472412109375, 0.6697845458984375, 0.6990966796875, 0.7284088134765625, 0.757720947265625, 0.7870330810546875, 0.81634521484375, 0.8456573486328125, 0.874969482421875, 0.9042816162109375, 0.93359375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 3.0, 8.0, 6.0, 32.0, 98.0, 235.0, 436.0, 125.0, 44.0, 13.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.7462158203125, -71.06510925292969, -69.38400268554688, -67.70289611816406, -66.02178955078125, -64.34068298339844, -62.659576416015625, -60.97846984863281, -59.29736328125, -57.61625671386719, -55.935150146484375, -54.25404357910156, -52.57293701171875, -50.89183044433594, -49.210723876953125, -47.52961730957031, -45.848514556884766, -44.16740798950195, -42.48630142211914, -40.80519485473633, -39.124088287353516, -37.4429817199707, -35.761878967285156, -34.080772399902344, -32.39966583251953, -30.71855926513672, -29.037452697753906, -27.356346130371094, -25.67523956298828, -23.99413299560547, -22.31302833557129, -20.631921768188477, -18.950809478759766, -17.269702911376953, -15.58859634399414, -13.907490730285645, -12.226384162902832, -10.54527759552002, -8.864171981811523, -7.183065414428711, -5.501958847045898, -3.820852518081665, -2.1397461891174316, -0.45864009857177734, 1.2224664688110352, 2.9035730361938477, 4.584678649902344, 6.265785217285156, 7.946891784667969, 9.627998352050781, 11.309104919433594, 12.99021053314209, 14.671317100524902, 16.35242462158203, 18.03352928161621, 19.714635848999023, 21.395742416381836, 23.07684898376465, 24.75795555114746, 26.43906021118164, 28.120166778564453, 29.801273345947266, 31.482379913330078, 33.16348648071289, 34.8445930480957]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 0.0, 1.0, 4.0, 3.0, 7.0, 2.0, 9.0, 10.0, 7.0, 8.0, 8.0, 8.0, 17.0, 15.0, 21.0, 18.0, 24.0, 20.0, 29.0, 38.0, 36.0, 36.0, 57.0, 78.0, 79.0, 82.0, 51.0, 27.0, 34.0, 31.0, 36.0, 22.0, 22.0, 21.0, 16.0, 17.0, 19.0, 11.0, 16.0, 14.0, 9.0, 7.0, 6.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.586380004882812, -19.02099609375, -18.455612182617188, -17.890228271484375, -17.324844360351562, -16.75946044921875, -16.194076538085938, -15.628693580627441, -15.063309669494629, -14.497925758361816, -13.932541847229004, -13.367157936096191, -12.801774978637695, -12.236391067504883, -11.67100715637207, -11.105623245239258, -10.540239334106445, -9.974855422973633, -9.40947151184082, -8.844087600708008, -8.278703689575195, -7.713320255279541, -7.147936820983887, -6.582552909851074, -6.017168998718262, -5.451785087585449, -4.886401176452637, -4.321017742156982, -3.75563383102417, -3.1902499198913574, -2.624866247177124, -2.0594825744628906, -1.4940986633300781, -0.9287148714065552, -0.3633310794830322, 0.20205271244049072, 0.7674365043640137, 1.3328204154968262, 1.8982040882110596, 2.463587760925293, 3.0289716720581055, 3.594355583190918, 4.1597394943237305, 4.725122928619385, 5.290506839752197, 5.85589075088501, 6.421274185180664, 6.986658096313477, 7.552042007446289, 8.117425918579102, 8.682809829711914, 9.248193740844727, 9.813577651977539, 10.378961563110352, 10.944344520568848, 11.50972843170166, 12.075112342834473, 12.640496253967285, 13.205880165100098, 13.77126407623291, 14.336647033691406, 14.902030944824219, 15.467414855957031, 16.032798767089844, 16.598182678222656]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 3.0, 7.0, 9.0, 12.0, 30.0, 24.0, 37.0, 74.0, 115.0, 118.0, 226.0, 344.0, 550.0, 967.0, 1677.0, 2992.0, 5797.0, 12573.0, 32298.0, 100127.0, 379982.0, 1376744.0, 1623772.0, 473419.0, 119078.0, 35896.0, 13466.0, 6291.0, 3196.0, 1721.0, 1028.0, 617.0, 393.0, 228.0, 151.0, 105.0, 68.0, 49.0, 32.0, 21.0, 17.0, 9.0, 11.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.427734375, -1.3832244873046875, -1.338714599609375, -1.2942047119140625, -1.24969482421875, -1.2051849365234375, -1.160675048828125, -1.1161651611328125, -1.0716552734375, -1.0271453857421875, -0.982635498046875, -0.9381256103515625, -0.89361572265625, -0.8491058349609375, -0.804595947265625, -0.7600860595703125, -0.715576171875, -0.6710662841796875, -0.626556396484375, -0.5820465087890625, -0.53753662109375, -0.4930267333984375, -0.448516845703125, -0.4040069580078125, -0.3594970703125, -0.3149871826171875, -0.270477294921875, -0.2259674072265625, -0.18145751953125, -0.1369476318359375, -0.092437744140625, -0.0479278564453125, -0.00341796875, 0.0410919189453125, 0.085601806640625, 0.1301116943359375, 0.17462158203125, 0.2191314697265625, 0.263641357421875, 0.3081512451171875, 0.3526611328125, 0.3971710205078125, 0.441680908203125, 0.4861907958984375, 0.53070068359375, 0.5752105712890625, 0.619720458984375, 0.6642303466796875, 0.708740234375, 0.7532501220703125, 0.797760009765625, 0.8422698974609375, 0.88677978515625, 0.9312896728515625, 0.975799560546875, 1.0203094482421875, 1.0648193359375, 1.1093292236328125, 1.153839111328125, 1.1983489990234375, 1.24285888671875, 1.2873687744140625, 1.331878662109375, 1.3763885498046875, 1.4208984375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 6.0, 3.0, 6.0, 7.0, 6.0, 7.0, 13.0, 17.0, 17.0, 26.0, 21.0, 27.0, 23.0, 36.0, 48.0, 35.0, 50.0, 50.0, 48.0, 44.0, 55.0, 45.0, 31.0, 46.0, 34.0, 32.0, 51.0, 38.0, 20.0, 23.0, 27.0, 20.0, 17.0, 18.0, 11.0, 9.0, 6.0, 8.0, 4.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.265625, -1.2212066650390625, -1.176788330078125, -1.1323699951171875, -1.08795166015625, -1.0435333251953125, -0.999114990234375, -0.9546966552734375, -0.9102783203125, -0.8658599853515625, -0.821441650390625, -0.7770233154296875, -0.73260498046875, -0.6881866455078125, -0.643768310546875, -0.5993499755859375, -0.554931640625, -0.5105133056640625, -0.466094970703125, -0.4216766357421875, -0.37725830078125, -0.3328399658203125, -0.288421630859375, -0.2440032958984375, -0.1995849609375, -0.1551666259765625, -0.110748291015625, -0.0663299560546875, -0.02191162109375, 0.0225067138671875, 0.066925048828125, 0.1113433837890625, 0.15576171875, 0.2001800537109375, 0.244598388671875, 0.2890167236328125, 0.33343505859375, 0.3778533935546875, 0.422271728515625, 0.4666900634765625, 0.5111083984375, 0.5555267333984375, 0.599945068359375, 0.6443634033203125, 0.68878173828125, 0.7332000732421875, 0.777618408203125, 0.8220367431640625, 0.866455078125, 0.9108734130859375, 0.955291748046875, 0.9997100830078125, 1.04412841796875, 1.0885467529296875, 1.132965087890625, 1.1773834228515625, 1.2218017578125, 1.2662200927734375, 1.310638427734375, 1.3550567626953125, 1.39947509765625, 1.4438934326171875, 1.488311767578125, 1.5327301025390625, 1.5771484375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 10.0, 8.0, 9.0, 10.0, 13.0, 23.0, 42.0, 62.0, 99.0, 156.0, 307.0, 633.0, 1810.0, 6584.0, 43980.0, 1290650.0, 2766638.0, 70142.0, 9154.0, 2260.0, 806.0, 340.0, 211.0, 105.0, 70.0, 39.0, 35.0, 20.0, 21.0, 10.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.171875, -4.03326416015625, -3.8946533203125, -3.75604248046875, -3.617431640625, -3.47882080078125, -3.3402099609375, -3.20159912109375, -3.06298828125, -2.92437744140625, -2.7857666015625, -2.64715576171875, -2.508544921875, -2.36993408203125, -2.2313232421875, -2.09271240234375, -1.9541015625, -1.81549072265625, -1.6768798828125, -1.53826904296875, -1.399658203125, -1.26104736328125, -1.1224365234375, -0.98382568359375, -0.84521484375, -0.70660400390625, -0.5679931640625, -0.42938232421875, -0.290771484375, -0.15216064453125, -0.0135498046875, 0.12506103515625, 0.263671875, 0.40228271484375, 0.5408935546875, 0.67950439453125, 0.818115234375, 0.95672607421875, 1.0953369140625, 1.23394775390625, 1.37255859375, 1.51116943359375, 1.6497802734375, 1.78839111328125, 1.927001953125, 2.06561279296875, 2.2042236328125, 2.34283447265625, 2.4814453125, 2.62005615234375, 2.7586669921875, 2.89727783203125, 3.035888671875, 3.17449951171875, 3.3131103515625, 3.45172119140625, 3.59033203125, 3.72894287109375, 3.8675537109375, 4.00616455078125, 4.144775390625, 4.28338623046875, 4.4219970703125, 4.56060791015625, 4.69921875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 8.0, 9.0, 8.0, 17.0, 18.0, 28.0, 34.0, 43.0, 72.0, 91.0, 143.0, 244.0, 384.0, 490.0, 658.0, 587.0, 425.0, 252.0, 187.0, 92.0, 72.0, 51.0, 42.0, 28.0, 21.0, 15.0, 12.0, 9.0, 8.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.904296875, -2.80645751953125, -2.7086181640625, -2.61077880859375, -2.512939453125, -2.41510009765625, -2.3172607421875, -2.21942138671875, -2.12158203125, -2.02374267578125, -1.9259033203125, -1.82806396484375, -1.730224609375, -1.63238525390625, -1.5345458984375, -1.43670654296875, -1.3388671875, -1.24102783203125, -1.1431884765625, -1.04534912109375, -0.947509765625, -0.84967041015625, -0.7518310546875, -0.65399169921875, -0.55615234375, -0.45831298828125, -0.3604736328125, -0.26263427734375, -0.164794921875, -0.06695556640625, 0.0308837890625, 0.12872314453125, 0.2265625, 0.32440185546875, 0.4222412109375, 0.52008056640625, 0.617919921875, 0.71575927734375, 0.8135986328125, 0.91143798828125, 1.00927734375, 1.10711669921875, 1.2049560546875, 1.30279541015625, 1.400634765625, 1.49847412109375, 1.5963134765625, 1.69415283203125, 1.7919921875, 1.88983154296875, 1.9876708984375, 2.08551025390625, 2.183349609375, 2.28118896484375, 2.3790283203125, 2.47686767578125, 2.57470703125, 2.67254638671875, 2.7703857421875, 2.86822509765625, 2.966064453125, 3.06390380859375, 3.1617431640625, 3.25958251953125, 3.357421875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 10.0, 7.0, 23.0, 41.0, 78.0, 166.0, 235.0, 189.0, 121.0, 68.0, 31.0, 12.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.62327003479004, -25.504671096801758, -24.386072158813477, -23.267473220825195, -22.148874282836914, -21.030275344848633, -19.91167449951172, -18.793075561523438, -17.674476623535156, -16.555877685546875, -15.437278747558594, -14.318679809570312, -13.200080871582031, -12.08148193359375, -10.962882041931152, -9.844283103942871, -8.725685119628906, -7.607086181640625, -6.488487243652344, -5.369887828826904, -4.251288890838623, -3.132689952850342, -2.0140905380249023, -0.8954916000366211, 0.22310733795166016, 1.341706395149231, 2.4603054523468018, 3.578904628753662, 4.697503566741943, 5.816102504730225, 6.934701919555664, 8.053300857543945, 9.171897888183594, 10.290496826171875, 11.409095764160156, 12.527694702148438, 13.646293640136719, 14.764892578125, 15.883492469787598, 17.002090454101562, 18.120689392089844, 19.239288330078125, 20.357887268066406, 21.476486206054688, 22.59508514404297, 23.71368408203125, 24.83228302001953, 25.950881958007812, 27.069482803344727, 28.188081741333008, 29.30668067932129, 30.42527961730957, 31.54387855529785, 32.662479400634766, 33.78107833862305, 34.89967727661133, 36.01827621459961, 37.13687515258789, 38.25547409057617, 39.37407302856445, 40.492671966552734, 41.611270904541016, 42.7298698425293, 43.84846878051758, 44.96706771850586]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 4.0, 2.0, 3.0, 8.0, 7.0, 14.0, 16.0, 14.0, 19.0, 24.0, 25.0, 26.0, 27.0, 31.0, 49.0, 56.0, 51.0, 55.0, 58.0, 63.0, 68.0, 57.0, 48.0, 40.0, 40.0, 33.0, 33.0, 30.0, 24.0, 15.0, 18.0, 10.0, 7.0, 8.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.758098602294922, -17.23614501953125, -16.71419334411621, -16.192241668701172, -15.6702880859375, -15.148335456848145, -14.626382827758789, -14.104430198669434, -13.582477569580078, -13.060524940490723, -12.538572311401367, -12.016619682312012, -11.494667053222656, -10.9727144241333, -10.450761795043945, -9.92880916595459, -9.406856536865234, -8.884903907775879, -8.362951278686523, -7.840998649597168, -7.3190460205078125, -6.797093391418457, -6.275140762329102, -5.753188133239746, -5.231235504150391, -4.709282875061035, -4.18733024597168, -3.665377616882324, -3.1434249877929688, -2.6214723587036133, -2.099519729614258, -1.5775671005249023, -1.0556135177612305, -0.533660888671875, -0.011708259582519531, 0.5102443695068359, 1.0321969985961914, 1.5541496276855469, 2.0761022567749023, 2.598054885864258, 3.1200075149536133, 3.6419601440429688, 4.163912773132324, 4.68586540222168, 5.207818031311035, 5.729770660400391, 6.251723289489746, 6.773675918579102, 7.295628547668457, 7.8175811767578125, 8.339533805847168, 8.861486434936523, 9.383439064025879, 9.905391693115234, 10.42734432220459, 10.949296951293945, 11.4712495803833, 11.993202209472656, 12.515154838562012, 13.037107467651367, 13.559060096740723, 14.081012725830078, 14.602965354919434, 15.124917984008789, 15.646870613098145]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 13.0, 23.0, 37.0, 42.0, 87.0, 106.0, 207.0, 322.0, 544.0, 954.0, 1706.0, 3124.0, 6114.0, 12372.0, 26622.0, 61524.0, 152858.0, 336855.0, 260089.0, 103394.0, 43077.0, 19143.0, 9007.0, 4582.0, 2453.0, 1380.0, 789.0, 436.0, 275.0, 156.0, 91.0, 63.0, 41.0, 27.0, 16.0, 10.0, 8.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7255859375, -1.6634979248046875, -1.601409912109375, -1.5393218994140625, -1.47723388671875, -1.4151458740234375, -1.353057861328125, -1.2909698486328125, -1.2288818359375, -1.1667938232421875, -1.104705810546875, -1.0426177978515625, -0.98052978515625, -0.9184417724609375, -0.856353759765625, -0.7942657470703125, -0.732177734375, -0.6700897216796875, -0.608001708984375, -0.5459136962890625, -0.48382568359375, -0.4217376708984375, -0.359649658203125, -0.2975616455078125, -0.2354736328125, -0.1733856201171875, -0.111297607421875, -0.0492095947265625, 0.01287841796875, 0.0749664306640625, 0.137054443359375, 0.1991424560546875, 0.26123046875, 0.3233184814453125, 0.385406494140625, 0.4474945068359375, 0.50958251953125, 0.5716705322265625, 0.633758544921875, 0.6958465576171875, 0.7579345703125, 0.8200225830078125, 0.882110595703125, 0.9441986083984375, 1.00628662109375, 1.0683746337890625, 1.130462646484375, 1.1925506591796875, 1.254638671875, 1.3167266845703125, 1.378814697265625, 1.4409027099609375, 1.50299072265625, 1.5650787353515625, 1.627166748046875, 1.6892547607421875, 1.7513427734375, 1.8134307861328125, 1.875518798828125, 1.9376068115234375, 1.99969482421875, 2.0617828369140625, 2.123870849609375, 2.1859588623046875, 2.248046875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 9.0, 7.0, 11.0, 6.0, 12.0, 16.0, 24.0, 22.0, 25.0, 25.0, 30.0, 34.0, 41.0, 44.0, 46.0, 59.0, 64.0, 53.0, 47.0, 58.0, 48.0, 41.0, 38.0, 32.0, 35.0, 29.0, 22.0, 27.0, 15.0, 19.0, 11.0, 9.0, 8.0, 7.0, 2.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5947265625, -1.545379638671875, -1.49603271484375, -1.446685791015625, -1.3973388671875, -1.347991943359375, -1.29864501953125, -1.249298095703125, -1.199951171875, -1.150604248046875, -1.10125732421875, -1.051910400390625, -1.0025634765625, -0.953216552734375, -0.90386962890625, -0.854522705078125, -0.80517578125, -0.755828857421875, -0.70648193359375, -0.657135009765625, -0.6077880859375, -0.558441162109375, -0.50909423828125, -0.459747314453125, -0.410400390625, -0.361053466796875, -0.31170654296875, -0.262359619140625, -0.2130126953125, -0.163665771484375, -0.11431884765625, -0.064971923828125, -0.015625, 0.033721923828125, 0.08306884765625, 0.132415771484375, 0.1817626953125, 0.231109619140625, 0.28045654296875, 0.329803466796875, 0.379150390625, 0.428497314453125, 0.47784423828125, 0.527191162109375, 0.5765380859375, 0.625885009765625, 0.67523193359375, 0.724578857421875, 0.77392578125, 0.823272705078125, 0.87261962890625, 0.921966552734375, 0.9713134765625, 1.020660400390625, 1.07000732421875, 1.119354248046875, 1.168701171875, 1.218048095703125, 1.26739501953125, 1.316741943359375, 1.3660888671875, 1.415435791015625, 1.46478271484375, 1.514129638671875, 1.5634765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 4.0, 13.0, 15.0, 13.0, 22.0, 33.0, 40.0, 67.0, 91.0, 136.0, 157.0, 232.0, 386.0, 594.0, 1037.0, 2234.0, 5914.0, 27791.0, 259635.0, 691972.0, 44079.0, 8200.0, 2670.0, 1226.0, 659.0, 445.0, 273.0, 175.0, 136.0, 84.0, 66.0, 49.0, 32.0, 18.0, 16.0, 10.0, 6.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5, -4.3505859375, -4.201171875, -4.0517578125, -3.90234375, -3.7529296875, -3.603515625, -3.4541015625, -3.3046875, -3.1552734375, -3.005859375, -2.8564453125, -2.70703125, -2.5576171875, -2.408203125, -2.2587890625, -2.109375, -1.9599609375, -1.810546875, -1.6611328125, -1.51171875, -1.3623046875, -1.212890625, -1.0634765625, -0.9140625, -0.7646484375, -0.615234375, -0.4658203125, -0.31640625, -0.1669921875, -0.017578125, 0.1318359375, 0.28125, 0.4306640625, 0.580078125, 0.7294921875, 0.87890625, 1.0283203125, 1.177734375, 1.3271484375, 1.4765625, 1.6259765625, 1.775390625, 1.9248046875, 2.07421875, 2.2236328125, 2.373046875, 2.5224609375, 2.671875, 2.8212890625, 2.970703125, 3.1201171875, 3.26953125, 3.4189453125, 3.568359375, 3.7177734375, 3.8671875, 4.0166015625, 4.166015625, 4.3154296875, 4.46484375, 4.6142578125, 4.763671875, 4.9130859375, 5.0625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 7.0, 13.0, 4.0, 12.0, 10.0, 15.0, 11.0, 23.0, 22.0, 25.0, 37.0, 42.0, 38.0, 31.0, 51.0, 43.0, 52.0, 48.0, 51.0, 43.0, 58.0, 58.0, 39.0, 44.0, 35.0, 33.0, 26.0, 22.0, 15.0, 16.0, 12.0, 12.0, 13.0, 5.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.453125, -5.2763671875, -5.099609375, -4.9228515625, -4.74609375, -4.5693359375, -4.392578125, -4.2158203125, -4.0390625, -3.8623046875, -3.685546875, -3.5087890625, -3.33203125, -3.1552734375, -2.978515625, -2.8017578125, -2.625, -2.4482421875, -2.271484375, -2.0947265625, -1.91796875, -1.7412109375, -1.564453125, -1.3876953125, -1.2109375, -1.0341796875, -0.857421875, -0.6806640625, -0.50390625, -0.3271484375, -0.150390625, 0.0263671875, 0.203125, 0.3798828125, 0.556640625, 0.7333984375, 0.91015625, 1.0869140625, 1.263671875, 1.4404296875, 1.6171875, 1.7939453125, 1.970703125, 2.1474609375, 2.32421875, 2.5009765625, 2.677734375, 2.8544921875, 3.03125, 3.2080078125, 3.384765625, 3.5615234375, 3.73828125, 3.9150390625, 4.091796875, 4.2685546875, 4.4453125, 4.6220703125, 4.798828125, 4.9755859375, 5.15234375, 5.3291015625, 5.505859375, 5.6826171875, 5.859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 14.0, 8.0, 14.0, 13.0, 16.0, 24.0, 25.0, 36.0, 49.0, 63.0, 89.0, 137.0, 217.0, 360.0, 620.0, 1129.0, 2405.0, 5864.0, 18333.0, 100814.0, 803441.0, 87452.0, 17090.0, 5459.0, 2211.0, 1070.0, 571.0, 336.0, 198.0, 136.0, 89.0, 67.0, 43.0, 26.0, 19.0, 22.0, 14.0, 10.0, 9.0, 12.0, 8.0, 11.0, 4.0, 6.0, 2.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.9658203125, -0.9351272583007812, -0.9044342041015625, -0.8737411499023438, -0.843048095703125, -0.8123550415039062, -0.7816619873046875, -0.7509689331054688, -0.72027587890625, -0.6895828247070312, -0.6588897705078125, -0.6281967163085938, -0.597503662109375, -0.5668106079101562, -0.5361175537109375, -0.5054244995117188, -0.4747314453125, -0.44403839111328125, -0.4133453369140625, -0.38265228271484375, -0.351959228515625, -0.32126617431640625, -0.2905731201171875, -0.25988006591796875, -0.22918701171875, -0.19849395751953125, -0.1678009033203125, -0.13710784912109375, -0.106414794921875, -0.07572174072265625, -0.0450286865234375, -0.01433563232421875, 0.016357421875, 0.04705047607421875, 0.0777435302734375, 0.10843658447265625, 0.139129638671875, 0.16982269287109375, 0.2005157470703125, 0.23120880126953125, 0.26190185546875, 0.29259490966796875, 0.3232879638671875, 0.35398101806640625, 0.384674072265625, 0.41536712646484375, 0.4460601806640625, 0.47675323486328125, 0.5074462890625, 0.5381393432617188, 0.5688323974609375, 0.5995254516601562, 0.630218505859375, 0.6609115600585938, 0.6916046142578125, 0.7222976684570312, 0.75299072265625, 0.7836837768554688, 0.8143768310546875, 0.8450698852539062, 0.875762939453125, 0.9064559936523438, 0.9371490478515625, 0.9678421020507812, 0.99853515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 6.0, 1.0, 10.0, 6.0, 14.0, 11.0, 21.0, 33.0, 65.0, 99.0, 185.0, 234.0, 119.0, 70.0, 40.0, 21.0, 18.0, 12.0, 5.0, 6.0, 8.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005102157592773438, -0.0004960782825946808, -0.0004819408059120178, -0.00046780332922935486, -0.0004536658525466919, -0.00043952837586402893, -0.00042539089918136597, -0.000411253422498703, -0.00039711594581604004, -0.0003829784691333771, -0.0003688409924507141, -0.00035470351576805115, -0.0003405660390853882, -0.0003264285624027252, -0.00031229108572006226, -0.0002981536090373993, -0.00028401613235473633, -0.00026987865567207336, -0.0002557411789894104, -0.00024160370230674744, -0.00022746622562408447, -0.0002133287489414215, -0.00019919127225875854, -0.00018505379557609558, -0.00017091631889343262, -0.00015677884221076965, -0.0001426413655281067, -0.00012850388884544373, -0.00011436641216278076, -0.0001002289354801178, -8.609145879745483e-05, -7.195398211479187e-05, -5.7816505432128906e-05, -4.367902874946594e-05, -2.954155206680298e-05, -1.5404075384140015e-05, -1.2665987014770508e-06, 1.2870877981185913e-05, 2.7008354663848877e-05, 4.114583134651184e-05, 5.5283308029174805e-05, 6.942078471183777e-05, 8.355826139450073e-05, 9.76957380771637e-05, 0.00011183321475982666, 0.00012597069144248962, 0.0001401081681251526, 0.00015424564480781555, 0.00016838312149047852, 0.00018252059817314148, 0.00019665807485580444, 0.0002107955515384674, 0.00022493302822113037, 0.00023907050490379333, 0.0002532079815864563, 0.00026734545826911926, 0.0002814829349517822, 0.0002956204116344452, 0.00030975788831710815, 0.0003238953649997711, 0.0003380328416824341, 0.00035217031836509705, 0.00036630779504776, 0.000380445271730423, 0.00039458274841308594]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 6.0, 13.0, 11.0, 8.0, 18.0, 28.0, 36.0, 50.0, 78.0, 128.0, 207.0, 395.0, 624.0, 1321.0, 2905.0, 8016.0, 30065.0, 205953.0, 718225.0, 59230.0, 13203.0, 4304.0, 1711.0, 857.0, 457.0, 231.0, 169.0, 98.0, 75.0, 36.0, 29.0, 22.0, 8.0, 13.0, 10.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.9812469482421875, -0.949798583984375, -0.9183502197265625, -0.88690185546875, -0.8554534912109375, -0.824005126953125, -0.7925567626953125, -0.7611083984375, -0.7296600341796875, -0.698211669921875, -0.6667633056640625, -0.63531494140625, -0.6038665771484375, -0.572418212890625, -0.5409698486328125, -0.509521484375, -0.4780731201171875, -0.446624755859375, -0.4151763916015625, -0.38372802734375, -0.3522796630859375, -0.320831298828125, -0.2893829345703125, -0.2579345703125, -0.2264862060546875, -0.195037841796875, -0.1635894775390625, -0.13214111328125, -0.1006927490234375, -0.069244384765625, -0.0377960205078125, -0.00634765625, 0.0251007080078125, 0.056549072265625, 0.0879974365234375, 0.11944580078125, 0.1508941650390625, 0.182342529296875, 0.2137908935546875, 0.2452392578125, 0.2766876220703125, 0.308135986328125, 0.3395843505859375, 0.37103271484375, 0.4024810791015625, 0.433929443359375, 0.4653778076171875, 0.496826171875, 0.5282745361328125, 0.559722900390625, 0.5911712646484375, 0.62261962890625, 0.6540679931640625, 0.685516357421875, 0.7169647216796875, 0.7484130859375, 0.7798614501953125, 0.811309814453125, 0.8427581787109375, 0.87420654296875, 0.9056549072265625, 0.937103271484375, 0.9685516357421875, 1.0]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 14.0, 8.0, 8.0, 11.0, 18.0, 19.0, 27.0, 27.0, 33.0, 54.0, 71.0, 74.0, 87.0, 111.0, 98.0, 81.0, 42.0, 47.0, 30.0, 31.0, 18.0, 13.0, 13.0, 15.0, 14.0, 3.0, 5.0, 2.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.90673828125, -0.8785171508789062, -0.8502960205078125, -0.8220748901367188, -0.793853759765625, -0.7656326293945312, -0.7374114990234375, -0.7091903686523438, -0.68096923828125, -0.6527481079101562, -0.6245269775390625, -0.5963058471679688, -0.568084716796875, -0.5398635864257812, -0.5116424560546875, -0.48342132568359375, -0.4552001953125, -0.42697906494140625, -0.3987579345703125, -0.37053680419921875, -0.342315673828125, -0.31409454345703125, -0.2858734130859375, -0.25765228271484375, -0.22943115234375, -0.20121002197265625, -0.1729888916015625, -0.14476776123046875, -0.116546630859375, -0.08832550048828125, -0.0601043701171875, -0.03188323974609375, -0.003662109375, 0.02455902099609375, 0.0527801513671875, 0.08100128173828125, 0.109222412109375, 0.13744354248046875, 0.1656646728515625, 0.19388580322265625, 0.22210693359375, 0.25032806396484375, 0.2785491943359375, 0.30677032470703125, 0.334991455078125, 0.36321258544921875, 0.3914337158203125, 0.41965484619140625, 0.4478759765625, 0.47609710693359375, 0.5043182373046875, 0.5325393676757812, 0.560760498046875, 0.5889816284179688, 0.6172027587890625, 0.6454238891601562, 0.67364501953125, 0.7018661499023438, 0.7300872802734375, 0.7583084106445312, 0.786529541015625, 0.8147506713867188, 0.8429718017578125, 0.8711929321289062, 0.8994140625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 4.0, 6.0, 26.0, 66.0, 189.0, 484.0, 152.0, 42.0, 14.0, 10.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.89264678955078, -54.26520538330078, -52.63776397705078, -51.01032257080078, -49.38288116455078, -47.75543975830078, -46.12799835205078, -44.50055694580078, -42.87311553955078, -41.24567413330078, -39.61823272705078, -37.99079132080078, -36.36334991455078, -34.73590850830078, -33.10846710205078, -31.48102378845215, -29.853580474853516, -28.226139068603516, -26.598697662353516, -24.971256256103516, -23.343814849853516, -21.716373443603516, -20.088930130004883, -18.461488723754883, -16.834047317504883, -15.206605911254883, -13.579164505004883, -11.951722145080566, -10.324280738830566, -8.696839332580566, -7.06939697265625, -5.44195556640625, -3.81451416015625, -2.187072515487671, -0.5596308708190918, 1.0678110122680664, 2.6952524185180664, 4.322693824768066, 5.950136184692383, 7.577577590942383, 9.205018997192383, 10.832460403442383, 12.459901809692383, 14.0873441696167, 15.7147855758667, 17.342227935791016, 18.969669342041016, 20.597110748291016, 22.224552154541016, 23.851993560791016, 25.479434967041016, 27.106876373291016, 28.734317779541016, 30.361759185791016, 31.98920249938965, 33.61664581298828, 35.24408721923828, 36.87152862548828, 38.49897003173828, 40.12641143798828, 41.75385284423828, 43.38129425048828, 45.00873565673828, 46.63617706298828, 48.26361846923828]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 4.0, 3.0, 12.0, 17.0, 14.0, 18.0, 14.0, 19.0, 14.0, 24.0, 20.0, 30.0, 29.0, 25.0, 44.0, 71.0, 129.0, 140.0, 65.0, 40.0, 28.0, 28.0, 29.0, 29.0, 25.0, 19.0, 21.0, 12.0, 13.0, 13.0, 11.0, 8.0, 2.0, 5.0, 5.0, 10.0, 0.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.746797561645508, -22.081905364990234, -21.417015075683594, -20.75212287902832, -20.087230682373047, -19.422338485717773, -18.757448196411133, -18.09255599975586, -17.427663803100586, -16.762771606445312, -16.097881317138672, -15.432989120483398, -14.768096923828125, -14.103205680847168, -13.438314437866211, -12.773422241210938, -12.10853099822998, -11.443639755249023, -10.77874755859375, -10.113856315612793, -9.44896411895752, -8.784072875976562, -8.119180679321289, -7.454289436340332, -6.789397716522217, -6.124505996704102, -5.459614276885986, -4.794722557067871, -4.129831314086914, -3.4649393558502197, -2.8000478744506836, -2.1351561546325684, -1.4702644348144531, -0.8053727746009827, -0.1404811143875122, 0.5244104862213135, 1.1893022060394287, 1.854193925857544, 2.51908540725708, 3.1839771270751953, 3.8488688468933105, 4.513760566711426, 5.178652286529541, 5.843544006347656, 6.508435249328613, 7.173327445983887, 7.838218688964844, 8.503110885620117, 9.168002128601074, 9.832893371582031, 10.497785568237305, 11.162676811218262, 11.827569007873535, 12.492460250854492, 13.157352447509766, 13.822243690490723, 14.48713493347168, 15.152026176452637, 15.81691837310791, 16.481809616088867, 17.14670181274414, 17.811594009399414, 18.476484298706055, 19.141376495361328, 19.8062686920166]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 9.0, 8.0, 14.0, 15.0, 31.0, 54.0, 66.0, 122.0, 184.0, 288.0, 413.0, 698.0, 1301.0, 2582.0, 5823.0, 17117.0, 71135.0, 431678.0, 1988048.0, 1366930.0, 244886.0, 42257.0, 11644.0, 4317.0, 2004.0, 979.0, 585.0, 390.0, 234.0, 130.0, 102.0, 77.0, 51.0, 31.0, 26.0, 14.0, 13.0, 7.0, 10.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.404296875, -2.32879638671875, -2.2532958984375, -2.17779541015625, -2.102294921875, -2.02679443359375, -1.9512939453125, -1.87579345703125, -1.80029296875, -1.72479248046875, -1.6492919921875, -1.57379150390625, -1.498291015625, -1.42279052734375, -1.3472900390625, -1.27178955078125, -1.1962890625, -1.12078857421875, -1.0452880859375, -0.96978759765625, -0.894287109375, -0.81878662109375, -0.7432861328125, -0.66778564453125, -0.59228515625, -0.51678466796875, -0.4412841796875, -0.36578369140625, -0.290283203125, -0.21478271484375, -0.1392822265625, -0.06378173828125, 0.01171875, 0.08721923828125, 0.1627197265625, 0.23822021484375, 0.313720703125, 0.38922119140625, 0.4647216796875, 0.54022216796875, 0.61572265625, 0.69122314453125, 0.7667236328125, 0.84222412109375, 0.917724609375, 0.99322509765625, 1.0687255859375, 1.14422607421875, 1.2197265625, 1.29522705078125, 1.3707275390625, 1.44622802734375, 1.521728515625, 1.59722900390625, 1.6727294921875, 1.74822998046875, 1.82373046875, 1.89923095703125, 1.9747314453125, 2.05023193359375, 2.125732421875, 2.20123291015625, 2.2767333984375, 2.35223388671875, 2.427734375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 2.0, 8.0, 15.0, 7.0, 21.0, 9.0, 21.0, 20.0, 31.0, 24.0, 31.0, 35.0, 37.0, 39.0, 58.0, 37.0, 52.0, 52.0, 56.0, 57.0, 51.0, 55.0, 41.0, 35.0, 22.0, 41.0, 24.0, 24.0, 15.0, 10.0, 17.0, 17.0, 9.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.494140625, -1.446868896484375, -1.39959716796875, -1.352325439453125, -1.3050537109375, -1.257781982421875, -1.21051025390625, -1.163238525390625, -1.115966796875, -1.068695068359375, -1.02142333984375, -0.974151611328125, -0.9268798828125, -0.879608154296875, -0.83233642578125, -0.785064697265625, -0.73779296875, -0.690521240234375, -0.64324951171875, -0.595977783203125, -0.5487060546875, -0.501434326171875, -0.45416259765625, -0.406890869140625, -0.359619140625, -0.312347412109375, -0.26507568359375, -0.217803955078125, -0.1705322265625, -0.123260498046875, -0.07598876953125, -0.028717041015625, 0.0185546875, 0.065826416015625, 0.11309814453125, 0.160369873046875, 0.2076416015625, 0.254913330078125, 0.30218505859375, 0.349456787109375, 0.396728515625, 0.444000244140625, 0.49127197265625, 0.538543701171875, 0.5858154296875, 0.633087158203125, 0.68035888671875, 0.727630615234375, 0.77490234375, 0.822174072265625, 0.86944580078125, 0.916717529296875, 0.9639892578125, 1.011260986328125, 1.05853271484375, 1.105804443359375, 1.153076171875, 1.200347900390625, 1.24761962890625, 1.294891357421875, 1.3421630859375, 1.389434814453125, 1.43670654296875, 1.483978271484375, 1.53125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 1.0, 5.0, 3.0, 8.0, 19.0, 27.0, 28.0, 54.0, 78.0, 136.0, 184.0, 248.0, 496.0, 891.0, 1831.0, 5546.0, 33326.0, 2261669.0, 1850124.0, 30638.0, 5081.0, 1783.0, 854.0, 458.0, 269.0, 170.0, 107.0, 80.0, 46.0, 22.0, 15.0, 30.0, 10.0, 10.0, 8.0, 7.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-7.50390625, -7.301025390625, -7.09814453125, -6.895263671875, -6.6923828125, -6.489501953125, -6.28662109375, -6.083740234375, -5.880859375, -5.677978515625, -5.47509765625, -5.272216796875, -5.0693359375, -4.866455078125, -4.66357421875, -4.460693359375, -4.2578125, -4.054931640625, -3.85205078125, -3.649169921875, -3.4462890625, -3.243408203125, -3.04052734375, -2.837646484375, -2.634765625, -2.431884765625, -2.22900390625, -2.026123046875, -1.8232421875, -1.620361328125, -1.41748046875, -1.214599609375, -1.01171875, -0.808837890625, -0.60595703125, -0.403076171875, -0.2001953125, 0.002685546875, 0.20556640625, 0.408447265625, 0.611328125, 0.814208984375, 1.01708984375, 1.219970703125, 1.4228515625, 1.625732421875, 1.82861328125, 2.031494140625, 2.234375, 2.437255859375, 2.64013671875, 2.843017578125, 3.0458984375, 3.248779296875, 3.45166015625, 3.654541015625, 3.857421875, 4.060302734375, 4.26318359375, 4.466064453125, 4.6689453125, 4.871826171875, 5.07470703125, 5.277587890625, 5.48046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 6.0, 9.0, 11.0, 30.0, 14.0, 28.0, 48.0, 52.0, 83.0, 127.0, 168.0, 290.0, 479.0, 652.0, 676.0, 473.0, 305.0, 181.0, 142.0, 98.0, 74.0, 35.0, 25.0, 22.0, 15.0, 9.0, 6.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1953125, -5.0474853515625, -4.899658203125, -4.7518310546875, -4.60400390625, -4.4561767578125, -4.308349609375, -4.1605224609375, -4.0126953125, -3.8648681640625, -3.717041015625, -3.5692138671875, -3.42138671875, -3.2735595703125, -3.125732421875, -2.9779052734375, -2.830078125, -2.6822509765625, -2.534423828125, -2.3865966796875, -2.23876953125, -2.0909423828125, -1.943115234375, -1.7952880859375, -1.6474609375, -1.4996337890625, -1.351806640625, -1.2039794921875, -1.05615234375, -0.9083251953125, -0.760498046875, -0.6126708984375, -0.46484375, -0.3170166015625, -0.169189453125, -0.0213623046875, 0.12646484375, 0.2742919921875, 0.422119140625, 0.5699462890625, 0.7177734375, 0.8656005859375, 1.013427734375, 1.1612548828125, 1.30908203125, 1.4569091796875, 1.604736328125, 1.7525634765625, 1.900390625, 2.0482177734375, 2.196044921875, 2.3438720703125, 2.49169921875, 2.6395263671875, 2.787353515625, 2.9351806640625, 3.0830078125, 3.2308349609375, 3.378662109375, 3.5264892578125, 3.67431640625, 3.8221435546875, 3.969970703125, 4.1177978515625, 4.265625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 4.0, 14.0, 13.0, 26.0, 50.0, 73.0, 158.0, 195.0, 179.0, 127.0, 61.0, 35.0, 15.0, 12.0, 10.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.82004165649414, -52.127037048339844, -50.43403244018555, -48.74102783203125, -47.04801940917969, -45.35501480102539, -43.662010192871094, -41.9690055847168, -40.2760009765625, -38.5829963684082, -36.889991760253906, -35.196983337402344, -33.50397872924805, -31.81097412109375, -30.117969512939453, -28.424964904785156, -26.731956481933594, -25.038951873779297, -23.345945358276367, -21.65294075012207, -19.95993423461914, -18.266929626464844, -16.573925018310547, -14.880919456481934, -13.18791389465332, -11.494908332824707, -9.801902770996094, -8.108898162841797, -6.415892601013184, -4.72288703918457, -3.0298824310302734, -1.3368768692016602, 0.35613250732421875, 2.049137830734253, 3.742143154144287, 5.435148239135742, 7.1281538009643555, 8.821159362792969, 10.514163970947266, 12.207169532775879, 13.900175094604492, 15.593180656433105, 17.28618621826172, 18.979190826416016, 20.672195434570312, 22.365201950073242, 24.05820655822754, 25.75121307373047, 27.444217681884766, 29.137222290039062, 30.830228805541992, 32.523231506347656, 34.21623992919922, 35.909244537353516, 37.60224914550781, 39.29525375366211, 40.988258361816406, 42.6812629699707, 44.374267578125, 46.06727600097656, 47.76028060913086, 49.453285217285156, 51.14628982543945, 52.83929443359375, 54.53230285644531]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 3.0, 5.0, 10.0, 10.0, 11.0, 14.0, 20.0, 23.0, 27.0, 25.0, 21.0, 22.0, 34.0, 31.0, 54.0, 43.0, 47.0, 56.0, 41.0, 51.0, 58.0, 56.0, 41.0, 41.0, 30.0, 27.0, 23.0, 23.0, 18.0, 29.0, 9.0, 13.0, 13.0, 12.0, 5.0, 7.0, 8.0, 5.0, 5.0, 5.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.02021026611328, -17.3231201171875, -16.626028060913086, -15.928937911987305, -15.231846809387207, -14.53475570678711, -13.837665557861328, -13.14057445526123, -12.443483352661133, -11.746392250061035, -11.049301147460938, -10.352210998535156, -9.655119895935059, -8.958028793334961, -8.26093864440918, -7.563847541809082, -6.866756439208984, -6.169665336608887, -5.472574710845947, -4.775484085083008, -4.07839298248291, -3.3813021183013916, -2.684211254119873, -1.9871206283569336, -1.290029525756836, -0.5929386615753174, 0.10415220260620117, 0.8012430667877197, 1.4983339309692383, 2.195424795150757, 2.8925156593322754, 3.589606285095215, 4.2866973876953125, 4.98378849029541, 5.68087911605835, 6.377969741821289, 7.075060844421387, 7.772151947021484, 8.469242095947266, 9.166333198547363, 9.863424301147461, 10.560515403747559, 11.257606506347656, 11.954696655273438, 12.651787757873535, 13.348878860473633, 14.045969009399414, 14.743060111999512, 15.44015121459961, 16.13724136352539, 16.834333419799805, 17.531423568725586, 18.228515625, 18.92560577392578, 19.622695922851562, 20.319786071777344, 21.016878128051758, 21.71396827697754, 22.411060333251953, 23.108150482177734, 23.805240631103516, 24.50233268737793, 25.19942283630371, 25.896514892578125, 26.593605041503906]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 12.0, 17.0, 27.0, 27.0, 50.0, 78.0, 133.0, 203.0, 311.0, 548.0, 944.0, 1706.0, 3281.0, 6772.0, 15385.0, 39900.0, 124656.0, 469070.0, 264949.0, 73905.0, 25455.0, 10606.0, 4853.0, 2465.0, 1266.0, 753.0, 432.0, 256.0, 170.0, 104.0, 67.0, 43.0, 32.0, 21.0, 21.0, 8.0, 6.0, 3.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9609375, -1.890350341796875, -1.81976318359375, -1.749176025390625, -1.6785888671875, -1.608001708984375, -1.53741455078125, -1.466827392578125, -1.396240234375, -1.325653076171875, -1.25506591796875, -1.184478759765625, -1.1138916015625, -1.043304443359375, -0.97271728515625, -0.902130126953125, -0.83154296875, -0.760955810546875, -0.69036865234375, -0.619781494140625, -0.5491943359375, -0.478607177734375, -0.40802001953125, -0.337432861328125, -0.266845703125, -0.196258544921875, -0.12567138671875, -0.055084228515625, 0.0155029296875, 0.086090087890625, 0.15667724609375, 0.227264404296875, 0.2978515625, 0.368438720703125, 0.43902587890625, 0.509613037109375, 0.5802001953125, 0.650787353515625, 0.72137451171875, 0.791961669921875, 0.862548828125, 0.933135986328125, 1.00372314453125, 1.074310302734375, 1.1448974609375, 1.215484619140625, 1.28607177734375, 1.356658935546875, 1.42724609375, 1.497833251953125, 1.56842041015625, 1.639007568359375, 1.7095947265625, 1.780181884765625, 1.85076904296875, 1.921356201171875, 1.991943359375, 2.062530517578125, 2.13311767578125, 2.203704833984375, 2.2742919921875, 2.344879150390625, 2.41546630859375, 2.486053466796875, 2.556640625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 11.0, 12.0, 15.0, 14.0, 22.0, 24.0, 34.0, 35.0, 35.0, 56.0, 58.0, 53.0, 66.0, 66.0, 60.0, 71.0, 54.0, 65.0, 41.0, 38.0, 34.0, 28.0, 26.0, 22.0, 15.0, 17.0, 10.0, 7.0, 9.0, 6.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.94140625, -1.87445068359375, -1.8074951171875, -1.74053955078125, -1.673583984375, -1.60662841796875, -1.5396728515625, -1.47271728515625, -1.40576171875, -1.33880615234375, -1.2718505859375, -1.20489501953125, -1.137939453125, -1.07098388671875, -1.0040283203125, -0.93707275390625, -0.8701171875, -0.80316162109375, -0.7362060546875, -0.66925048828125, -0.602294921875, -0.53533935546875, -0.4683837890625, -0.40142822265625, -0.33447265625, -0.26751708984375, -0.2005615234375, -0.13360595703125, -0.066650390625, 0.00030517578125, 0.0672607421875, 0.13421630859375, 0.201171875, 0.26812744140625, 0.3350830078125, 0.40203857421875, 0.468994140625, 0.53594970703125, 0.6029052734375, 0.66986083984375, 0.73681640625, 0.80377197265625, 0.8707275390625, 0.93768310546875, 1.004638671875, 1.07159423828125, 1.1385498046875, 1.20550537109375, 1.2724609375, 1.33941650390625, 1.4063720703125, 1.47332763671875, 1.540283203125, 1.60723876953125, 1.6741943359375, 1.74114990234375, 1.80810546875, 1.87506103515625, 1.9420166015625, 2.00897216796875, 2.075927734375, 2.14288330078125, 2.2098388671875, 2.27679443359375, 2.34375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 0.0, 3.0, 4.0, 5.0, 12.0, 7.0, 18.0, 21.0, 22.0, 30.0, 27.0, 48.0, 61.0, 100.0, 137.0, 272.0, 413.0, 940.0, 2727.0, 12085.0, 145577.0, 839007.0, 38117.0, 5751.0, 1583.0, 650.0, 356.0, 184.0, 114.0, 95.0, 53.0, 40.0, 27.0, 23.0, 11.0, 7.0, 6.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.697265625, -3.57904052734375, -3.4608154296875, -3.34259033203125, -3.224365234375, -3.10614013671875, -2.9879150390625, -2.86968994140625, -2.75146484375, -2.63323974609375, -2.5150146484375, -2.39678955078125, -2.278564453125, -2.16033935546875, -2.0421142578125, -1.92388916015625, -1.8056640625, -1.68743896484375, -1.5692138671875, -1.45098876953125, -1.332763671875, -1.21453857421875, -1.0963134765625, -0.97808837890625, -0.85986328125, -0.74163818359375, -0.6234130859375, -0.50518798828125, -0.386962890625, -0.26873779296875, -0.1505126953125, -0.03228759765625, 0.0859375, 0.20416259765625, 0.3223876953125, 0.44061279296875, 0.558837890625, 0.67706298828125, 0.7952880859375, 0.91351318359375, 1.03173828125, 1.14996337890625, 1.2681884765625, 1.38641357421875, 1.504638671875, 1.62286376953125, 1.7410888671875, 1.85931396484375, 1.9775390625, 2.09576416015625, 2.2139892578125, 2.33221435546875, 2.450439453125, 2.56866455078125, 2.6868896484375, 2.80511474609375, 2.92333984375, 3.04156494140625, 3.1597900390625, 3.27801513671875, 3.396240234375, 3.51446533203125, 3.6326904296875, 3.75091552734375, 3.869140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 6.0, 8.0, 8.0, 6.0, 5.0, 13.0, 13.0, 12.0, 18.0, 28.0, 31.0, 26.0, 35.0, 35.0, 45.0, 54.0, 84.0, 79.0, 80.0, 74.0, 67.0, 54.0, 35.0, 42.0, 22.0, 18.0, 14.0, 12.0, 12.0, 11.0, 11.0, 17.0, 5.0, 5.0, 0.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.03125, -7.8194580078125, -7.607666015625, -7.3958740234375, -7.18408203125, -6.9722900390625, -6.760498046875, -6.5487060546875, -6.3369140625, -6.1251220703125, -5.913330078125, -5.7015380859375, -5.48974609375, -5.2779541015625, -5.066162109375, -4.8543701171875, -4.642578125, -4.4307861328125, -4.218994140625, -4.0072021484375, -3.79541015625, -3.5836181640625, -3.371826171875, -3.1600341796875, -2.9482421875, -2.7364501953125, -2.524658203125, -2.3128662109375, -2.10107421875, -1.8892822265625, -1.677490234375, -1.4656982421875, -1.25390625, -1.0421142578125, -0.830322265625, -0.6185302734375, -0.40673828125, -0.1949462890625, 0.016845703125, 0.2286376953125, 0.4404296875, 0.6522216796875, 0.864013671875, 1.0758056640625, 1.28759765625, 1.4993896484375, 1.711181640625, 1.9229736328125, 2.134765625, 2.3465576171875, 2.558349609375, 2.7701416015625, 2.98193359375, 3.1937255859375, 3.405517578125, 3.6173095703125, 3.8291015625, 4.0408935546875, 4.252685546875, 4.4644775390625, 4.67626953125, 4.8880615234375, 5.099853515625, 5.3116455078125, 5.5234375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 7.0, 6.0, 13.0, 11.0, 13.0, 23.0, 20.0, 31.0, 42.0, 66.0, 92.0, 152.0, 340.0, 702.0, 1585.0, 4555.0, 18138.0, 149916.0, 828623.0, 32985.0, 7054.0, 2213.0, 930.0, 409.0, 227.0, 132.0, 67.0, 43.0, 24.0, 24.0, 28.0, 20.0, 13.0, 12.0, 6.0, 5.0, 3.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.59375, -0.5740737915039062, -0.5543975830078125, -0.5347213745117188, -0.515045166015625, -0.49536895751953125, -0.4756927490234375, -0.45601654052734375, -0.43634033203125, -0.41666412353515625, -0.3969879150390625, -0.37731170654296875, -0.357635498046875, -0.33795928955078125, -0.3182830810546875, -0.29860687255859375, -0.2789306640625, -0.25925445556640625, -0.2395782470703125, -0.21990203857421875, -0.200225830078125, -0.18054962158203125, -0.1608734130859375, -0.14119720458984375, -0.12152099609375, -0.10184478759765625, -0.0821685791015625, -0.06249237060546875, -0.042816162109375, -0.02313995361328125, -0.0034637451171875, 0.01621246337890625, 0.035888671875, 0.05556488037109375, 0.0752410888671875, 0.09491729736328125, 0.114593505859375, 0.13426971435546875, 0.1539459228515625, 0.17362213134765625, 0.19329833984375, 0.21297454833984375, 0.2326507568359375, 0.25232696533203125, 0.272003173828125, 0.29167938232421875, 0.3113555908203125, 0.33103179931640625, 0.3507080078125, 0.37038421630859375, 0.3900604248046875, 0.40973663330078125, 0.429412841796875, 0.44908905029296875, 0.4687652587890625, 0.48844146728515625, 0.50811767578125, 0.5277938842773438, 0.5474700927734375, 0.5671463012695312, 0.586822509765625, 0.6064987182617188, 0.6261749267578125, 0.6458511352539062, 0.66552734375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 9.0, 9.0, 8.0, 11.0, 7.0, 14.0, 14.0, 24.0, 45.0, 43.0, 103.0, 130.0, 141.0, 144.0, 87.0, 50.0, 37.0, 19.0, 24.0, 21.0, 9.0, 5.0, 10.0, 9.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00017118453979492188, -0.00016557052731513977, -0.00015995651483535767, -0.00015434250235557556, -0.00014872848987579346, -0.00014311447739601135, -0.00013750046491622925, -0.00013188645243644714, -0.00012627243995666504, -0.00012065842747688293, -0.00011504441499710083, -0.00010943040251731873, -0.00010381639003753662, -9.820237755775452e-05, -9.258836507797241e-05, -8.697435259819031e-05, -8.13603401184082e-05, -7.57463276386261e-05, -7.0132315158844e-05, -6.451830267906189e-05, -5.8904290199279785e-05, -5.329027771949768e-05, -4.7676265239715576e-05, -4.206225275993347e-05, -3.644824028015137e-05, -3.083422780036926e-05, -2.5220215320587158e-05, -1.9606202840805054e-05, -1.399219036102295e-05, -8.378177881240845e-06, -2.7641654014587402e-06, 2.8498470783233643e-06, 8.463859558105469e-06, 1.4077872037887573e-05, 1.9691884517669678e-05, 2.5305896997451782e-05, 3.091990947723389e-05, 3.653392195701599e-05, 4.2147934436798096e-05, 4.77619469165802e-05, 5.3375959396362305e-05, 5.898997187614441e-05, 6.460398435592651e-05, 7.021799683570862e-05, 7.583200931549072e-05, 8.144602179527283e-05, 8.706003427505493e-05, 9.267404675483704e-05, 9.828805923461914e-05, 0.00010390207171440125, 0.00010951608419418335, 0.00011513009667396545, 0.00012074410915374756, 0.00012635812163352966, 0.00013197213411331177, 0.00013758614659309387, 0.00014320015907287598, 0.00014881417155265808, 0.00015442818403244019, 0.0001600421965122223, 0.0001656562089920044, 0.0001712702214717865, 0.0001768842339515686, 0.0001824982464313507, 0.0001881122589111328]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 8.0, 8.0, 20.0, 23.0, 37.0, 51.0, 77.0, 111.0, 208.0, 342.0, 613.0, 1231.0, 2872.0, 7350.0, 21821.0, 92823.0, 797953.0, 89120.0, 20988.0, 7227.0, 2885.0, 1279.0, 608.0, 330.0, 200.0, 115.0, 89.0, 55.0, 28.0, 18.0, 17.0, 14.0, 10.0, 2.0, 8.0, 5.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.414306640625, -0.4002571105957031, -0.38620758056640625, -0.3721580505371094, -0.3581085205078125, -0.3440589904785156, -0.33000946044921875, -0.3159599304199219, -0.301910400390625, -0.2878608703613281, -0.27381134033203125, -0.2597618103027344, -0.2457122802734375, -0.23166275024414062, -0.21761322021484375, -0.20356369018554688, -0.18951416015625, -0.17546463012695312, -0.16141510009765625, -0.14736557006835938, -0.1333160400390625, -0.11926651000976562, -0.10521697998046875, -0.09116744995117188, -0.077117919921875, -0.06306838989257812, -0.04901885986328125, -0.034969329833984375, -0.0209197998046875, -0.006870269775390625, 0.00717926025390625, 0.021228790283203125, 0.0352783203125, 0.049327850341796875, 0.06337738037109375, 0.07742691040039062, 0.0914764404296875, 0.10552597045898438, 0.11957550048828125, 0.13362503051757812, 0.147674560546875, 0.16172409057617188, 0.17577362060546875, 0.18982315063476562, 0.2038726806640625, 0.21792221069335938, 0.23197174072265625, 0.24602127075195312, 0.26007080078125, 0.2741203308105469, 0.28816986083984375, 0.3022193908691406, 0.3162689208984375, 0.3303184509277344, 0.34436798095703125, 0.3584175109863281, 0.372467041015625, 0.3865165710449219, 0.40056610107421875, 0.4146156311035156, 0.4286651611328125, 0.4427146911621094, 0.45676422119140625, 0.4708137512207031, 0.48486328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 5.0, 12.0, 9.0, 7.0, 17.0, 14.0, 20.0, 24.0, 47.0, 50.0, 85.0, 88.0, 108.0, 106.0, 97.0, 70.0, 56.0, 26.0, 35.0, 24.0, 19.0, 12.0, 17.0, 15.0, 8.0, 9.0, 9.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56982421875, -0.5520782470703125, -0.534332275390625, -0.5165863037109375, -0.49884033203125, -0.4810943603515625, -0.463348388671875, -0.4456024169921875, -0.4278564453125, -0.4101104736328125, -0.392364501953125, -0.3746185302734375, -0.35687255859375, -0.3391265869140625, -0.321380615234375, -0.3036346435546875, -0.285888671875, -0.2681427001953125, -0.250396728515625, -0.2326507568359375, -0.21490478515625, -0.1971588134765625, -0.179412841796875, -0.1616668701171875, -0.1439208984375, -0.1261749267578125, -0.108428955078125, -0.0906829833984375, -0.07293701171875, -0.0551910400390625, -0.037445068359375, -0.0196990966796875, -0.001953125, 0.0157928466796875, 0.033538818359375, 0.0512847900390625, 0.06903076171875, 0.0867767333984375, 0.104522705078125, 0.1222686767578125, 0.1400146484375, 0.1577606201171875, 0.175506591796875, 0.1932525634765625, 0.21099853515625, 0.2287445068359375, 0.246490478515625, 0.2642364501953125, 0.281982421875, 0.2997283935546875, 0.317474365234375, 0.3352203369140625, 0.35296630859375, 0.3707122802734375, 0.388458251953125, 0.4062042236328125, 0.4239501953125, 0.4416961669921875, 0.459442138671875, 0.4771881103515625, 0.49493408203125, 0.5126800537109375, 0.530426025390625, 0.5481719970703125, 0.56591796875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 29.0, 89.0, 517.0, 273.0, 68.0, 13.0, 9.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.38037872314453, -33.6751708984375, -31.969966888427734, -30.264760971069336, -28.559555053710938, -26.85434913635254, -25.14914321899414, -23.443937301635742, -21.738731384277344, -20.033525466918945, -18.328319549560547, -16.62311363220215, -14.91790771484375, -13.212701797485352, -11.507495880126953, -9.802289962768555, -8.097084045410156, -6.391878128051758, -4.686672210693359, -2.981466293334961, -1.2762603759765625, 0.42894554138183594, 2.1341514587402344, 3.839357376098633, 5.544563293457031, 7.24976921081543, 8.954975128173828, 10.660181045532227, 12.365386962890625, 14.070592880249023, 15.775798797607422, 17.48100471496582, 19.18621063232422, 20.891416549682617, 22.596622467041016, 24.301828384399414, 26.007034301757812, 27.71224021911621, 29.41744613647461, 31.122652053833008, 32.827857971191406, 34.53306579589844, 36.2382698059082, 37.94347381591797, 39.648681640625, 41.35388946533203, 43.0590934753418, 44.76429748535156, 46.469505310058594, 48.174713134765625, 49.87991714477539, 51.585121154785156, 53.29032897949219, 54.99553680419922, 56.700740814208984, 58.40594482421875, 60.11115264892578, 61.81636047363281, 63.52156448364258, 65.22676849365234, 66.93197631835938, 68.6371841430664, 70.34239196777344, 72.04759216308594, 73.75279998779297]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 9.0, 2.0, 5.0, 8.0, 4.0, 12.0, 11.0, 14.0, 19.0, 10.0, 21.0, 19.0, 20.0, 27.0, 101.0, 123.0, 53.0, 55.0, 63.0, 153.0, 91.0, 21.0, 22.0, 22.0, 14.0, 11.0, 10.0, 19.0, 12.0, 12.0, 10.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.678874969482422, -16.091264724731445, -15.503654479980469, -14.916044235229492, -14.328433990478516, -13.740823745727539, -13.153213500976562, -12.565603256225586, -11.97799301147461, -11.390382766723633, -10.802772521972656, -10.21516227722168, -9.627552032470703, -9.039941787719727, -8.45233154296875, -7.864721775054932, -7.277112007141113, -6.689501762390137, -6.10189151763916, -5.514281272888184, -4.926671028137207, -4.3390607833862305, -3.751451015472412, -3.1638407707214355, -2.576230525970459, -1.9886202812194824, -1.4010101556777954, -0.8134000301361084, -0.22578978538513184, 0.3618204593658447, 0.9494304656982422, 1.5370407104492188, 2.1246509552001953, 2.712261199951172, 3.2998714447021484, 3.887481451034546, 4.475091934204102, 5.062702178955078, 5.6503119468688965, 6.237922191619873, 6.82553243637085, 7.413142681121826, 8.000752449035645, 8.588362693786621, 9.175972938537598, 9.763583183288574, 10.35119342803955, 10.938803672790527, 11.526413917541504, 12.11402416229248, 12.701634407043457, 13.289244651794434, 13.87685489654541, 14.464465141296387, 15.052074432373047, 15.639684677124023, 16.227294921875, 16.814905166625977, 17.402515411376953, 17.99012565612793, 18.577735900878906, 19.165346145629883, 19.75295639038086, 20.340566635131836, 20.928176879882812]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 10.0, 8.0, 14.0, 22.0, 8.0, 21.0, 29.0, 26.0, 37.0, 42.0, 44.0, 91.0, 254.0, 92.0, 42.0, 35.0, 28.0, 26.0, 27.0, 19.0, 12.0, 8.0, 16.0, 15.0, 10.0, 9.0, 8.0, 5.0, 6.0, 2.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.5419921875, -1.48944091796875, -1.4368896484375, -1.38433837890625, -1.331787109375, -1.27923583984375, -1.2266845703125, -1.17413330078125, -1.12158203125, -1.06903076171875, -1.0164794921875, -0.96392822265625, -0.911376953125, -0.85882568359375, -0.8062744140625, -0.75372314453125, -0.701171875, -0.64862060546875, -0.5960693359375, -0.54351806640625, -0.490966796875, -0.43841552734375, -0.3858642578125, -0.33331298828125, -0.28076171875, -0.22821044921875, -0.1756591796875, -0.12310791015625, -0.070556640625, -0.01800537109375, 0.0345458984375, 0.08709716796875, 0.1396484375, 0.19219970703125, 0.2447509765625, 0.29730224609375, 0.349853515625, 0.40240478515625, 0.4549560546875, 0.50750732421875, 0.56005859375, 0.61260986328125, 0.6651611328125, 0.71771240234375, 0.770263671875, 0.82281494140625, 0.8753662109375, 0.92791748046875, 0.98046875, 1.03302001953125, 1.0855712890625, 1.13812255859375, 1.190673828125, 1.24322509765625, 1.2957763671875, 1.34832763671875, 1.40087890625, 1.45343017578125, 1.5059814453125, 1.55853271484375, 1.611083984375, 1.66363525390625, 1.7161865234375, 1.76873779296875, 1.8212890625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 15.0, 6.0, 3.0, 14.0, 15.0, 49.0, 73.0, 121.0, 240.0, 799.0, 3983.0, 7760645.0, 617933.0, 3522.0, 697.0, 239.0, 108.0, 62.0, 19.0, 16.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.386871337890625, -29.542442321777344, -28.698013305664062, -27.85358428955078, -27.0091552734375, -26.16472625732422, -25.320297241210938, -24.475868225097656, -23.631439208984375, -22.787010192871094, -21.942581176757812, -21.09815216064453, -20.25372314453125, -19.40929412841797, -18.564865112304688, -17.720436096191406, -16.876007080078125, -16.031578063964844, -15.187149047851562, -14.342720031738281, -13.498291015625, -12.653861999511719, -11.809432983398438, -10.965003967285156, -10.120574951171875, -9.276145935058594, -8.431716918945312, -7.587287902832031, -6.74285888671875, -5.898429870605469, -5.0540008544921875, -4.209571838378906, -3.365142822265625, -2.5207138061523438, -1.6762847900390625, -0.8318557739257812, 0.0125732421875, 0.8570022583007812, 1.7014312744140625, 2.5458602905273438, 3.390289306640625, 4.234718322753906, 5.0791473388671875, 5.923576354980469, 6.76800537109375, 7.612434387207031, 8.456863403320312, 9.301292419433594, 10.145721435546875, 10.990150451660156, 11.834579467773438, 12.679008483886719, 13.5234375, 14.367866516113281, 15.212295532226562, 16.056724548339844, 16.901153564453125, 17.745582580566406, 18.590011596679688, 19.43444061279297, 20.27886962890625, 21.12329864501953, 21.967727661132812, 22.812156677246094, 23.656585693359375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 1.0, 4.0, 3.0, 3.0, 7.0, 8.0, 6.0, 9.0, 8.0, 0.0, 5.0, 3.0, 3.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.01439094543457, -28.215744018554688, -27.417095184326172, -26.61844825744629, -25.819801330566406, -25.02115249633789, -24.222505569458008, -23.423858642578125, -22.62520980834961, -21.826562881469727, -21.02791404724121, -20.229267120361328, -19.430620193481445, -18.63197135925293, -17.833324432373047, -17.03467559814453, -16.23603057861328, -15.437382698059082, -14.6387357711792, -13.840087890625, -13.0414400100708, -12.242792129516602, -11.444145202636719, -10.64549732208252, -9.84684944152832, -9.048201560974121, -8.249554634094238, -7.450906753540039, -6.65225887298584, -5.853611469268799, -5.054964065551758, -4.256316184997559, -3.4576683044433594, -2.6590206623077393, -1.8603731393814087, -1.0617256164550781, -0.263077974319458, 0.5355696678161621, 1.3342170715332031, 2.1328649520874023, 2.9315123558044434, 3.7301599979400635, 4.528807640075684, 5.327455043792725, 6.126102447509766, 6.924750328063965, 7.723397731781006, 8.522045135498047, 9.320693016052246, 10.119340896606445, 10.917987823486328, 11.716635704040527, 12.515283584594727, 13.31393051147461, 14.112578392028809, 14.911226272583008, 15.70987319946289, 16.508520126342773, 17.30716896057129, 18.105815887451172, 18.904462814331055, 19.70311164855957, 20.501758575439453, 21.30040740966797, 22.09905433654785]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 4.0, 7.0, 6.0, 8.0, 20.0, 16.0, 21.0, 44.0, 66.0, 99.0, 154.0, 232.0, 375.0, 684.0, 1322.0, 2851.0, 6344.0, 14290.0, 34784.0, 85534.0, 167712.0, 121103.0, 50709.0, 20856.0, 8786.0, 4090.0, 1827.0, 968.0, 513.0, 323.0, 191.0, 112.0, 62.0, 42.0, 28.0, 15.0, 24.0, 20.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.59375, -12.2308349609375, -11.867919921875, -11.5050048828125, -11.14208984375, -10.7791748046875, -10.416259765625, -10.0533447265625, -9.6904296875, -9.3275146484375, -8.964599609375, -8.6016845703125, -8.23876953125, -7.8758544921875, -7.512939453125, -7.1500244140625, -6.787109375, -6.4241943359375, -6.061279296875, -5.6983642578125, -5.33544921875, -4.9725341796875, -4.609619140625, -4.2467041015625, -3.8837890625, -3.5208740234375, -3.157958984375, -2.7950439453125, -2.43212890625, -2.0692138671875, -1.706298828125, -1.3433837890625, -0.98046875, -0.6175537109375, -0.254638671875, 0.1082763671875, 0.47119140625, 0.8341064453125, 1.197021484375, 1.5599365234375, 1.9228515625, 2.2857666015625, 2.648681640625, 3.0115966796875, 3.37451171875, 3.7374267578125, 4.100341796875, 4.4632568359375, 4.826171875, 5.1890869140625, 5.552001953125, 5.9149169921875, 6.27783203125, 6.6407470703125, 7.003662109375, 7.3665771484375, 7.7294921875, 8.0924072265625, 8.455322265625, 8.8182373046875, 9.18115234375, 9.5440673828125, 9.906982421875, 10.2698974609375, 10.6328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 8.0, 6.0, 8.0, 5.0, 13.0, 5.0, 14.0, 18.0, 18.0, 14.0, 32.0, 23.0, 31.0, 34.0, 31.0, 45.0, 49.0, 62.0, 55.0, 67.0, 53.0, 62.0, 40.0, 51.0, 40.0, 37.0, 30.0, 31.0, 26.0, 13.0, 11.0, 17.0, 7.0, 9.0, 7.0, 7.0, 4.0, 10.0, 8.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4736328125, -1.4193267822265625, -1.365020751953125, -1.3107147216796875, -1.25640869140625, -1.2021026611328125, -1.147796630859375, -1.0934906005859375, -1.0391845703125, -0.9848785400390625, -0.930572509765625, -0.8762664794921875, -0.82196044921875, -0.7676544189453125, -0.713348388671875, -0.6590423583984375, -0.604736328125, -0.5504302978515625, -0.496124267578125, -0.4418182373046875, -0.38751220703125, -0.3332061767578125, -0.278900146484375, -0.2245941162109375, -0.1702880859375, -0.1159820556640625, -0.061676025390625, -0.0073699951171875, 0.04693603515625, 0.1012420654296875, 0.155548095703125, 0.2098541259765625, 0.26416015625, 0.3184661865234375, 0.372772216796875, 0.4270782470703125, 0.48138427734375, 0.5356903076171875, 0.589996337890625, 0.6443023681640625, 0.6986083984375, 0.7529144287109375, 0.807220458984375, 0.8615264892578125, 0.91583251953125, 0.9701385498046875, 1.024444580078125, 1.0787506103515625, 1.133056640625, 1.1873626708984375, 1.241668701171875, 1.2959747314453125, 1.35028076171875, 1.4045867919921875, 1.458892822265625, 1.5131988525390625, 1.5675048828125, 1.6218109130859375, 1.676116943359375, 1.7304229736328125, 1.78472900390625, 1.8390350341796875, 1.893341064453125, 1.9476470947265625, 2.001953125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 13.0, 10.0, 22.0, 35.0, 55.0, 97.0, 71.0, 75.0, 34.0, 17.0, 11.0, 12.0, 4.0, 9.0, 2.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.008161544799805, -15.497745513916016, -14.98732852935791, -14.476912498474121, -13.966495513916016, -13.456079483032227, -12.945663452148438, -12.435246467590332, -11.924829483032227, -11.414413452148438, -10.903996467590332, -10.393580436706543, -9.883163452148438, -9.372747421264648, -8.86233139038086, -8.351914405822754, -7.841498374938965, -7.331081867218018, -6.82066535949707, -6.310249328613281, -5.799832344055176, -5.289416313171387, -4.7789998054504395, -4.268583297729492, -3.758166790008545, -3.2477502822875977, -2.7373337745666504, -2.2269175052642822, -1.716500997543335, -1.2060844898223877, -0.6956682205200195, -0.18525171279907227, 0.325164794921875, 0.8355812430381775, 1.34599769115448, 1.8564140796661377, 2.366830587387085, 2.8772470951080322, 3.3876633644104004, 3.8980798721313477, 4.408496379852295, 4.918912887573242, 5.4293293952941895, 5.939745903015137, 6.450161933898926, 6.960578918457031, 7.47099494934082, 7.981411457061768, 8.491827964782715, 9.002243995666504, 9.51266098022461, 10.023077011108398, 10.533493995666504, 11.043910026550293, 11.554327011108398, 12.064743041992188, 12.575159072875977, 13.085575103759766, 13.595992088317871, 14.10640811920166, 14.616825103759766, 15.127241134643555, 15.637657165527344, 16.148075103759766, 16.658491134643555]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 6.0, 5.0, 5.0, 10.0, 12.0, 20.0, 38.0, 46.0, 58.0, 62.0, 59.0, 37.0, 31.0, 18.0, 12.0, 8.0, 7.0, 6.0, 6.0, 4.0, 8.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.081541538238525, -6.814149379730225, -6.546757698059082, -6.279365539550781, -6.0119733810424805, -5.744581699371338, -5.477189540863037, -5.2097978591918945, -4.942405700683594, -4.675013542175293, -4.40762186050415, -4.14022970199585, -3.872837781906128, -3.6054458618164062, -3.3380537033081055, -3.070661783218384, -2.803269863128662, -2.5358779430389404, -2.2684860229492188, -2.001093864440918, -1.7337019443511963, -1.4663100242614746, -1.1989179849624634, -0.9315259456634521, -0.6641340255737305, -0.396742045879364, -0.12935006618499756, 0.1380419135093689, 0.40543389320373535, 0.672825813293457, 0.9402178525924683, 1.2076098918914795, 1.4750022888183594, 1.742394208908081, 2.0097861289978027, 2.2771782875061035, 2.544570207595825, 2.811962127685547, 3.0793542861938477, 3.3467462062835693, 3.614138126373291, 3.8815300464630127, 4.148921966552734, 4.416314125061035, 4.683706283569336, 4.9510979652404785, 5.218490123748779, 5.485881805419922, 5.753273963928223, 6.020666122436523, 6.288057804107666, 6.555449962615967, 6.822841644287109, 7.09023380279541, 7.357625961303711, 7.625018119812012, 7.892409801483154, 8.159801483154297, 8.427193641662598, 8.694585800170898, 8.9619779586792, 9.2293701171875, 9.496761322021484, 9.764153480529785, 10.031545639038086]}, "eval/loss": 1.8364678621292114, "eval/wer": 0.2812376041253471, "eval/runtime": 832.195, "eval/samples_per_second": 3.175, "eval/steps_per_second": 0.398} \ No newline at end of file